{"train/loss": 3.1966, "train/learning_rate": 6.936416184971099e-08, "train/epoch": 10.0, "train/global_step": 2230, "_runtime": 51677, "_timestamp": 1648466626, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 33.0, 227.0, 474.0, 239.0, 34.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.604528427124023, -28.090166091918945, -27.5758056640625, -27.061443328857422, -26.547080993652344, -26.032718658447266, -25.51835823059082, -25.003995895385742, -24.489635467529297, -23.97527313232422, -23.460912704467773, -22.946550369262695, -22.432188034057617, -21.917827606201172, -21.403465270996094, -20.889102935791016, -20.374740600585938, -19.86037826538086, -19.346017837524414, -18.831655502319336, -18.317293167114258, -17.802932739257812, -17.288570404052734, -16.774208068847656, -16.259845733642578, -15.745484352111816, -15.231122016906738, -14.716760635375977, -14.202398300170898, -13.688036918640137, -13.173675537109375, -12.659313201904297, -12.144952774047852, -11.63059139251709, -11.116229057312012, -10.60186767578125, -10.087505340576172, -9.57314395904541, -9.058782577514648, -8.54442024230957, -8.030058860778809, -7.515697002410889, -7.001335144042969, -6.486973762512207, -5.972611904144287, -5.458250045776367, -4.9438886642456055, -4.4295268058776855, -3.9151649475097656, -3.4008030891418457, -2.886441469192505, -2.372079849243164, -1.8577179908752441, -1.3433561325073242, -0.8289945125579834, -0.3146328926086426, 0.19972896575927734, 0.7140907049179077, 1.228452444076538, 1.7428141832351685, 2.257175922393799, 2.7715377807617188, 3.2858994007110596, 3.8002610206604004, 4.31462287902832]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 4.0, 8.0, 11.0, 8.0, 13.0, 21.0, 14.0, 16.0, 24.0, 34.0, 26.0, 30.0, 44.0, 41.0, 35.0, 39.0, 53.0, 39.0, 48.0, 48.0, 44.0, 47.0, 39.0, 35.0, 40.0, 35.0, 23.0, 26.0, 31.0, 17.0, 17.0, 15.0, 10.0, 17.0, 13.0, 11.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1261658668518066, -3.028174877166748, -2.9301838874816895, -2.83219313621521, -2.7342021465301514, -2.6362111568450928, -2.5382204055786133, -2.4402294158935547, -2.342238426208496, -2.2442474365234375, -2.146256446838379, -2.0482656955718994, -1.9502747058868408, -1.8522837162017822, -1.7542928457260132, -1.6563019752502441, -1.5583109855651855, -1.460319995880127, -1.362329125404358, -1.2643382549285889, -1.1663472652435303, -1.0683562755584717, -0.9703654050827026, -0.8723744750022888, -0.774383544921875, -0.6763926148414612, -0.5784016847610474, -0.48041075468063354, -0.3824198246002197, -0.2844288945198059, -0.1864379644393921, -0.08844703435897827, 0.009543895721435547, 0.10753482580184937, 0.20552575588226318, 0.303516685962677, 0.4015076160430908, 0.49949854612350464, 0.5974894762039185, 0.6954804062843323, 0.7934713363647461, 0.8914622664451599, 0.9894531965255737, 1.0874440670013428, 1.1854350566864014, 1.28342604637146, 1.381416916847229, 1.479407787322998, 1.5773987770080566, 1.6753897666931152, 1.7733806371688843, 1.8713715076446533, 1.969362497329712, 2.0673534870147705, 2.16534423828125, 2.2633352279663086, 2.361326217651367, 2.459317207336426, 2.5573081970214844, 2.655298948287964, 2.7532899379730225, 2.851280927658081, 2.9492716789245605, 3.047262668609619, 3.1452536582946777]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 10.0, 12.0, 12.0, 32.0, 44.0, 80.0, 118.0, 210.0, 327.0, 586.0, 1276.0, 2408.0, 4794.0, 10173.0, 21924.0, 49846.0, 117445.0, 270224.0, 570534.0, 958582.0, 1007810.0, 632998.0, 306153.0, 131826.0, 57542.0, 25910.0, 11827.0, 5585.0, 2770.0, 1463.0, 742.0, 401.0, 227.0, 137.0, 90.0, 56.0, 28.0, 25.0, 20.0, 3.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.155609130859375, -4.02996826171875, -3.904327392578125, -3.7786865234375, -3.653045654296875, -3.52740478515625, -3.401763916015625, -3.276123046875, -3.150482177734375, -3.02484130859375, -2.899200439453125, -2.7735595703125, -2.647918701171875, -2.52227783203125, -2.396636962890625, -2.27099609375, -2.145355224609375, -2.01971435546875, -1.894073486328125, -1.7684326171875, -1.642791748046875, -1.51715087890625, -1.391510009765625, -1.265869140625, -1.140228271484375, -1.01458740234375, -0.888946533203125, -0.7633056640625, -0.637664794921875, -0.51202392578125, -0.386383056640625, -0.2607421875, -0.135101318359375, -0.00946044921875, 0.116180419921875, 0.2418212890625, 0.367462158203125, 0.49310302734375, 0.618743896484375, 0.744384765625, 0.870025634765625, 0.99566650390625, 1.121307373046875, 1.2469482421875, 1.372589111328125, 1.49822998046875, 1.623870849609375, 1.74951171875, 1.875152587890625, 2.00079345703125, 2.126434326171875, 2.2520751953125, 2.377716064453125, 2.50335693359375, 2.628997802734375, 2.754638671875, 2.880279541015625, 3.00592041015625, 3.131561279296875, 3.2572021484375, 3.382843017578125, 3.50848388671875, 3.634124755859375, 3.759765625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 8.0, 12.0, 16.0, 19.0, 18.0, 23.0, 25.0, 26.0, 42.0, 29.0, 36.0, 32.0, 51.0, 45.0, 51.0, 48.0, 38.0, 46.0, 45.0, 45.0, 29.0, 35.0, 40.0, 27.0, 22.0, 25.0, 28.0, 21.0, 26.0, 18.0, 8.0, 7.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.27734375, -5.12713623046875, -4.9769287109375, -4.82672119140625, -4.676513671875, -4.52630615234375, -4.3760986328125, -4.22589111328125, -4.07568359375, -3.92547607421875, -3.7752685546875, -3.62506103515625, -3.474853515625, -3.32464599609375, -3.1744384765625, -3.02423095703125, -2.8740234375, -2.72381591796875, -2.5736083984375, -2.42340087890625, -2.273193359375, -2.12298583984375, -1.9727783203125, -1.82257080078125, -1.67236328125, -1.52215576171875, -1.3719482421875, -1.22174072265625, -1.071533203125, -0.92132568359375, -0.7711181640625, -0.62091064453125, -0.470703125, -0.32049560546875, -0.1702880859375, -0.02008056640625, 0.130126953125, 0.28033447265625, 0.4305419921875, 0.58074951171875, 0.73095703125, 0.88116455078125, 1.0313720703125, 1.18157958984375, 1.331787109375, 1.48199462890625, 1.6322021484375, 1.78240966796875, 1.9326171875, 2.08282470703125, 2.2330322265625, 2.38323974609375, 2.533447265625, 2.68365478515625, 2.8338623046875, 2.98406982421875, 3.13427734375, 3.28448486328125, 3.4346923828125, 3.58489990234375, 3.735107421875, 3.88531494140625, 4.0355224609375, 4.18572998046875, 4.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 7.0, 13.0, 30.0, 62.0, 130.0, 320.0, 1114.0, 4176674.0, 14854.0, 689.0, 205.0, 87.0, 51.0, 8.0, 8.0, 8.0, 10.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -95.3837890625, -91.205078125, -87.0263671875, -82.84765625, -78.6689453125, -74.490234375, -70.3115234375, -66.1328125, -61.9541015625, -57.775390625, -53.5966796875, -49.41796875, -45.2392578125, -41.060546875, -36.8818359375, -32.703125, -28.5244140625, -24.345703125, -20.1669921875, -15.98828125, -11.8095703125, -7.630859375, -3.4521484375, 0.7265625, 4.9052734375, 9.083984375, 13.2626953125, 17.44140625, 21.6201171875, 25.798828125, 29.9775390625, 34.15625, 38.3349609375, 42.513671875, 46.6923828125, 50.87109375, 55.0498046875, 59.228515625, 63.4072265625, 67.5859375, 71.7646484375, 75.943359375, 80.1220703125, 84.30078125, 88.4794921875, 92.658203125, 96.8369140625, 101.015625, 105.1943359375, 109.373046875, 113.5517578125, 117.73046875, 121.9091796875, 126.087890625, 130.2666015625, 134.4453125, 138.6240234375, 142.802734375, 146.9814453125, 151.16015625, 155.3388671875, 159.517578125, 163.6962890625, 167.875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 12.0, 24.0, 41.0, 52.0, 100.0, 194.0, 348.0, 645.0, 1004.0, 724.0, 432.0, 225.0, 117.0, 61.0, 36.0, 16.0, 17.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.916168212890625, -2.78741455078125, -2.658660888671875, -2.5299072265625, -2.401153564453125, -2.27239990234375, -2.143646240234375, -2.014892578125, -1.886138916015625, -1.75738525390625, -1.628631591796875, -1.4998779296875, -1.371124267578125, -1.24237060546875, -1.113616943359375, -0.98486328125, -0.856109619140625, -0.72735595703125, -0.598602294921875, -0.4698486328125, -0.341094970703125, -0.21234130859375, -0.083587646484375, 0.045166015625, 0.173919677734375, 0.30267333984375, 0.431427001953125, 0.5601806640625, 0.688934326171875, 0.81768798828125, 0.946441650390625, 1.0751953125, 1.203948974609375, 1.33270263671875, 1.461456298828125, 1.5902099609375, 1.718963623046875, 1.84771728515625, 1.976470947265625, 2.105224609375, 2.233978271484375, 2.36273193359375, 2.491485595703125, 2.6202392578125, 2.748992919921875, 2.87774658203125, 3.006500244140625, 3.13525390625, 3.264007568359375, 3.39276123046875, 3.521514892578125, 3.6502685546875, 3.779022216796875, 3.90777587890625, 4.036529541015625, 4.165283203125, 4.294036865234375, 4.42279052734375, 4.551544189453125, 4.6802978515625, 4.809051513671875, 4.93780517578125, 5.066558837890625, 5.1953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 25.0, 17.0, 29.0, 39.0, 32.0, 33.0, 59.0, 55.0, 59.0, 63.0, 53.0, 67.0, 59.0, 48.0, 57.0, 49.0, 42.0, 36.0, 29.0, 15.0, 20.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.272556781768799, -3.123746156692505, -2.974935531616211, -2.826124906539917, -2.677314281463623, -2.528503656387329, -2.379693031311035, -2.230882167816162, -2.0820717811584473, -1.9332611560821533, -1.7844505310058594, -1.6356399059295654, -1.4868292808532715, -1.3380186557769775, -1.189207911491394, -1.0403972864151, -0.8915865421295166, -0.7427759170532227, -0.5939652919769287, -0.44515460729599, -0.29634398221969604, -0.1475333571434021, 0.001277327537536621, 0.15008795261383057, 0.2988985776901245, 0.44770920276641846, 0.5965198278427124, 0.7453305125236511, 0.8941411375999451, 1.0429518222808838, 1.1917624473571777, 1.3405730724334717, 1.4893836975097656, 1.6381943225860596, 1.7870049476623535, 1.9358155727386475, 2.0846261978149414, 2.2334368228912354, 2.3822474479675293, 2.5310583114624023, 2.679868698120117, 2.828679323196411, 2.977489948272705, 3.126300573348999, 3.275111198425293, 3.423921823501587, 3.572732448577881, 3.721543312072754, 3.870353937149048, 4.019164562225342, 4.167975425720215, 4.31678581237793, 4.465596675872803, 4.614407062530518, 4.763217926025391, 4.9120283126831055, 5.0608391761779785, 5.209650039672852, 5.358460426330566, 5.5072712898254395, 5.656081676483154, 5.804892539978027, 5.953702926635742, 6.102513790130615, 6.25132417678833]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 9.0, 5.0, 14.0, 13.0, 19.0, 23.0, 26.0, 36.0, 36.0, 42.0, 36.0, 46.0, 46.0, 44.0, 41.0, 59.0, 40.0, 45.0, 37.0, 39.0, 42.0, 43.0, 39.0, 35.0, 24.0, 21.0, 23.0, 22.0, 12.0, 18.0, 13.0, 8.0, 6.0, 3.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.665203094482422, -4.525174140930176, -4.385145664215088, -4.245116710662842, -4.105088233947754, -3.965059280395508, -3.825030565261841, -3.685001850128174, -3.544973134994507, -3.40494441986084, -3.264915704727173, -3.124886989593506, -2.9848580360412598, -2.844829559326172, -2.704800605773926, -2.564771890640259, -2.424743175506592, -2.284714460372925, -2.144685745239258, -2.004657030105591, -1.8646281957626343, -1.7245994806289673, -1.5845706462860107, -1.4445419311523438, -1.3045132160186768, -1.1644845008850098, -1.0244557857513428, -0.8844269514083862, -0.7443982362747192, -0.6043695211410522, -0.4643407464027405, -0.3243119716644287, -0.18428325653076172, -0.04425451159477234, 0.09577423334121704, 0.23580297827720642, 0.3758317232131958, 0.5158604383468628, 0.6558892130851746, 0.7959179878234863, 0.9359467029571533, 1.0759754180908203, 1.2160041332244873, 1.3560329675674438, 1.4960616827011108, 1.6360903978347778, 1.7761192321777344, 1.9161479473114014, 2.0561766624450684, 2.1962053775787354, 2.3362340927124023, 2.4762628078460693, 2.6162915229797363, 2.7563204765319824, 2.8963491916656494, 3.0363779067993164, 3.1764066219329834, 3.3164353370666504, 3.4564640522003174, 3.5964927673339844, 3.7365217208862305, 3.8765501976013184, 4.0165791511535645, 4.156607627868652, 4.296636581420898]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 7.0, 10.0, 7.0, 8.0, 17.0, 25.0, 27.0, 46.0, 62.0, 81.0, 131.0, 145.0, 247.0, 430.0, 634.0, 1360.0, 3100.0, 9875.0, 41461.0, 175962.0, 424715.0, 286755.0, 77005.0, 17523.0, 4816.0, 1783.0, 836.0, 498.0, 317.0, 228.0, 138.0, 93.0, 56.0, 32.0, 33.0, 24.0, 22.0, 14.0, 14.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1181640625, -1.084991455078125, -1.05181884765625, -1.018646240234375, -0.9854736328125, -0.952301025390625, -0.91912841796875, -0.885955810546875, -0.852783203125, -0.819610595703125, -0.78643798828125, -0.753265380859375, -0.7200927734375, -0.686920166015625, -0.65374755859375, -0.620574951171875, -0.58740234375, -0.554229736328125, -0.52105712890625, -0.487884521484375, -0.4547119140625, -0.421539306640625, -0.38836669921875, -0.355194091796875, -0.322021484375, -0.288848876953125, -0.25567626953125, -0.222503662109375, -0.1893310546875, -0.156158447265625, -0.12298583984375, -0.089813232421875, -0.056640625, -0.023468017578125, 0.00970458984375, 0.042877197265625, 0.0760498046875, 0.109222412109375, 0.14239501953125, 0.175567626953125, 0.208740234375, 0.241912841796875, 0.27508544921875, 0.308258056640625, 0.3414306640625, 0.374603271484375, 0.40777587890625, 0.440948486328125, 0.47412109375, 0.507293701171875, 0.54046630859375, 0.573638916015625, 0.6068115234375, 0.639984130859375, 0.67315673828125, 0.706329345703125, 0.739501953125, 0.772674560546875, 0.80584716796875, 0.839019775390625, 0.8721923828125, 0.905364990234375, 0.93853759765625, 0.971710205078125, 1.0048828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 9.0, 11.0, 21.0, 20.0, 21.0, 38.0, 35.0, 38.0, 28.0, 44.0, 49.0, 61.0, 43.0, 53.0, 47.0, 53.0, 45.0, 40.0, 33.0, 48.0, 33.0, 30.0, 39.0, 24.0, 19.0, 19.0, 12.0, 15.0, 9.0, 9.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.533233642578125, -3.41217041015625, -3.291107177734375, -3.1700439453125, -3.048980712890625, -2.92791748046875, -2.806854248046875, -2.685791015625, -2.564727783203125, -2.44366455078125, -2.322601318359375, -2.2015380859375, -2.080474853515625, -1.95941162109375, -1.838348388671875, -1.71728515625, -1.596221923828125, -1.47515869140625, -1.354095458984375, -1.2330322265625, -1.111968994140625, -0.99090576171875, -0.869842529296875, -0.748779296875, -0.627716064453125, -0.50665283203125, -0.385589599609375, -0.2645263671875, -0.143463134765625, -0.02239990234375, 0.098663330078125, 0.2197265625, 0.340789794921875, 0.46185302734375, 0.582916259765625, 0.7039794921875, 0.825042724609375, 0.94610595703125, 1.067169189453125, 1.188232421875, 1.309295654296875, 1.43035888671875, 1.551422119140625, 1.6724853515625, 1.793548583984375, 1.91461181640625, 2.035675048828125, 2.15673828125, 2.277801513671875, 2.39886474609375, 2.519927978515625, 2.6409912109375, 2.762054443359375, 2.88311767578125, 3.004180908203125, 3.125244140625, 3.246307373046875, 3.36737060546875, 3.488433837890625, 3.6094970703125, 3.730560302734375, 3.85162353515625, 3.972686767578125, 4.09375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 16.0, 11.0, 25.0, 38.0, 65.0, 111.0, 171.0, 347.0, 583.0, 1132.0, 2019.0, 3709.0, 6841.0, 12575.0, 22487.0, 38292.0, 62771.0, 96458.0, 133815.0, 161359.0, 156514.0, 125992.0, 88283.0, 56578.0, 34106.0, 19589.0, 11019.0, 6239.0, 3336.0, 1792.0, 981.0, 544.0, 308.0, 187.0, 91.0, 65.0, 27.0, 25.0, 13.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.302490234375, -0.2930030822753906, -0.28351593017578125, -0.2740287780761719, -0.2645416259765625, -0.2550544738769531, -0.24556732177734375, -0.23608016967773438, -0.226593017578125, -0.21710586547851562, -0.20761871337890625, -0.19813156127929688, -0.1886444091796875, -0.17915725708007812, -0.16967010498046875, -0.16018295288085938, -0.15069580078125, -0.14120864868164062, -0.13172149658203125, -0.12223434448242188, -0.1127471923828125, -0.10326004028320312, -0.09377288818359375, -0.08428573608398438, -0.074798583984375, -0.06531143188476562, -0.05582427978515625, -0.046337127685546875, -0.0368499755859375, -0.027362823486328125, -0.01787567138671875, -0.008388519287109375, 0.0010986328125, 0.010585784912109375, 0.02007293701171875, 0.029560089111328125, 0.0390472412109375, 0.048534393310546875, 0.05802154541015625, 0.06750869750976562, 0.076995849609375, 0.08648300170898438, 0.09597015380859375, 0.10545730590820312, 0.1149444580078125, 0.12443161010742188, 0.13391876220703125, 0.14340591430664062, 0.15289306640625, 0.16238021850585938, 0.17186737060546875, 0.18135452270507812, 0.1908416748046875, 0.20032882690429688, 0.20981597900390625, 0.21930313110351562, 0.228790283203125, 0.23827743530273438, 0.24776458740234375, 0.2572517395019531, 0.2667388916015625, 0.2762260437011719, 0.28571319580078125, 0.2952003479003906, 0.3046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 6.0, 11.0, 14.0, 6.0, 13.0, 14.0, 13.0, 16.0, 37.0, 30.0, 30.0, 25.0, 29.0, 32.0, 43.0, 44.0, 34.0, 45.0, 37.0, 48.0, 43.0, 37.0, 34.0, 40.0, 23.0, 41.0, 31.0, 27.0, 27.0, 25.0, 26.0, 20.0, 11.0, 12.0, 17.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.26171875, -6.0599365234375, -5.858154296875, -5.6563720703125, -5.45458984375, -5.2528076171875, -5.051025390625, -4.8492431640625, -4.6474609375, -4.4456787109375, -4.243896484375, -4.0421142578125, -3.84033203125, -3.6385498046875, -3.436767578125, -3.2349853515625, -3.033203125, -2.8314208984375, -2.629638671875, -2.4278564453125, -2.22607421875, -2.0242919921875, -1.822509765625, -1.6207275390625, -1.4189453125, -1.2171630859375, -1.015380859375, -0.8135986328125, -0.61181640625, -0.4100341796875, -0.208251953125, -0.0064697265625, 0.1953125, 0.3970947265625, 0.598876953125, 0.8006591796875, 1.00244140625, 1.2042236328125, 1.406005859375, 1.6077880859375, 1.8095703125, 2.0113525390625, 2.213134765625, 2.4149169921875, 2.61669921875, 2.8184814453125, 3.020263671875, 3.2220458984375, 3.423828125, 3.6256103515625, 3.827392578125, 4.0291748046875, 4.23095703125, 4.4327392578125, 4.634521484375, 4.8363037109375, 5.0380859375, 5.2398681640625, 5.441650390625, 5.6434326171875, 5.84521484375, 6.0469970703125, 6.248779296875, 6.4505615234375, 6.65234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 10.0, 17.0, 15.0, 55.0, 68.0, 83.0, 185.0, 355.0, 639.0, 1300.0, 2798.0, 7264.0, 20976.0, 70512.0, 231863.0, 403376.0, 213656.0, 64017.0, 19429.0, 6752.0, 2736.0, 1125.0, 592.0, 315.0, 179.0, 87.0, 53.0, 41.0, 16.0, 14.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062255859375, -0.05990314483642578, -0.05755043029785156, -0.055197715759277344, -0.052845001220703125, -0.050492286682128906, -0.04813957214355469, -0.04578685760498047, -0.04343414306640625, -0.04108142852783203, -0.03872871398925781, -0.036375999450683594, -0.034023284912109375, -0.031670570373535156, -0.029317855834960938, -0.02696514129638672, -0.0246124267578125, -0.02225971221923828, -0.019906997680664062, -0.017554283142089844, -0.015201568603515625, -0.012848854064941406, -0.010496139526367188, -0.008143424987792969, -0.00579071044921875, -0.0034379959106445312, -0.0010852813720703125, 0.0012674331665039062, 0.003620147705078125, 0.005972862243652344, 0.008325576782226562, 0.010678291320800781, 0.013031005859375, 0.015383720397949219, 0.017736434936523438, 0.020089149475097656, 0.022441864013671875, 0.024794578552246094, 0.027147293090820312, 0.02950000762939453, 0.03185272216796875, 0.03420543670654297, 0.03655815124511719, 0.038910865783691406, 0.041263580322265625, 0.043616294860839844, 0.04596900939941406, 0.04832172393798828, 0.0506744384765625, 0.05302715301513672, 0.05537986755371094, 0.057732582092285156, 0.060085296630859375, 0.062438011169433594, 0.06479072570800781, 0.06714344024658203, 0.06949615478515625, 0.07184886932373047, 0.07420158386230469, 0.0765542984008789, 0.07890701293945312, 0.08125972747802734, 0.08361244201660156, 0.08596515655517578, 0.08831787109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 4.0, 9.0, 10.0, 27.0, 27.0, 36.0, 38.0, 50.0, 80.0, 96.0, 97.0, 112.0, 105.0, 81.0, 58.0, 43.0, 45.0, 33.0, 14.0, 10.0, 7.0, 8.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.179115295410156e-05, -8.864142000675201e-05, -8.549168705940247e-05, -8.234195411205292e-05, -7.919222116470337e-05, -7.604248821735382e-05, -7.289275527000427e-05, -6.974302232265472e-05, -6.659328937530518e-05, -6.344355642795563e-05, -6.029382348060608e-05, -5.714409053325653e-05, -5.399435758590698e-05, -5.0844624638557434e-05, -4.7694891691207886e-05, -4.454515874385834e-05, -4.139542579650879e-05, -3.824569284915924e-05, -3.509595990180969e-05, -3.1946226954460144e-05, -2.8796494007110596e-05, -2.5646761059761047e-05, -2.24970281124115e-05, -1.934729516506195e-05, -1.6197562217712402e-05, -1.3047829270362854e-05, -9.898096323013306e-06, -6.748363375663757e-06, -3.598630428314209e-06, -4.4889748096466064e-07, 2.7008354663848877e-06, 5.850568413734436e-06, 9.000301361083984e-06, 1.2150034308433533e-05, 1.529976725578308e-05, 1.844950020313263e-05, 2.1599233150482178e-05, 2.4748966097831726e-05, 2.7898699045181274e-05, 3.104843199253082e-05, 3.419816493988037e-05, 3.734789788722992e-05, 4.049763083457947e-05, 4.3647363781929016e-05, 4.6797096729278564e-05, 4.994682967662811e-05, 5.309656262397766e-05, 5.624629557132721e-05, 5.939602851867676e-05, 6.25457614660263e-05, 6.569549441337585e-05, 6.88452273607254e-05, 7.199496030807495e-05, 7.51446932554245e-05, 7.829442620277405e-05, 8.14441591501236e-05, 8.459389209747314e-05, 8.774362504482269e-05, 9.089335799217224e-05, 9.404309093952179e-05, 9.719282388687134e-05, 0.00010034255683422089, 0.00010349228978157043, 0.00010664202272891998, 0.00010979175567626953]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 3.0, 9.0, 11.0, 15.0, 17.0, 18.0, 24.0, 31.0, 44.0, 54.0, 87.0, 148.0, 296.0, 716.0, 2061.0, 8963.0, 69927.0, 619955.0, 311137.0, 28057.0, 4600.0, 1302.0, 443.0, 214.0, 111.0, 73.0, 59.0, 30.0, 32.0, 21.0, 17.0, 6.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.134521484375, -0.13015365600585938, -0.12578582763671875, -0.12141799926757812, -0.1170501708984375, -0.11268234252929688, -0.10831451416015625, -0.10394668579101562, -0.099578857421875, -0.09521102905273438, -0.09084320068359375, -0.08647537231445312, -0.0821075439453125, -0.07773971557617188, -0.07337188720703125, -0.06900405883789062, -0.06463623046875, -0.060268402099609375, -0.05590057373046875, -0.051532745361328125, -0.0471649169921875, -0.042797088623046875, -0.03842926025390625, -0.034061431884765625, -0.029693603515625, -0.025325775146484375, -0.02095794677734375, -0.016590118408203125, -0.0122222900390625, -0.007854461669921875, -0.00348663330078125, 0.000881195068359375, 0.0052490234375, 0.009616851806640625, 0.01398468017578125, 0.018352508544921875, 0.0227203369140625, 0.027088165283203125, 0.03145599365234375, 0.035823822021484375, 0.040191650390625, 0.044559478759765625, 0.04892730712890625, 0.053295135498046875, 0.0576629638671875, 0.062030792236328125, 0.06639862060546875, 0.07076644897460938, 0.07513427734375, 0.07950210571289062, 0.08386993408203125, 0.08823776245117188, 0.0926055908203125, 0.09697341918945312, 0.10134124755859375, 0.10570907592773438, 0.110076904296875, 0.11444473266601562, 0.11881256103515625, 0.12318038940429688, 0.1275482177734375, 0.13191604614257812, 0.13628387451171875, 0.14065170288085938, 0.14501953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 5.0, 11.0, 11.0, 17.0, 23.0, 24.0, 34.0, 46.0, 47.0, 75.0, 73.0, 55.0, 83.0, 61.0, 71.0, 68.0, 50.0, 48.0, 44.0, 30.0, 23.0, 14.0, 16.0, 11.0, 13.0, 6.0, 2.0, 3.0, 7.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177459716796875, -0.017147541046142578, -0.016549110412597656, -0.015950679779052734, -0.015352249145507812, -0.01475381851196289, -0.014155387878417969, -0.013556957244873047, -0.012958526611328125, -0.012360095977783203, -0.011761665344238281, -0.01116323471069336, -0.010564804077148438, -0.009966373443603516, -0.009367942810058594, -0.008769512176513672, -0.00817108154296875, -0.007572650909423828, -0.006974220275878906, -0.006375789642333984, -0.0057773590087890625, -0.005178928375244141, -0.004580497741699219, -0.003982067108154297, -0.003383636474609375, -0.002785205841064453, -0.0021867752075195312, -0.0015883445739746094, -0.0009899139404296875, -0.0003914833068847656, 0.00020694732666015625, 0.0008053779602050781, 0.00140380859375, 0.002002239227294922, 0.0026006698608398438, 0.0031991004943847656, 0.0037975311279296875, 0.004395961761474609, 0.004994392395019531, 0.005592823028564453, 0.006191253662109375, 0.006789684295654297, 0.007388114929199219, 0.00798654556274414, 0.008584976196289062, 0.009183406829833984, 0.009781837463378906, 0.010380268096923828, 0.01097869873046875, 0.011577129364013672, 0.012175559997558594, 0.012773990631103516, 0.013372421264648438, 0.01397085189819336, 0.014569282531738281, 0.015167713165283203, 0.015766143798828125, 0.016364574432373047, 0.01696300506591797, 0.01756143569946289, 0.018159866333007812, 0.018758296966552734, 0.019356727600097656, 0.019955158233642578, 0.0205535888671875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 31.0, 57.0, 97.0, 160.0, 208.0, 189.0, 147.0, 55.0, 27.0, 12.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.97476863861084, -10.578423500061035, -10.182079315185547, -9.785734176635742, -9.389389038085938, -8.99304485321045, -8.596699714660645, -8.200355529785156, -7.804010391235352, -7.407665729522705, -7.011321067810059, -6.614975929260254, -6.218631267547607, -5.822286605834961, -5.425941467285156, -5.02959680557251, -4.633252143859863, -4.236907482147217, -3.840562582015991, -3.4442176818847656, -3.047873020172119, -2.6515283584594727, -2.255183458328247, -1.8588385581970215, -1.462493896484375, -1.066149115562439, -0.6698043346405029, -0.2734595537185669, 0.12288522720336914, 0.5192300081253052, 0.9155747890472412, 1.3119196891784668, 1.7082643508911133, 2.1046090126037598, 2.5009539127349854, 2.897298812866211, 3.2936434745788574, 3.689988136291504, 4.086333274841309, 4.482677936553955, 4.879022598266602, 5.275367259979248, 5.6717119216918945, 6.068057060241699, 6.464401721954346, 6.860746383666992, 7.257091522216797, 7.653436183929443, 8.04978084564209, 8.446125984191895, 8.842470169067383, 9.238815307617188, 9.635160446166992, 10.03150463104248, 10.427849769592285, 10.824193954467773, 11.220539093017578, 11.616884231567383, 12.013228416442871, 12.409573554992676, 12.805917739868164, 13.202262878417969, 13.598608016967773, 13.994953155517578, 14.391297340393066]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 13.0, 16.0, 18.0, 31.0, 25.0, 40.0, 30.0, 45.0, 50.0, 43.0, 57.0, 49.0, 51.0, 48.0, 39.0, 45.0, 44.0, 33.0, 39.0, 52.0, 34.0, 31.0, 20.0, 25.0, 12.0, 18.0, 14.0, 10.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.816917657852173, -3.698347806930542, -3.579777956008911, -3.4612081050872803, -3.3426382541656494, -3.2240684032440186, -3.1054985523223877, -2.986928701400757, -2.868358850479126, -2.749788999557495, -2.6312191486358643, -2.5126492977142334, -2.3940794467926025, -2.2755095958709717, -2.156939744949341, -2.03836989402771, -1.9198001623153687, -1.8012303113937378, -1.682660460472107, -1.564090609550476, -1.4455207586288452, -1.326951026916504, -1.208381175994873, -1.0898113250732422, -0.9712414145469666, -0.8526715636253357, -0.7341017127037048, -0.6155319213867188, -0.4969620406627655, -0.37839221954345703, -0.25982236862182617, -0.1412525177001953, -0.022682666778564453, 0.09588717669248581, 0.21445702016353607, 0.33302685618400574, 0.4515967071056366, 0.5701665282249451, 0.6887363791465759, 0.8073062300682068, 0.9258760809898376, 1.0444458723068237, 1.1630157232284546, 1.2815855741500854, 1.4001554250717163, 1.5187252759933472, 1.637295126914978, 1.7558649778366089, 1.8744348287582397, 1.9930046796798706, 2.111574411392212, 2.2301442623138428, 2.3487141132354736, 2.4672839641571045, 2.5858538150787354, 2.704423666000366, 2.822993516921997, 2.941563367843628, 3.060133218765259, 3.1787030696868896, 3.2972729206085205, 3.4158427715301514, 3.5344126224517822, 3.652982473373413, 3.771552324295044]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 24.0, 34.0, 55.0, 80.0, 120.0, 238.0, 360.0, 615.0, 1020.0, 1765.0, 3041.0, 5492.0, 9664.0, 17273.0, 29933.0, 51365.0, 84426.0, 126997.0, 165304.0, 173097.0, 139208.0, 96299.0, 59461.0, 35357.0, 20455.0, 11531.0, 6664.0, 3670.0, 2079.0, 1137.0, 664.0, 395.0, 269.0, 156.0, 93.0, 72.0, 39.0, 22.0, 15.0, 13.0, 11.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.22314453125, -1.1796875, -1.13623046875, -1.0927734375, -1.04931640625, -1.005859375, -0.96240234375, -0.9189453125, -0.87548828125, -0.83203125, -0.78857421875, -0.7451171875, -0.70166015625, -0.658203125, -0.61474609375, -0.5712890625, -0.52783203125, -0.484375, -0.44091796875, -0.3974609375, -0.35400390625, -0.310546875, -0.26708984375, -0.2236328125, -0.18017578125, -0.13671875, -0.09326171875, -0.0498046875, -0.00634765625, 0.037109375, 0.08056640625, 0.1240234375, 0.16748046875, 0.2109375, 0.25439453125, 0.2978515625, 0.34130859375, 0.384765625, 0.42822265625, 0.4716796875, 0.51513671875, 0.55859375, 0.60205078125, 0.6455078125, 0.68896484375, 0.732421875, 0.77587890625, 0.8193359375, 0.86279296875, 0.90625, 0.94970703125, 0.9931640625, 1.03662109375, 1.080078125, 1.12353515625, 1.1669921875, 1.21044921875, 1.25390625, 1.29736328125, 1.3408203125, 1.38427734375, 1.427734375, 1.47119140625, 1.5146484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 9.0, 16.0, 14.0, 20.0, 19.0, 22.0, 40.0, 25.0, 34.0, 43.0, 52.0, 54.0, 63.0, 49.0, 57.0, 62.0, 52.0, 48.0, 45.0, 50.0, 39.0, 32.0, 37.0, 27.0, 23.0, 11.0, 7.0, 3.0, 9.0, 6.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.96142578125, -19.3916015625, -18.82177734375, -18.251953125, -17.68212890625, -17.1123046875, -16.54248046875, -15.97265625, -15.40283203125, -14.8330078125, -14.26318359375, -13.693359375, -13.12353515625, -12.5537109375, -11.98388671875, -11.4140625, -10.84423828125, -10.2744140625, -9.70458984375, -9.134765625, -8.56494140625, -7.9951171875, -7.42529296875, -6.85546875, -6.28564453125, -5.7158203125, -5.14599609375, -4.576171875, -4.00634765625, -3.4365234375, -2.86669921875, -2.296875, -1.72705078125, -1.1572265625, -0.58740234375, -0.017578125, 0.55224609375, 1.1220703125, 1.69189453125, 2.26171875, 2.83154296875, 3.4013671875, 3.97119140625, 4.541015625, 5.11083984375, 5.6806640625, 6.25048828125, 6.8203125, 7.39013671875, 7.9599609375, 8.52978515625, 9.099609375, 9.66943359375, 10.2392578125, 10.80908203125, 11.37890625, 11.94873046875, 12.5185546875, 13.08837890625, 13.658203125, 14.22802734375, 14.7978515625, 15.36767578125, 15.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 9.0, 5.0, 9.0, 13.0, 13.0, 18.0, 21.0, 45.0, 42.0, 49.0, 74.0, 80.0, 112.0, 130.0, 191.0, 275.0, 490.0, 1426.0, 12472.0, 378457.0, 626953.0, 23926.0, 2000.0, 556.0, 287.0, 206.0, 142.0, 132.0, 92.0, 66.0, 72.0, 43.0, 33.0, 33.0, 22.0, 16.0, 12.0, 9.0, 6.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-11.265625, -10.969970703125, -10.67431640625, -10.378662109375, -10.0830078125, -9.787353515625, -9.49169921875, -9.196044921875, -8.900390625, -8.604736328125, -8.30908203125, -8.013427734375, -7.7177734375, -7.422119140625, -7.12646484375, -6.830810546875, -6.53515625, -6.239501953125, -5.94384765625, -5.648193359375, -5.3525390625, -5.056884765625, -4.76123046875, -4.465576171875, -4.169921875, -3.874267578125, -3.57861328125, -3.282958984375, -2.9873046875, -2.691650390625, -2.39599609375, -2.100341796875, -1.8046875, -1.509033203125, -1.21337890625, -0.917724609375, -0.6220703125, -0.326416015625, -0.03076171875, 0.264892578125, 0.560546875, 0.856201171875, 1.15185546875, 1.447509765625, 1.7431640625, 2.038818359375, 2.33447265625, 2.630126953125, 2.92578125, 3.221435546875, 3.51708984375, 3.812744140625, 4.1083984375, 4.404052734375, 4.69970703125, 4.995361328125, 5.291015625, 5.586669921875, 5.88232421875, 6.177978515625, 6.4736328125, 6.769287109375, 7.06494140625, 7.360595703125, 7.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 9.0, 9.0, 11.0, 6.0, 17.0, 10.0, 21.0, 21.0, 24.0, 29.0, 33.0, 38.0, 40.0, 34.0, 36.0, 51.0, 51.0, 40.0, 60.0, 43.0, 53.0, 43.0, 34.0, 31.0, 35.0, 33.0, 38.0, 27.0, 18.0, 19.0, 14.0, 16.0, 15.0, 7.0, 4.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.734375, -16.2696533203125, -15.804931640625, -15.3402099609375, -14.87548828125, -14.4107666015625, -13.946044921875, -13.4813232421875, -13.0166015625, -12.5518798828125, -12.087158203125, -11.6224365234375, -11.15771484375, -10.6929931640625, -10.228271484375, -9.7635498046875, -9.298828125, -8.8341064453125, -8.369384765625, -7.9046630859375, -7.43994140625, -6.9752197265625, -6.510498046875, -6.0457763671875, -5.5810546875, -5.1163330078125, -4.651611328125, -4.1868896484375, -3.72216796875, -3.2574462890625, -2.792724609375, -2.3280029296875, -1.86328125, -1.3985595703125, -0.933837890625, -0.4691162109375, -0.00439453125, 0.4603271484375, 0.925048828125, 1.3897705078125, 1.8544921875, 2.3192138671875, 2.783935546875, 3.2486572265625, 3.71337890625, 4.1781005859375, 4.642822265625, 5.1075439453125, 5.572265625, 6.0369873046875, 6.501708984375, 6.9664306640625, 7.43115234375, 7.8958740234375, 8.360595703125, 8.8253173828125, 9.2900390625, 9.7547607421875, 10.219482421875, 10.6842041015625, 11.14892578125, 11.6136474609375, 12.078369140625, 12.5430908203125, 13.0078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 5.0, 11.0, 28.0, 47.0, 117.0, 469.0, 5239.0, 1035040.0, 6787.0, 572.0, 118.0, 48.0, 22.0, 16.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.57598876953125, -6.2965087890625, -6.01702880859375, -5.737548828125, -5.45806884765625, -5.1785888671875, -4.89910888671875, -4.61962890625, -4.34014892578125, -4.0606689453125, -3.78118896484375, -3.501708984375, -3.22222900390625, -2.9427490234375, -2.66326904296875, -2.3837890625, -2.10430908203125, -1.8248291015625, -1.54534912109375, -1.265869140625, -0.98638916015625, -0.7069091796875, -0.42742919921875, -0.14794921875, 0.13153076171875, 0.4110107421875, 0.69049072265625, 0.969970703125, 1.24945068359375, 1.5289306640625, 1.80841064453125, 2.087890625, 2.36737060546875, 2.6468505859375, 2.92633056640625, 3.205810546875, 3.48529052734375, 3.7647705078125, 4.04425048828125, 4.32373046875, 4.60321044921875, 4.8826904296875, 5.16217041015625, 5.441650390625, 5.72113037109375, 6.0006103515625, 6.28009033203125, 6.5595703125, 6.83905029296875, 7.1185302734375, 7.39801025390625, 7.677490234375, 7.95697021484375, 8.2364501953125, 8.51593017578125, 8.79541015625, 9.07489013671875, 9.3543701171875, 9.63385009765625, 9.913330078125, 10.19281005859375, 10.4722900390625, 10.75177001953125, 11.03125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 17.0, 26.0, 61.0, 115.0, 168.0, 187.0, 156.0, 95.0, 68.0, 41.0, 16.0, 10.0, 3.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003647804260253906, -0.0003528296947479248, -0.000340878963470459, -0.00032892823219299316, -0.00031697750091552734, -0.0003050267696380615, -0.0002930760383605957, -0.0002811253070831299, -0.00026917457580566406, -0.00025722384452819824, -0.0002452731132507324, -0.0002333223819732666, -0.00022137165069580078, -0.00020942091941833496, -0.00019747018814086914, -0.00018551945686340332, -0.0001735687255859375, -0.00016161799430847168, -0.00014966726303100586, -0.00013771653175354004, -0.00012576580047607422, -0.0001138150691986084, -0.00010186433792114258, -8.991360664367676e-05, -7.796287536621094e-05, -6.601214408874512e-05, -5.40614128112793e-05, -4.2110681533813477e-05, -3.0159950256347656e-05, -1.8209218978881836e-05, -6.258487701416016e-06, 5.692243576049805e-06, 1.7642974853515625e-05, 2.9593706130981445e-05, 4.1544437408447266e-05, 5.3495168685913086e-05, 6.54458999633789e-05, 7.739663124084473e-05, 8.934736251831055e-05, 0.00010129809379577637, 0.00011324882507324219, 0.000125199556350708, 0.00013715028762817383, 0.00014910101890563965, 0.00016105175018310547, 0.0001730024814605713, 0.0001849532127380371, 0.00019690394401550293, 0.00020885467529296875, 0.00022080540657043457, 0.0002327561378479004, 0.0002447068691253662, 0.00025665760040283203, 0.00026860833168029785, 0.00028055906295776367, 0.0002925097942352295, 0.0003044605255126953, 0.00031641125679016113, 0.00032836198806762695, 0.0003403127193450928, 0.0003522634506225586, 0.0003642141819000244, 0.00037616491317749023, 0.00038811564445495605, 0.0004000663757324219]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 16.0, 35.0, 39.0, 77.0, 141.0, 299.0, 979.0, 5133.0, 90292.0, 890402.0, 55586.0, 4086.0, 817.0, 257.0, 154.0, 86.0, 38.0, 25.0, 11.0, 8.0, 14.0, 6.0, 5.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.234954833984375, -2.15350341796875, -2.072052001953125, -1.9906005859375, -1.909149169921875, -1.82769775390625, -1.746246337890625, -1.664794921875, -1.583343505859375, -1.50189208984375, -1.420440673828125, -1.3389892578125, -1.257537841796875, -1.17608642578125, -1.094635009765625, -1.01318359375, -0.931732177734375, -0.85028076171875, -0.768829345703125, -0.6873779296875, -0.605926513671875, -0.52447509765625, -0.443023681640625, -0.361572265625, -0.280120849609375, -0.19866943359375, -0.117218017578125, -0.0357666015625, 0.045684814453125, 0.12713623046875, 0.208587646484375, 0.2900390625, 0.371490478515625, 0.45294189453125, 0.534393310546875, 0.6158447265625, 0.697296142578125, 0.77874755859375, 0.860198974609375, 0.941650390625, 1.023101806640625, 1.10455322265625, 1.186004638671875, 1.2674560546875, 1.348907470703125, 1.43035888671875, 1.511810302734375, 1.59326171875, 1.674713134765625, 1.75616455078125, 1.837615966796875, 1.9190673828125, 2.000518798828125, 2.08197021484375, 2.163421630859375, 2.244873046875, 2.326324462890625, 2.40777587890625, 2.489227294921875, 2.5706787109375, 2.652130126953125, 2.73358154296875, 2.815032958984375, 2.896484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 9.0, 8.0, 10.0, 16.0, 18.0, 38.0, 36.0, 56.0, 59.0, 93.0, 66.0, 100.0, 97.0, 87.0, 81.0, 50.0, 56.0, 36.0, 27.0, 17.0, 9.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5372390747070312, -0.5207672119140625, -0.5042953491210938, -0.487823486328125, -0.47135162353515625, -0.4548797607421875, -0.43840789794921875, -0.42193603515625, -0.40546417236328125, -0.3889923095703125, -0.37252044677734375, -0.356048583984375, -0.33957672119140625, -0.3231048583984375, -0.30663299560546875, -0.2901611328125, -0.27368927001953125, -0.2572174072265625, -0.24074554443359375, -0.224273681640625, -0.20780181884765625, -0.1913299560546875, -0.17485809326171875, -0.15838623046875, -0.14191436767578125, -0.1254425048828125, -0.10897064208984375, -0.092498779296875, -0.07602691650390625, -0.0595550537109375, -0.04308319091796875, -0.026611328125, -0.01013946533203125, 0.0063323974609375, 0.02280426025390625, 0.039276123046875, 0.05574798583984375, 0.0722198486328125, 0.08869171142578125, 0.10516357421875, 0.12163543701171875, 0.1381072998046875, 0.15457916259765625, 0.171051025390625, 0.18752288818359375, 0.2039947509765625, 0.22046661376953125, 0.2369384765625, 0.25341033935546875, 0.2698822021484375, 0.28635406494140625, 0.302825927734375, 0.31929779052734375, 0.3357696533203125, 0.35224151611328125, 0.36871337890625, 0.38518524169921875, 0.4016571044921875, 0.41812896728515625, 0.434600830078125, 0.45107269287109375, 0.4675445556640625, 0.48401641845703125, 0.50048828125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 19.0, 55.0, 204.0, 341.0, 289.0, 80.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.697264671325684, -7.567928314208984, -6.438591957092285, -5.309255123138428, -4.1799187660217285, -3.0505824089050293, -1.9212455749511719, -0.7919092178344727, 0.33742713928222656, 1.4667636156082153, 2.596100091934204, 3.7254366874694824, 4.854773044586182, 5.984109401702881, 7.113446235656738, 8.242782592773438, 9.372118949890137, 10.501455307006836, 11.630791664123535, 12.760128021240234, 13.88946533203125, 15.018800735473633, 16.14813804626465, 17.27747344970703, 18.406810760498047, 19.536148071289062, 20.665483474731445, 21.79482078552246, 22.924156188964844, 24.05349349975586, 25.182830810546875, 26.312166213989258, 27.44150161743164, 28.570838928222656, 29.70017433166504, 30.829511642456055, 31.958847045898438, 33.08818435668945, 34.21752166748047, 35.34685516357422, 36.476192474365234, 37.60552978515625, 38.734867095947266, 39.864200592041016, 40.99353790283203, 42.12287521362305, 43.25221252441406, 44.38154602050781, 45.510887145996094, 46.64022445678711, 47.769561767578125, 48.898895263671875, 50.02823257446289, 51.157569885253906, 52.28690719604492, 53.41624450683594, 54.54557800292969, 55.6749153137207, 56.80425262451172, 57.93358612060547, 59.062923431396484, 60.1922607421875, 61.321598052978516, 62.45093536376953, 63.58026885986328]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 8.0, 8.0, 7.0, 21.0, 14.0, 22.0, 25.0, 22.0, 22.0, 28.0, 34.0, 24.0, 44.0, 46.0, 51.0, 41.0, 48.0, 47.0, 50.0, 44.0, 49.0, 49.0, 48.0, 27.0, 37.0, 29.0, 26.0, 32.0, 17.0, 7.0, 7.0, 11.0, 12.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.276214599609375, -25.53334617614746, -24.790477752685547, -24.047609329223633, -23.30474090576172, -22.561872482299805, -21.81900405883789, -21.07613754272461, -20.333267211914062, -19.59039878845215, -18.847530364990234, -18.10466194152832, -17.361793518066406, -16.618925094604492, -15.876057624816895, -15.13318920135498, -14.390321731567383, -13.647453308105469, -12.904584884643555, -12.16171646118164, -11.418848037719727, -10.675979614257812, -9.933112144470215, -9.1902437210083, -8.447375297546387, -7.704506874084473, -6.961638450622559, -6.218770503997803, -5.475902080535889, -4.733033657073975, -3.9901657104492188, -3.2472972869873047, -2.5044307708740234, -1.761562466621399, -1.0186941623687744, -0.27582597732543945, 0.4670424461364746, 1.2099108695983887, 1.9527788162231445, 2.6956472396850586, 3.4385156631469727, 4.181384086608887, 4.924252510070801, 5.667120456695557, 6.409988880157471, 7.152857303619385, 7.895725250244141, 8.638593673706055, 9.381462097167969, 10.124330520629883, 10.867198944091797, 11.610067367553711, 12.352935791015625, 13.095804214477539, 13.838671684265137, 14.58154010772705, 15.324408531188965, 16.067276000976562, 16.810144424438477, 17.55301284790039, 18.295881271362305, 19.03874969482422, 19.781618118286133, 20.524486541748047, 21.26735496520996]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 10.0, 20.0, 27.0, 35.0, 50.0, 86.0, 162.0, 271.0, 515.0, 1065.0, 2239.0, 5314.0, 13311.0, 36809.0, 115715.0, 384351.0, 1034491.0, 1419658.0, 798462.0, 261169.0, 77253.0, 25715.0, 9734.0, 4063.0, 1776.0, 839.0, 463.0, 256.0, 144.0, 85.0, 54.0, 38.0, 19.0, 13.0, 10.0, 10.0, 10.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5234375, -4.37908935546875, -4.2347412109375, -4.09039306640625, -3.946044921875, -3.80169677734375, -3.6573486328125, -3.51300048828125, -3.36865234375, -3.22430419921875, -3.0799560546875, -2.93560791015625, -2.791259765625, -2.64691162109375, -2.5025634765625, -2.35821533203125, -2.2138671875, -2.06951904296875, -1.9251708984375, -1.78082275390625, -1.636474609375, -1.49212646484375, -1.3477783203125, -1.20343017578125, -1.05908203125, -0.91473388671875, -0.7703857421875, -0.62603759765625, -0.481689453125, -0.33734130859375, -0.1929931640625, -0.04864501953125, 0.095703125, 0.24005126953125, 0.3843994140625, 0.52874755859375, 0.673095703125, 0.81744384765625, 0.9617919921875, 1.10614013671875, 1.25048828125, 1.39483642578125, 1.5391845703125, 1.68353271484375, 1.827880859375, 1.97222900390625, 2.1165771484375, 2.26092529296875, 2.4052734375, 2.54962158203125, 2.6939697265625, 2.83831787109375, 2.982666015625, 3.12701416015625, 3.2713623046875, 3.41571044921875, 3.56005859375, 3.70440673828125, 3.8487548828125, 3.99310302734375, 4.137451171875, 4.28179931640625, 4.4261474609375, 4.57049560546875, 4.71484375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 9.0, 7.0, 8.0, 10.0, 16.0, 16.0, 31.0, 17.0, 26.0, 34.0, 38.0, 26.0, 28.0, 32.0, 44.0, 36.0, 47.0, 45.0, 49.0, 51.0, 36.0, 38.0, 44.0, 40.0, 30.0, 32.0, 41.0, 22.0, 21.0, 19.0, 20.0, 11.0, 10.0, 13.0, 6.0, 8.0, 5.0, 6.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.76171875, -3.6334228515625, -3.505126953125, -3.3768310546875, -3.24853515625, -3.1202392578125, -2.991943359375, -2.8636474609375, -2.7353515625, -2.6070556640625, -2.478759765625, -2.3504638671875, -2.22216796875, -2.0938720703125, -1.965576171875, -1.8372802734375, -1.708984375, -1.5806884765625, -1.452392578125, -1.3240966796875, -1.19580078125, -1.0675048828125, -0.939208984375, -0.8109130859375, -0.6826171875, -0.5543212890625, -0.426025390625, -0.2977294921875, -0.16943359375, -0.0411376953125, 0.087158203125, 0.2154541015625, 0.34375, 0.4720458984375, 0.600341796875, 0.7286376953125, 0.85693359375, 0.9852294921875, 1.113525390625, 1.2418212890625, 1.3701171875, 1.4984130859375, 1.626708984375, 1.7550048828125, 1.88330078125, 2.0115966796875, 2.139892578125, 2.2681884765625, 2.396484375, 2.5247802734375, 2.653076171875, 2.7813720703125, 2.90966796875, 3.0379638671875, 3.166259765625, 3.2945556640625, 3.4228515625, 3.5511474609375, 3.679443359375, 3.8077392578125, 3.93603515625, 4.0643310546875, 4.192626953125, 4.3209228515625, 4.44921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 8.0, 10.0, 17.0, 22.0, 75.0, 241.0, 27000.0, 4166308.0, 419.0, 63.0, 29.0, 21.0, 13.0, 4.0, 13.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.4375, -96.2451171875, -93.052734375, -89.8603515625, -86.66796875, -83.4755859375, -80.283203125, -77.0908203125, -73.8984375, -70.7060546875, -67.513671875, -64.3212890625, -61.12890625, -57.9365234375, -54.744140625, -51.5517578125, -48.359375, -45.1669921875, -41.974609375, -38.7822265625, -35.58984375, -32.3974609375, -29.205078125, -26.0126953125, -22.8203125, -19.6279296875, -16.435546875, -13.2431640625, -10.05078125, -6.8583984375, -3.666015625, -0.4736328125, 2.71875, 5.9111328125, 9.103515625, 12.2958984375, 15.48828125, 18.6806640625, 21.873046875, 25.0654296875, 28.2578125, 31.4501953125, 34.642578125, 37.8349609375, 41.02734375, 44.2197265625, 47.412109375, 50.6044921875, 53.796875, 56.9892578125, 60.181640625, 63.3740234375, 66.56640625, 69.7587890625, 72.951171875, 76.1435546875, 79.3359375, 82.5283203125, 85.720703125, 88.9130859375, 92.10546875, 95.2978515625, 98.490234375, 101.6826171875, 104.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 14.0, 11.0, 11.0, 16.0, 22.0, 25.0, 31.0, 57.0, 63.0, 93.0, 117.0, 168.0, 224.0, 313.0, 429.0, 508.0, 442.0, 409.0, 317.0, 217.0, 164.0, 114.0, 78.0, 66.0, 49.0, 30.0, 17.0, 27.0, 8.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.4609375, -2.39410400390625, -2.3272705078125, -2.26043701171875, -2.193603515625, -2.12677001953125, -2.0599365234375, -1.99310302734375, -1.92626953125, -1.85943603515625, -1.7926025390625, -1.72576904296875, -1.658935546875, -1.59210205078125, -1.5252685546875, -1.45843505859375, -1.3916015625, -1.32476806640625, -1.2579345703125, -1.19110107421875, -1.124267578125, -1.05743408203125, -0.9906005859375, -0.92376708984375, -0.85693359375, -0.79010009765625, -0.7232666015625, -0.65643310546875, -0.589599609375, -0.52276611328125, -0.4559326171875, -0.38909912109375, -0.322265625, -0.25543212890625, -0.1885986328125, -0.12176513671875, -0.054931640625, 0.01190185546875, 0.0787353515625, 0.14556884765625, 0.21240234375, 0.27923583984375, 0.3460693359375, 0.41290283203125, 0.479736328125, 0.54656982421875, 0.6134033203125, 0.68023681640625, 0.7470703125, 0.81390380859375, 0.8807373046875, 0.94757080078125, 1.014404296875, 1.08123779296875, 1.1480712890625, 1.21490478515625, 1.28173828125, 1.34857177734375, 1.4154052734375, 1.48223876953125, 1.549072265625, 1.61590576171875, 1.6827392578125, 1.74957275390625, 1.81640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 21.0, 27.0, 33.0, 40.0, 58.0, 71.0, 81.0, 83.0, 98.0, 92.0, 83.0, 79.0, 55.0, 52.0, 36.0, 32.0, 16.0, 12.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.964637279510498, -4.736578941345215, -4.50852108001709, -4.280462741851807, -4.052404403686523, -3.8243460655212402, -3.596287965774536, -3.368229866027832, -3.140171527862549, -2.9121131896972656, -2.6840550899505615, -2.4559969902038574, -2.227938652038574, -1.9998804330825806, -1.771822214126587, -1.5437639951705933, -1.3157057762145996, -1.087647557258606, -0.8595893383026123, -0.6315311193466187, -0.403472900390625, -0.17541468143463135, 0.052643537521362305, 0.28070175647735596, 0.5087599754333496, 0.7368181943893433, 0.9648764133453369, 1.1929346323013306, 1.4209928512573242, 1.6490510702133179, 1.8771092891693115, 2.1051673889160156, 2.333226203918457, 2.5612845420837402, 2.7893426418304443, 3.0174007415771484, 3.2454590797424316, 3.473517417907715, 3.701575517654419, 3.929633617401123, 4.157691955566406, 4.3857502937316895, 4.613808631896973, 4.841866493225098, 5.069924831390381, 5.297983169555664, 5.526041030883789, 5.754099369049072, 5.9821577072143555, 6.210216045379639, 6.438274383544922, 6.666332244873047, 6.89439058303833, 7.122448921203613, 7.350506782531738, 7.5785651206970215, 7.806623458862305, 8.03468132019043, 8.262740135192871, 8.490797996520996, 8.718856811523438, 8.946914672851562, 9.174972534179688, 9.403031349182129, 9.631089210510254]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 5.0, 14.0, 21.0, 15.0, 23.0, 25.0, 23.0, 37.0, 33.0, 27.0, 42.0, 41.0, 41.0, 47.0, 57.0, 40.0, 30.0, 44.0, 35.0, 34.0, 37.0, 25.0, 36.0, 32.0, 26.0, 31.0, 20.0, 23.0, 22.0, 17.0, 13.0, 9.0, 5.0, 12.0, 7.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-4.238742351531982, -4.105901718139648, -3.9730613231658936, -3.8402206897735596, -3.7073802947998047, -3.5745396614074707, -3.4416990280151367, -3.3088583946228027, -3.176017999649048, -3.043177366256714, -2.910336971282959, -2.777496337890625, -2.644655704498291, -2.511815309524536, -2.378974676132202, -2.2461342811584473, -2.1132936477661133, -1.9804531335830688, -1.8476126194000244, -1.7147719860076904, -1.581931471824646, -1.4490909576416016, -1.3162503242492676, -1.1834098100662231, -1.0505692958831787, -0.9177287817001343, -0.7848882079124451, -0.6520476341247559, -0.5192071199417114, -0.386366605758667, -0.2535260319709778, -0.12068545818328857, 0.01215505599975586, 0.14499559998512268, 0.2778361439704895, 0.4106766879558563, 0.5435172319412231, 0.6763577461242676, 0.8091983199119568, 0.942038893699646, 1.0748794078826904, 1.2077199220657349, 1.3405604362487793, 1.4734010696411133, 1.6062415838241577, 1.7390820980072021, 1.8719227313995361, 2.004763126373291, 2.137603759765625, 2.270444393157959, 2.403284788131714, 2.536125421524048, 2.6689658164978027, 2.8018064498901367, 2.9346470832824707, 3.0674877166748047, 3.2003281116485596, 3.3331687450408936, 3.4660091400146484, 3.5988497734069824, 3.7316904067993164, 3.8645308017730713, 3.9973714351654053, 4.13021183013916, 4.263052463531494]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 10.0, 5.0, 10.0, 15.0, 26.0, 28.0, 35.0, 45.0, 57.0, 82.0, 117.0, 155.0, 171.0, 252.0, 355.0, 418.0, 532.0, 750.0, 1021.0, 1380.0, 2005.0, 3514.0, 8143.0, 29977.0, 132495.0, 402008.0, 335165.0, 92255.0, 21239.0, 6472.0, 2996.0, 1756.0, 1276.0, 933.0, 681.0, 542.0, 405.0, 299.0, 220.0, 162.0, 132.0, 97.0, 83.0, 57.0, 59.0, 35.0, 23.0, 20.0, 12.0, 15.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.82763671875, -0.8016738891601562, -0.7757110595703125, -0.7497482299804688, -0.723785400390625, -0.6978225708007812, -0.6718597412109375, -0.6458969116210938, -0.61993408203125, -0.5939712524414062, -0.5680084228515625, -0.5420455932617188, -0.516082763671875, -0.49011993408203125, -0.4641571044921875, -0.43819427490234375, -0.4122314453125, -0.38626861572265625, -0.3603057861328125, -0.33434295654296875, -0.308380126953125, -0.28241729736328125, -0.2564544677734375, -0.23049163818359375, -0.20452880859375, -0.17856597900390625, -0.1526031494140625, -0.12664031982421875, -0.100677490234375, -0.07471466064453125, -0.0487518310546875, -0.02278900146484375, 0.003173828125, 0.02913665771484375, 0.0550994873046875, 0.08106231689453125, 0.107025146484375, 0.13298797607421875, 0.1589508056640625, 0.18491363525390625, 0.21087646484375, 0.23683929443359375, 0.2628021240234375, 0.28876495361328125, 0.314727783203125, 0.34069061279296875, 0.3666534423828125, 0.39261627197265625, 0.4185791015625, 0.44454193115234375, 0.4705047607421875, 0.49646759033203125, 0.522430419921875, 0.5483932495117188, 0.5743560791015625, 0.6003189086914062, 0.62628173828125, 0.6522445678710938, 0.6782073974609375, 0.7041702270507812, 0.730133056640625, 0.7560958862304688, 0.7820587158203125, 0.8080215454101562, 0.833984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 13.0, 10.0, 15.0, 29.0, 13.0, 22.0, 21.0, 34.0, 37.0, 39.0, 41.0, 35.0, 36.0, 46.0, 25.0, 52.0, 48.0, 42.0, 30.0, 43.0, 40.0, 35.0, 23.0, 38.0, 21.0, 34.0, 30.0, 25.0, 16.0, 11.0, 10.0, 13.0, 10.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650390625, -2.560577392578125, -2.47076416015625, -2.380950927734375, -2.2911376953125, -2.201324462890625, -2.11151123046875, -2.021697998046875, -1.931884765625, -1.842071533203125, -1.75225830078125, -1.662445068359375, -1.5726318359375, -1.482818603515625, -1.39300537109375, -1.303192138671875, -1.21337890625, -1.123565673828125, -1.03375244140625, -0.943939208984375, -0.8541259765625, -0.764312744140625, -0.67449951171875, -0.584686279296875, -0.494873046875, -0.405059814453125, -0.31524658203125, -0.225433349609375, -0.1356201171875, -0.045806884765625, 0.04400634765625, 0.133819580078125, 0.2236328125, 0.313446044921875, 0.40325927734375, 0.493072509765625, 0.5828857421875, 0.672698974609375, 0.76251220703125, 0.852325439453125, 0.942138671875, 1.031951904296875, 1.12176513671875, 1.211578369140625, 1.3013916015625, 1.391204833984375, 1.48101806640625, 1.570831298828125, 1.66064453125, 1.750457763671875, 1.84027099609375, 1.930084228515625, 2.0198974609375, 2.109710693359375, 2.19952392578125, 2.289337158203125, 2.379150390625, 2.468963623046875, 2.55877685546875, 2.648590087890625, 2.7384033203125, 2.828216552734375, 2.91802978515625, 3.007843017578125, 3.09765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 14.0, 21.0, 37.0, 50.0, 105.0, 189.0, 295.0, 647.0, 1177.0, 2403.0, 4537.0, 8963.0, 17668.0, 32726.0, 60601.0, 105859.0, 164604.0, 202284.0, 178463.0, 118634.0, 69643.0, 37997.0, 19847.0, 10712.0, 5413.0, 2754.0, 1372.0, 706.0, 388.0, 194.0, 106.0, 47.0, 20.0, 22.0, 15.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28369140625, -0.2744255065917969, -0.26515960693359375, -0.2558937072753906, -0.2466278076171875, -0.23736190795898438, -0.22809600830078125, -0.21883010864257812, -0.209564208984375, -0.20029830932617188, -0.19103240966796875, -0.18176651000976562, -0.1725006103515625, -0.16323471069335938, -0.15396881103515625, -0.14470291137695312, -0.13543701171875, -0.12617111206054688, -0.11690521240234375, -0.10763931274414062, -0.0983734130859375, -0.08910751342773438, -0.07984161376953125, -0.07057571411132812, -0.061309814453125, -0.052043914794921875, -0.04277801513671875, -0.033512115478515625, -0.0242462158203125, -0.014980316162109375, -0.00571441650390625, 0.003551483154296875, 0.0128173828125, 0.022083282470703125, 0.03134918212890625, 0.040615081787109375, 0.0498809814453125, 0.059146881103515625, 0.06841278076171875, 0.07767868041992188, 0.086944580078125, 0.09621047973632812, 0.10547637939453125, 0.11474227905273438, 0.1240081787109375, 0.13327407836914062, 0.14253997802734375, 0.15180587768554688, 0.16107177734375, 0.17033767700195312, 0.17960357666015625, 0.18886947631835938, 0.1981353759765625, 0.20740127563476562, 0.21666717529296875, 0.22593307495117188, 0.235198974609375, 0.24446487426757812, 0.25373077392578125, 0.2629966735839844, 0.2722625732421875, 0.2815284729003906, 0.29079437255859375, 0.3000602722167969, 0.309326171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 5.0, 8.0, 6.0, 16.0, 18.0, 21.0, 13.0, 18.0, 26.0, 20.0, 32.0, 32.0, 37.0, 39.0, 44.0, 58.0, 43.0, 51.0, 75.0, 54.0, 56.0, 36.0, 34.0, 38.0, 27.0, 33.0, 30.0, 20.0, 25.0, 11.0, 14.0, 12.0, 9.0, 2.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.21484375, -6.0247802734375, -5.834716796875, -5.6446533203125, -5.45458984375, -5.2645263671875, -5.074462890625, -4.8843994140625, -4.6943359375, -4.5042724609375, -4.314208984375, -4.1241455078125, -3.93408203125, -3.7440185546875, -3.553955078125, -3.3638916015625, -3.173828125, -2.9837646484375, -2.793701171875, -2.6036376953125, -2.41357421875, -2.2235107421875, -2.033447265625, -1.8433837890625, -1.6533203125, -1.4632568359375, -1.273193359375, -1.0831298828125, -0.89306640625, -0.7030029296875, -0.512939453125, -0.3228759765625, -0.1328125, 0.0572509765625, 0.247314453125, 0.4373779296875, 0.62744140625, 0.8175048828125, 1.007568359375, 1.1976318359375, 1.3876953125, 1.5777587890625, 1.767822265625, 1.9578857421875, 2.14794921875, 2.3380126953125, 2.528076171875, 2.7181396484375, 2.908203125, 3.0982666015625, 3.288330078125, 3.4783935546875, 3.66845703125, 3.8585205078125, 4.048583984375, 4.2386474609375, 4.4287109375, 4.6187744140625, 4.808837890625, 4.9989013671875, 5.18896484375, 5.3790283203125, 5.569091796875, 5.7591552734375, 5.94921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 8.0, 23.0, 32.0, 43.0, 64.0, 76.0, 133.0, 227.0, 350.0, 717.0, 1519.0, 3315.0, 8583.0, 27051.0, 104885.0, 361604.0, 379720.0, 115058.0, 29096.0, 9133.0, 3584.0, 1572.0, 755.0, 391.0, 207.0, 125.0, 92.0, 49.0, 46.0, 20.0, 17.0, 20.0, 3.0, 7.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0684814453125, -0.06640815734863281, -0.06433486938476562, -0.06226158142089844, -0.06018829345703125, -0.05811500549316406, -0.056041717529296875, -0.05396842956542969, -0.0518951416015625, -0.04982185363769531, -0.047748565673828125, -0.04567527770996094, -0.04360198974609375, -0.04152870178222656, -0.039455413818359375, -0.03738212585449219, -0.035308837890625, -0.03323554992675781, -0.031162261962890625, -0.029088973999023438, -0.02701568603515625, -0.024942398071289062, -0.022869110107421875, -0.020795822143554688, -0.0187225341796875, -0.016649246215820312, -0.014575958251953125, -0.012502670288085938, -0.01042938232421875, -0.008356094360351562, -0.006282806396484375, -0.0042095184326171875, -0.00213623046875, -6.29425048828125e-05, 0.002010345458984375, 0.0040836334228515625, 0.00615692138671875, 0.008230209350585938, 0.010303497314453125, 0.012376785278320312, 0.0144500732421875, 0.016523361206054688, 0.018596649169921875, 0.020669937133789062, 0.02274322509765625, 0.024816513061523438, 0.026889801025390625, 0.028963088989257812, 0.031036376953125, 0.03310966491699219, 0.035182952880859375, 0.03725624084472656, 0.03932952880859375, 0.04140281677246094, 0.043476104736328125, 0.04554939270019531, 0.0476226806640625, 0.04969596862792969, 0.051769256591796875, 0.05384254455566406, 0.05591583251953125, 0.05798912048339844, 0.060062408447265625, 0.06213569641113281, 0.064208984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 22.0, 25.0, 29.0, 42.0, 58.0, 46.0, 93.0, 97.0, 114.0, 65.0, 85.0, 89.0, 62.0, 37.0, 38.0, 17.0, 25.0, 5.0, 11.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.1616691052913666e-05, -4.958920180797577e-05, -4.756171256303787e-05, -4.5534223318099976e-05, -4.350673407316208e-05, -4.147924482822418e-05, -3.9451755583286285e-05, -3.742426633834839e-05, -3.539677709341049e-05, -3.3369287848472595e-05, -3.13417986035347e-05, -2.9314309358596802e-05, -2.7286820113658905e-05, -2.5259330868721008e-05, -2.323184162378311e-05, -2.1204352378845215e-05, -1.9176863133907318e-05, -1.714937388896942e-05, -1.5121884644031525e-05, -1.3094395399093628e-05, -1.1066906154155731e-05, -9.039416909217834e-06, -7.011927664279938e-06, -4.984438419342041e-06, -2.9569491744041443e-06, -9.294599294662476e-07, 1.0980293154716492e-06, 3.125518560409546e-06, 5.153007805347443e-06, 7.180497050285339e-06, 9.207986295223236e-06, 1.1235475540161133e-05, 1.326296478509903e-05, 1.5290454030036926e-05, 1.7317943274974823e-05, 1.934543251991272e-05, 2.1372921764850616e-05, 2.3400411009788513e-05, 2.542790025472641e-05, 2.7455389499664307e-05, 2.9482878744602203e-05, 3.15103679895401e-05, 3.3537857234478e-05, 3.5565346479415894e-05, 3.759283572435379e-05, 3.962032496929169e-05, 4.1647814214229584e-05, 4.367530345916748e-05, 4.570279270410538e-05, 4.7730281949043274e-05, 4.975777119398117e-05, 5.178526043891907e-05, 5.3812749683856964e-05, 5.584023892879486e-05, 5.786772817373276e-05, 5.9895217418670654e-05, 6.192270666360855e-05, 6.395019590854645e-05, 6.597768515348434e-05, 6.800517439842224e-05, 7.003266364336014e-05, 7.206015288829803e-05, 7.408764213323593e-05, 7.611513137817383e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 11.0, 25.0, 29.0, 32.0, 59.0, 85.0, 132.0, 433.0, 3419.0, 94243.0, 911685.0, 35643.0, 2025.0, 356.0, 127.0, 59.0, 43.0, 34.0, 20.0, 15.0, 10.0, 14.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2177734375, -0.21104812622070312, -0.20432281494140625, -0.19759750366210938, -0.1908721923828125, -0.18414688110351562, -0.17742156982421875, -0.17069625854492188, -0.163970947265625, -0.15724563598632812, -0.15052032470703125, -0.14379501342773438, -0.1370697021484375, -0.13034439086914062, -0.12361907958984375, -0.11689376831054688, -0.11016845703125, -0.10344314575195312, -0.09671783447265625, -0.08999252319335938, -0.0832672119140625, -0.07654190063476562, -0.06981658935546875, -0.06309127807617188, -0.056365966796875, -0.049640655517578125, -0.04291534423828125, -0.036190032958984375, -0.0294647216796875, -0.022739410400390625, -0.01601409912109375, -0.009288787841796875, -0.0025634765625, 0.004161834716796875, 0.01088714599609375, 0.017612457275390625, 0.0243377685546875, 0.031063079833984375, 0.03778839111328125, 0.044513702392578125, 0.051239013671875, 0.057964324951171875, 0.06468963623046875, 0.07141494750976562, 0.0781402587890625, 0.08486557006835938, 0.09159088134765625, 0.09831619262695312, 0.10504150390625, 0.11176681518554688, 0.11849212646484375, 0.12521743774414062, 0.1319427490234375, 0.13866806030273438, 0.14539337158203125, 0.15211868286132812, 0.158843994140625, 0.16556930541992188, 0.17229461669921875, 0.17901992797851562, 0.1857452392578125, 0.19247055053710938, 0.19919586181640625, 0.20592117309570312, 0.212646484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 14.0, 22.0, 12.0, 31.0, 38.0, 55.0, 59.0, 91.0, 108.0, 118.0, 100.0, 89.0, 69.0, 52.0, 22.0, 23.0, 19.0, 11.0, 10.0, 9.0, 7.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220947265625, -0.021407127380371094, -0.020719528198242188, -0.02003192901611328, -0.019344329833984375, -0.01865673065185547, -0.017969131469726562, -0.017281532287597656, -0.01659393310546875, -0.015906333923339844, -0.015218734741210938, -0.014531135559082031, -0.013843536376953125, -0.013155937194824219, -0.012468338012695312, -0.011780738830566406, -0.0110931396484375, -0.010405540466308594, -0.009717941284179688, -0.009030342102050781, -0.008342742919921875, -0.007655143737792969, -0.0069675445556640625, -0.006279945373535156, -0.00559234619140625, -0.004904747009277344, -0.0042171478271484375, -0.0035295486450195312, -0.002841949462890625, -0.0021543502807617188, -0.0014667510986328125, -0.0007791519165039062, -9.1552734375e-05, 0.0005960464477539062, 0.0012836456298828125, 0.0019712448120117188, 0.002658843994140625, 0.0033464431762695312, 0.0040340423583984375, 0.004721641540527344, 0.00540924072265625, 0.006096839904785156, 0.0067844390869140625, 0.007472038269042969, 0.008159637451171875, 0.008847236633300781, 0.009534835815429688, 0.010222434997558594, 0.0109100341796875, 0.011597633361816406, 0.012285232543945312, 0.012972831726074219, 0.013660430908203125, 0.014348030090332031, 0.015035629272460938, 0.015723228454589844, 0.01641082763671875, 0.017098426818847656, 0.017786026000976562, 0.01847362518310547, 0.019161224365234375, 0.01984882354736328, 0.020536422729492188, 0.021224021911621094, 0.02191162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 6.0, 11.0, 17.0, 26.0, 49.0, 58.0, 87.0, 97.0, 112.0, 119.0, 110.0, 81.0, 82.0, 54.0, 39.0, 25.0, 10.0, 3.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.748645305633545, -6.567481994628906, -6.386318206787109, -6.205154895782471, -6.023991584777832, -5.842827796936035, -5.6616644859313965, -5.480501174926758, -5.299337387084961, -5.118174076080322, -4.937010288238525, -4.755846977233887, -4.574683666229248, -4.393520355224609, -4.2123565673828125, -4.031193256378174, -3.850029945373535, -3.6688663959503174, -3.4877030849456787, -3.306539535522461, -3.1253762245178223, -2.9442126750946045, -2.7630491256713867, -2.581885814666748, -2.4007222652435303, -2.2195587158203125, -2.038395404815674, -1.857231855392456, -1.6760684251785278, -1.4949049949645996, -1.3137414455413818, -1.1325780153274536, -0.9514145851135254, -0.7702511548995972, -0.5890876650810242, -0.40792417526245117, -0.22676074504852295, -0.04559731483459473, 0.13556623458862305, 0.31672966480255127, 0.4978930950164795, 0.6790565252304077, 0.8602200150489807, 1.0413835048675537, 1.222546935081482, 1.4037103652954102, 1.584873914718628, 1.7660373449325562, 1.9472007751464844, 2.128364324569702, 2.309527635574341, 2.4906911849975586, 2.6718544960021973, 2.853018045425415, 3.034181594848633, 3.2153449058532715, 3.3965084552764893, 3.577672004699707, 3.7588353157043457, 3.9399988651275635, 4.121162414550781, 4.30232572555542, 4.483489036560059, 4.6646528244018555, 4.845816135406494]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 5.0, 10.0, 21.0, 16.0, 22.0, 21.0, 23.0, 30.0, 34.0, 35.0, 40.0, 42.0, 38.0, 44.0, 48.0, 43.0, 43.0, 39.0, 37.0, 36.0, 41.0, 27.0, 35.0, 34.0, 35.0, 23.0, 18.0, 25.0, 23.0, 16.0, 9.0, 14.0, 5.0, 10.0, 9.0, 7.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.8218719959259033, -2.735198974609375, -2.6485259532928467, -2.5618529319763184, -2.47517991065979, -2.3885068893432617, -2.3018336296081543, -2.215160846710205, -2.1284875869750977, -2.0418145656585693, -1.955141544342041, -1.8684685230255127, -1.7817955017089844, -1.695122480392456, -1.6084493398666382, -1.5217763185501099, -1.435103416442871, -1.3484303951263428, -1.2617573738098145, -1.1750843524932861, -1.0884113311767578, -1.0017383098602295, -0.9150651693344116, -0.8283921480178833, -0.741719126701355, -0.6550461053848267, -0.5683730840682983, -0.48170000314712524, -0.3950269818305969, -0.3083539605140686, -0.2216808795928955, -0.1350078582763672, -0.048334598541259766, 0.03833843767642975, 0.12501147389411926, 0.21168452501296997, 0.2983575463294983, 0.3850305676460266, 0.4717036485671997, 0.558376669883728, 0.6450496912002563, 0.7317227125167847, 0.818395733833313, 0.9050688147544861, 0.9917418360710144, 1.0784149169921875, 1.1650879383087158, 1.2517609596252441, 1.3384339809417725, 1.4251070022583008, 1.511780023574829, 1.5984530448913574, 1.6851260662078857, 1.771799087524414, 1.858472228050232, 1.9451452493667603, 2.031818389892578, 2.1184914112091064, 2.2051644325256348, 2.291837453842163, 2.3785104751586914, 2.4651834964752197, 2.551856517791748, 2.6385297775268555, 2.7252025604248047]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 7.0, 11.0, 21.0, 25.0, 20.0, 51.0, 74.0, 125.0, 182.0, 289.0, 456.0, 776.0, 1384.0, 2275.0, 4503.0, 8769.0, 19064.0, 43174.0, 100931.0, 214778.0, 292768.0, 195680.0, 90182.0, 38462.0, 16907.0, 8090.0, 4206.0, 2182.0, 1275.0, 740.0, 423.0, 240.0, 180.0, 97.0, 64.0, 48.0, 26.0, 20.0, 12.0, 8.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.983642578125, -1.91845703125, -1.853271484375, -1.7880859375, -1.722900390625, -1.65771484375, -1.592529296875, -1.52734375, -1.462158203125, -1.39697265625, -1.331787109375, -1.2666015625, -1.201416015625, -1.13623046875, -1.071044921875, -1.005859375, -0.940673828125, -0.87548828125, -0.810302734375, -0.7451171875, -0.679931640625, -0.61474609375, -0.549560546875, -0.484375, -0.419189453125, -0.35400390625, -0.288818359375, -0.2236328125, -0.158447265625, -0.09326171875, -0.028076171875, 0.037109375, 0.102294921875, 0.16748046875, 0.232666015625, 0.2978515625, 0.363037109375, 0.42822265625, 0.493408203125, 0.55859375, 0.623779296875, 0.68896484375, 0.754150390625, 0.8193359375, 0.884521484375, 0.94970703125, 1.014892578125, 1.080078125, 1.145263671875, 1.21044921875, 1.275634765625, 1.3408203125, 1.406005859375, 1.47119140625, 1.536376953125, 1.6015625, 1.666748046875, 1.73193359375, 1.797119140625, 1.8623046875, 1.927490234375, 1.99267578125, 2.057861328125, 2.123046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 10.0, 11.0, 8.0, 10.0, 6.0, 20.0, 13.0, 13.0, 13.0, 26.0, 32.0, 27.0, 33.0, 34.0, 47.0, 58.0, 43.0, 46.0, 46.0, 38.0, 44.0, 49.0, 33.0, 40.0, 59.0, 38.0, 29.0, 29.0, 23.0, 25.0, 21.0, 19.0, 13.0, 13.0, 11.0, 5.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.21875, -8.95611572265625, -8.6934814453125, -8.43084716796875, -8.168212890625, -7.90557861328125, -7.6429443359375, -7.38031005859375, -7.11767578125, -6.85504150390625, -6.5924072265625, -6.32977294921875, -6.067138671875, -5.80450439453125, -5.5418701171875, -5.27923583984375, -5.0166015625, -4.75396728515625, -4.4913330078125, -4.22869873046875, -3.966064453125, -3.70343017578125, -3.4407958984375, -3.17816162109375, -2.91552734375, -2.65289306640625, -2.3902587890625, -2.12762451171875, -1.864990234375, -1.60235595703125, -1.3397216796875, -1.07708740234375, -0.814453125, -0.55181884765625, -0.2891845703125, -0.02655029296875, 0.236083984375, 0.49871826171875, 0.7613525390625, 1.02398681640625, 1.28662109375, 1.54925537109375, 1.8118896484375, 2.07452392578125, 2.337158203125, 2.59979248046875, 2.8624267578125, 3.12506103515625, 3.3876953125, 3.65032958984375, 3.9129638671875, 4.17559814453125, 4.438232421875, 4.70086669921875, 4.9635009765625, 5.22613525390625, 5.48876953125, 5.75140380859375, 6.0140380859375, 6.27667236328125, 6.539306640625, 6.80194091796875, 7.0645751953125, 7.32720947265625, 7.58984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 5.0, 6.0, 8.0, 5.0, 12.0, 24.0, 26.0, 20.0, 20.0, 29.0, 29.0, 67.0, 73.0, 90.0, 159.0, 282.0, 726.0, 29629.0, 1011862.0, 4252.0, 478.0, 222.0, 123.0, 92.0, 78.0, 37.0, 37.0, 33.0, 25.0, 13.0, 6.0, 10.0, 7.0, 16.0, 8.0, 5.0, 10.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-23.453125, -22.789306640625, -22.12548828125, -21.461669921875, -20.7978515625, -20.134033203125, -19.47021484375, -18.806396484375, -18.142578125, -17.478759765625, -16.81494140625, -16.151123046875, -15.4873046875, -14.823486328125, -14.15966796875, -13.495849609375, -12.83203125, -12.168212890625, -11.50439453125, -10.840576171875, -10.1767578125, -9.512939453125, -8.84912109375, -8.185302734375, -7.521484375, -6.857666015625, -6.19384765625, -5.530029296875, -4.8662109375, -4.202392578125, -3.53857421875, -2.874755859375, -2.2109375, -1.547119140625, -0.88330078125, -0.219482421875, 0.4443359375, 1.108154296875, 1.77197265625, 2.435791015625, 3.099609375, 3.763427734375, 4.42724609375, 5.091064453125, 5.7548828125, 6.418701171875, 7.08251953125, 7.746337890625, 8.41015625, 9.073974609375, 9.73779296875, 10.401611328125, 11.0654296875, 11.729248046875, 12.39306640625, 13.056884765625, 13.720703125, 14.384521484375, 15.04833984375, 15.712158203125, 16.3759765625, 17.039794921875, 17.70361328125, 18.367431640625, 19.03125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 14.0, 21.0, 18.0, 15.0, 27.0, 20.0, 22.0, 43.0, 36.0, 36.0, 33.0, 53.0, 46.0, 51.0, 51.0, 63.0, 49.0, 56.0, 35.0, 36.0, 32.0, 34.0, 25.0, 22.0, 31.0, 16.0, 7.0, 7.0, 13.0, 8.0, 6.0, 10.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.609375, -9.32958984375, -9.0498046875, -8.77001953125, -8.490234375, -8.21044921875, -7.9306640625, -7.65087890625, -7.37109375, -7.09130859375, -6.8115234375, -6.53173828125, -6.251953125, -5.97216796875, -5.6923828125, -5.41259765625, -5.1328125, -4.85302734375, -4.5732421875, -4.29345703125, -4.013671875, -3.73388671875, -3.4541015625, -3.17431640625, -2.89453125, -2.61474609375, -2.3349609375, -2.05517578125, -1.775390625, -1.49560546875, -1.2158203125, -0.93603515625, -0.65625, -0.37646484375, -0.0966796875, 0.18310546875, 0.462890625, 0.74267578125, 1.0224609375, 1.30224609375, 1.58203125, 1.86181640625, 2.1416015625, 2.42138671875, 2.701171875, 2.98095703125, 3.2607421875, 3.54052734375, 3.8203125, 4.10009765625, 4.3798828125, 4.65966796875, 4.939453125, 5.21923828125, 5.4990234375, 5.77880859375, 6.05859375, 6.33837890625, 6.6181640625, 6.89794921875, 7.177734375, 7.45751953125, 7.7373046875, 8.01708984375, 8.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 10.0, 9.0, 5.0, 15.0, 20.0, 46.0, 54.0, 74.0, 132.0, 213.0, 636.0, 3333.0, 89107.0, 926992.0, 25162.0, 1815.0, 420.0, 172.0, 120.0, 72.0, 45.0, 23.0, 17.0, 14.0, 13.0, 6.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.392578125, -3.28082275390625, -3.1690673828125, -3.05731201171875, -2.945556640625, -2.83380126953125, -2.7220458984375, -2.61029052734375, -2.49853515625, -2.38677978515625, -2.2750244140625, -2.16326904296875, -2.051513671875, -1.93975830078125, -1.8280029296875, -1.71624755859375, -1.6044921875, -1.49273681640625, -1.3809814453125, -1.26922607421875, -1.157470703125, -1.04571533203125, -0.9339599609375, -0.82220458984375, -0.71044921875, -0.59869384765625, -0.4869384765625, -0.37518310546875, -0.263427734375, -0.15167236328125, -0.0399169921875, 0.07183837890625, 0.18359375, 0.29534912109375, 0.4071044921875, 0.51885986328125, 0.630615234375, 0.74237060546875, 0.8541259765625, 0.96588134765625, 1.07763671875, 1.18939208984375, 1.3011474609375, 1.41290283203125, 1.524658203125, 1.63641357421875, 1.7481689453125, 1.85992431640625, 1.9716796875, 2.08343505859375, 2.1951904296875, 2.30694580078125, 2.418701171875, 2.53045654296875, 2.6422119140625, 2.75396728515625, 2.86572265625, 2.97747802734375, 3.0892333984375, 3.20098876953125, 3.312744140625, 3.42449951171875, 3.5362548828125, 3.64801025390625, 3.759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 12.0, 13.0, 8.0, 18.0, 34.0, 34.0, 56.0, 73.0, 75.0, 110.0, 105.0, 86.0, 103.0, 60.0, 44.0, 48.0, 22.0, 27.0, 20.0, 12.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000213623046875, -0.00020686909556388855, -0.0002001151442527771, -0.00019336119294166565, -0.0001866072416305542, -0.00017985329031944275, -0.0001730993390083313, -0.00016634538769721985, -0.0001595914363861084, -0.00015283748507499695, -0.0001460835337638855, -0.00013932958245277405, -0.0001325756311416626, -0.00012582167983055115, -0.0001190677285194397, -0.00011231377720832825, -0.0001055598258972168, -9.880587458610535e-05, -9.20519232749939e-05, -8.529797196388245e-05, -7.8544020652771e-05, -7.179006934165955e-05, -6.50361180305481e-05, -5.8282166719436646e-05, -5.1528215408325195e-05, -4.4774264097213745e-05, -3.8020312786102295e-05, -3.1266361474990845e-05, -2.4512410163879395e-05, -1.7758458852767944e-05, -1.1004507541656494e-05, -4.250556230545044e-06, 2.5033950805664062e-06, 9.257346391677856e-06, 1.6011297702789307e-05, 2.2765249013900757e-05, 2.9519200325012207e-05, 3.627315163612366e-05, 4.302710294723511e-05, 4.978105425834656e-05, 5.653500556945801e-05, 6.328895688056946e-05, 7.004290819168091e-05, 7.679685950279236e-05, 8.355081081390381e-05, 9.030476212501526e-05, 9.705871343612671e-05, 0.00010381266474723816, 0.00011056661605834961, 0.00011732056736946106, 0.0001240745186805725, 0.00013082846999168396, 0.0001375824213027954, 0.00014433637261390686, 0.0001510903239250183, 0.00015784427523612976, 0.0001645982265472412, 0.00017135217785835266, 0.0001781061291694641, 0.00018486008048057556, 0.000191614031791687, 0.00019836798310279846, 0.0002051219344139099, 0.00021187588572502136, 0.0002186298370361328]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 21.0, 17.0, 45.0, 53.0, 153.0, 354.0, 1641.0, 32139.0, 975824.0, 35878.0, 1686.0, 394.0, 143.0, 76.0, 43.0, 19.0, 21.0, 10.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.730133056640625, -4.59307861328125, -4.456024169921875, -4.3189697265625, -4.181915283203125, -4.04486083984375, -3.907806396484375, -3.770751953125, -3.633697509765625, -3.49664306640625, -3.359588623046875, -3.2225341796875, -3.085479736328125, -2.94842529296875, -2.811370849609375, -2.67431640625, -2.537261962890625, -2.40020751953125, -2.263153076171875, -2.1260986328125, -1.989044189453125, -1.85198974609375, -1.714935302734375, -1.577880859375, -1.440826416015625, -1.30377197265625, -1.166717529296875, -1.0296630859375, -0.892608642578125, -0.75555419921875, -0.618499755859375, -0.4814453125, -0.344390869140625, -0.20733642578125, -0.070281982421875, 0.0667724609375, 0.203826904296875, 0.34088134765625, 0.477935791015625, 0.614990234375, 0.752044677734375, 0.88909912109375, 1.026153564453125, 1.1632080078125, 1.300262451171875, 1.43731689453125, 1.574371337890625, 1.71142578125, 1.848480224609375, 1.98553466796875, 2.122589111328125, 2.2596435546875, 2.396697998046875, 2.53375244140625, 2.670806884765625, 2.807861328125, 2.944915771484375, 3.08197021484375, 3.219024658203125, 3.3560791015625, 3.493133544921875, 3.63018798828125, 3.767242431640625, 3.904296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 12.0, 22.0, 29.0, 71.0, 87.0, 127.0, 158.0, 151.0, 108.0, 79.0, 64.0, 34.0, 21.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.7960739135742188, -0.7664642333984375, -0.7368545532226562, -0.707244873046875, -0.6776351928710938, -0.6480255126953125, -0.6184158325195312, -0.58880615234375, -0.5591964721679688, -0.5295867919921875, -0.49997711181640625, -0.470367431640625, -0.44075775146484375, -0.4111480712890625, -0.38153839111328125, -0.3519287109375, -0.32231903076171875, -0.2927093505859375, -0.26309967041015625, -0.233489990234375, -0.20388031005859375, -0.1742706298828125, -0.14466094970703125, -0.11505126953125, -0.08544158935546875, -0.0558319091796875, -0.02622222900390625, 0.003387451171875, 0.03299713134765625, 0.0626068115234375, 0.09221649169921875, 0.121826171875, 0.15143585205078125, 0.1810455322265625, 0.21065521240234375, 0.240264892578125, 0.26987457275390625, 0.2994842529296875, 0.32909393310546875, 0.35870361328125, 0.38831329345703125, 0.4179229736328125, 0.44753265380859375, 0.477142333984375, 0.5067520141601562, 0.5363616943359375, 0.5659713745117188, 0.5955810546875, 0.6251907348632812, 0.6548004150390625, 0.6844100952148438, 0.714019775390625, 0.7436294555664062, 0.7732391357421875, 0.8028488159179688, 0.83245849609375, 0.8620681762695312, 0.8916778564453125, 0.9212875366210938, 0.950897216796875, 0.9805068969726562, 1.0101165771484375, 1.0397262573242188, 1.0693359375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 11.0, 18.0, 20.0, 26.0, 42.0, 52.0, 53.0, 58.0, 87.0, 87.0, 88.0, 92.0, 87.0, 73.0, 49.0, 46.0, 35.0, 23.0, 15.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.76408576965332, -10.501669883728027, -10.239253997802734, -9.976838111877441, -9.714422225952148, -9.452006340026855, -9.189590454101562, -8.92717456817627, -8.664758682250977, -8.402342796325684, -8.13992691040039, -7.877511024475098, -7.615095138549805, -7.352679252624512, -7.090263366699219, -6.827847480773926, -6.565432071685791, -6.303016185760498, -6.040600299835205, -5.778184413909912, -5.515768527984619, -5.253352642059326, -4.990937232971191, -4.728521347045898, -4.4661054611206055, -4.2036895751953125, -3.9412736892700195, -3.6788578033447266, -3.4164419174194336, -3.1540260314941406, -2.8916103839874268, -2.629194498062134, -2.3667778968811035, -2.1043620109558105, -1.8419461250305176, -1.5795303583145142, -1.3171144723892212, -1.0546985864639282, -0.7922828197479248, -0.5298669338226318, -0.26745104789733887, -0.005035191774368286, 0.2573806643486023, 0.5197964906692505, 0.7822123765945435, 1.0446282625198364, 1.3070440292358398, 1.5694599151611328, 1.8318758010864258, 2.0942916870117188, 2.3567075729370117, 2.6191234588623047, 2.8815393447875977, 3.1439552307128906, 3.4063708782196045, 3.6687867641448975, 3.9312026500701904, 4.193618297576904, 4.456034183502197, 4.71845006942749, 4.980865955352783, 5.243281841278076, 5.505697727203369, 5.768113613128662, 6.030529499053955]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 4.0, 13.0, 10.0, 9.0, 16.0, 16.0, 20.0, 19.0, 25.0, 20.0, 31.0, 22.0, 36.0, 32.0, 45.0, 44.0, 33.0, 46.0, 42.0, 50.0, 30.0, 42.0, 36.0, 27.0, 21.0, 34.0, 35.0, 23.0, 29.0, 23.0, 19.0, 22.0, 27.0, 22.0, 8.0, 8.0, 13.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.694212913513184, -11.369037628173828, -11.043863296508789, -10.718688011169434, -10.393512725830078, -10.068337440490723, -9.743162155151367, -9.417987823486328, -9.092812538146973, -8.767637252807617, -8.442462921142578, -8.117287635803223, -7.792112350463867, -7.466937065124512, -7.1417622566223145, -6.816587448120117, -6.491412162780762, -6.166236877441406, -5.841062068939209, -5.515887260437012, -5.190711975097656, -4.865536689758301, -4.5403618812561035, -4.215187072753906, -3.890011787414551, -3.5648367404937744, -3.239661693572998, -2.9144866466522217, -2.5893115997314453, -2.264136552810669, -1.9389615058898926, -1.6137864589691162, -1.2886123657226562, -0.9634373188018799, -0.6382622718811035, -0.31308722496032715, 0.012087821960449219, 0.3372628688812256, 0.662437915802002, 0.9876129627227783, 1.3127880096435547, 1.637963056564331, 1.9631381034851074, 2.288313150405884, 2.61348819732666, 2.9386632442474365, 3.263838291168213, 3.5890133380889893, 3.9141883850097656, 4.239363670349121, 4.564538478851318, 4.889713287353516, 5.214888572692871, 5.540063858032227, 5.865238666534424, 6.190413475036621, 6.515588760375977, 6.840764045715332, 7.165938854217529, 7.491113662719727, 7.816288948059082, 8.141464233398438, 8.466638565063477, 8.791813850402832, 9.116989135742188]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 3.0, 1.0, 6.0, 10.0, 8.0, 18.0, 14.0, 24.0, 37.0, 41.0, 69.0, 106.0, 140.0, 265.0, 465.0, 1164.0, 3899.0, 19349.0, 139522.0, 1061807.0, 2259843.0, 620578.0, 72017.0, 11013.0, 2410.0, 660.0, 283.0, 147.0, 102.0, 66.0, 47.0, 31.0, 21.0, 19.0, 24.0, 19.0, 14.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.9771728515625, -6.747314453125, -6.5174560546875, -6.28759765625, -6.0577392578125, -5.827880859375, -5.5980224609375, -5.3681640625, -5.1383056640625, -4.908447265625, -4.6785888671875, -4.44873046875, -4.2188720703125, -3.989013671875, -3.7591552734375, -3.529296875, -3.2994384765625, -3.069580078125, -2.8397216796875, -2.60986328125, -2.3800048828125, -2.150146484375, -1.9202880859375, -1.6904296875, -1.4605712890625, -1.230712890625, -1.0008544921875, -0.77099609375, -0.5411376953125, -0.311279296875, -0.0814208984375, 0.1484375, 0.3782958984375, 0.608154296875, 0.8380126953125, 1.06787109375, 1.2977294921875, 1.527587890625, 1.7574462890625, 1.9873046875, 2.2171630859375, 2.447021484375, 2.6768798828125, 2.90673828125, 3.1365966796875, 3.366455078125, 3.5963134765625, 3.826171875, 4.0560302734375, 4.285888671875, 4.5157470703125, 4.74560546875, 4.9754638671875, 5.205322265625, 5.4351806640625, 5.6650390625, 5.8948974609375, 6.124755859375, 6.3546142578125, 6.58447265625, 6.8143310546875, 7.044189453125, 7.2740478515625, 7.50390625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 13.0, 17.0, 17.0, 19.0, 24.0, 23.0, 33.0, 37.0, 41.0, 42.0, 52.0, 42.0, 59.0, 63.0, 42.0, 45.0, 53.0, 46.0, 40.0, 41.0, 39.0, 27.0, 28.0, 29.0, 21.0, 25.0, 18.0, 9.0, 12.0, 7.0, 9.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1640625, -4.02703857421875, -3.8900146484375, -3.75299072265625, -3.615966796875, -3.47894287109375, -3.3419189453125, -3.20489501953125, -3.06787109375, -2.93084716796875, -2.7938232421875, -2.65679931640625, -2.519775390625, -2.38275146484375, -2.2457275390625, -2.10870361328125, -1.9716796875, -1.83465576171875, -1.6976318359375, -1.56060791015625, -1.423583984375, -1.28656005859375, -1.1495361328125, -1.01251220703125, -0.87548828125, -0.73846435546875, -0.6014404296875, -0.46441650390625, -0.327392578125, -0.19036865234375, -0.0533447265625, 0.08367919921875, 0.220703125, 0.35772705078125, 0.4947509765625, 0.63177490234375, 0.768798828125, 0.90582275390625, 1.0428466796875, 1.17987060546875, 1.31689453125, 1.45391845703125, 1.5909423828125, 1.72796630859375, 1.864990234375, 2.00201416015625, 2.1390380859375, 2.27606201171875, 2.4130859375, 2.55010986328125, 2.6871337890625, 2.82415771484375, 2.961181640625, 3.09820556640625, 3.2352294921875, 3.37225341796875, 3.50927734375, 3.64630126953125, 3.7833251953125, 3.92034912109375, 4.057373046875, 4.19439697265625, 4.3314208984375, 4.46844482421875, 4.60546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 6.0, 2.0, 14.0, 12.0, 24.0, 46.0, 73.0, 197.0, 493.0, 2469.0, 3795448.0, 393405.0, 1436.0, 358.0, 136.0, 81.0, 40.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.560302734375, -40.40185546875, -39.243408203125, -38.0849609375, -36.926513671875, -35.76806640625, -34.609619140625, -33.451171875, -32.292724609375, -31.13427734375, -29.975830078125, -28.8173828125, -27.658935546875, -26.50048828125, -25.342041015625, -24.18359375, -23.025146484375, -21.86669921875, -20.708251953125, -19.5498046875, -18.391357421875, -17.23291015625, -16.074462890625, -14.916015625, -13.757568359375, -12.59912109375, -11.440673828125, -10.2822265625, -9.123779296875, -7.96533203125, -6.806884765625, -5.6484375, -4.489990234375, -3.33154296875, -2.173095703125, -1.0146484375, 0.143798828125, 1.30224609375, 2.460693359375, 3.619140625, 4.777587890625, 5.93603515625, 7.094482421875, 8.2529296875, 9.411376953125, 10.56982421875, 11.728271484375, 12.88671875, 14.045166015625, 15.20361328125, 16.362060546875, 17.5205078125, 18.678955078125, 19.83740234375, 20.995849609375, 22.154296875, 23.312744140625, 24.47119140625, 25.629638671875, 26.7880859375, 27.946533203125, 29.10498046875, 30.263427734375, 31.421875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 6.0, 13.0, 18.0, 26.0, 38.0, 35.0, 67.0, 68.0, 101.0, 126.0, 155.0, 195.0, 251.0, 321.0, 385.0, 354.0, 371.0, 334.0, 280.0, 223.0, 173.0, 126.0, 108.0, 62.0, 49.0, 34.0, 20.0, 28.0, 25.0, 15.0, 8.0, 14.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.7605438232421875, -1.706634521484375, -1.6527252197265625, -1.59881591796875, -1.5449066162109375, -1.490997314453125, -1.4370880126953125, -1.3831787109375, -1.3292694091796875, -1.275360107421875, -1.2214508056640625, -1.16754150390625, -1.1136322021484375, -1.059722900390625, -1.0058135986328125, -0.951904296875, -0.8979949951171875, -0.844085693359375, -0.7901763916015625, -0.73626708984375, -0.6823577880859375, -0.628448486328125, -0.5745391845703125, -0.5206298828125, -0.4667205810546875, -0.412811279296875, -0.3589019775390625, -0.30499267578125, -0.2510833740234375, -0.197174072265625, -0.1432647705078125, -0.08935546875, -0.0354461669921875, 0.018463134765625, 0.0723724365234375, 0.12628173828125, 0.1801910400390625, 0.234100341796875, 0.2880096435546875, 0.3419189453125, 0.3958282470703125, 0.449737548828125, 0.5036468505859375, 0.55755615234375, 0.6114654541015625, 0.665374755859375, 0.7192840576171875, 0.773193359375, 0.8271026611328125, 0.881011962890625, 0.9349212646484375, 0.98883056640625, 1.0427398681640625, 1.096649169921875, 1.1505584716796875, 1.2044677734375, 1.2583770751953125, 1.312286376953125, 1.3661956787109375, 1.42010498046875, 1.4740142822265625, 1.527923583984375, 1.5818328857421875, 1.6357421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 10.0, 22.0, 43.0, 56.0, 133.0, 168.0, 159.0, 164.0, 121.0, 79.0, 30.0, 15.0, 9.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.579390048980713, -4.14121675491333, -3.7030434608459473, -3.2648701667785645, -2.8266968727111816, -2.388523817062378, -1.9503505229949951, -1.5121772289276123, -1.0740039348602295, -0.6358306407928467, -0.19765740633010864, 0.2405158281326294, 0.6786891222000122, 1.1168622970581055, 1.5550355911254883, 1.993208885192871, 2.431382179260254, 2.8695554733276367, 3.3077287673950195, 3.7459020614624023, 4.184075355529785, 4.622248649597168, 5.060421943664551, 5.498595237731934, 5.936768531799316, 6.374941825866699, 6.813115119934082, 7.251288414001465, 7.689461708068848, 8.12763500213623, 8.565808296203613, 9.003981590270996, 9.442154884338379, 9.880328178405762, 10.318501472473145, 10.756674766540527, 11.19484806060791, 11.633021354675293, 12.071194648742676, 12.509367942810059, 12.947541236877441, 13.385714530944824, 13.823887825012207, 14.26206111907959, 14.700234413146973, 15.138407707214355, 15.576581001281738, 16.014753341674805, 16.452926635742188, 16.89109992980957, 17.329273223876953, 17.767446517944336, 18.20561981201172, 18.6437931060791, 19.081966400146484, 19.520139694213867, 19.95831298828125, 20.396486282348633, 20.834659576416016, 21.2728328704834, 21.71100616455078, 22.149179458618164, 22.587352752685547, 23.02552604675293, 23.463699340820312]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 7.0, 4.0, 13.0, 12.0, 15.0, 20.0, 21.0, 13.0, 23.0, 16.0, 32.0, 31.0, 31.0, 25.0, 29.0, 40.0, 46.0, 43.0, 30.0, 35.0, 50.0, 42.0, 45.0, 42.0, 37.0, 28.0, 24.0, 21.0, 26.0, 17.0, 22.0, 25.0, 17.0, 10.0, 10.0, 11.0, 11.0, 7.0, 7.0, 10.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.3748116493225098, -3.2615673542022705, -3.1483232975006104, -3.035079002380371, -2.921834707260132, -2.8085904121398926, -2.6953463554382324, -2.582102060317993, -2.468857765197754, -2.3556134700775146, -2.2423694133758545, -2.1291251182556152, -2.015880823135376, -1.9026366472244263, -1.7893924713134766, -1.6761481761932373, -1.5629041194915771, -1.4496599435806274, -1.3364156484603882, -1.2231714725494385, -1.1099271774291992, -0.9966830015182495, -0.8834388256072998, -0.7701945900917053, -0.6569503545761108, -0.5437061190605164, -0.43046191334724426, -0.31721770763397217, -0.20397347211837769, -0.0907292366027832, 0.022514939308166504, 0.135759174823761, 0.24900341033935547, 0.36224764585494995, 0.47549185156822205, 0.5887360572814941, 0.7019802927970886, 0.8152245283126831, 0.9284687042236328, 1.041712999343872, 1.1549571752548218, 1.2682013511657715, 1.3814456462860107, 1.4946898221969604, 1.6079339981079102, 1.7211782932281494, 1.8344224691390991, 1.9476666450500488, 2.060910940170288, 2.1741552352905273, 2.2873992919921875, 2.4006435871124268, 2.513887882232666, 2.627131938934326, 2.7403762340545654, 2.8536205291748047, 2.966864585876465, 3.080108880996704, 3.1933529376983643, 3.3065972328186035, 3.4198415279388428, 3.533085823059082, 3.646329879760742, 3.7595741748809814, 3.8728184700012207]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 17.0, 36.0, 54.0, 84.0, 119.0, 183.0, 374.0, 590.0, 897.0, 1536.0, 2536.0, 4820.0, 14282.0, 128138.0, 683076.0, 181452.0, 18110.0, 5255.0, 2731.0, 1676.0, 982.0, 594.0, 375.0, 238.0, 122.0, 91.0, 55.0, 36.0, 20.0, 14.0, 11.0, 5.0, 5.0, 2.0, 6.0, 3.0, 0.0, 3.0], "bins": [-1.6484375, -1.6078033447265625, -1.567169189453125, -1.5265350341796875, -1.48590087890625, -1.4452667236328125, -1.404632568359375, -1.3639984130859375, -1.3233642578125, -1.2827301025390625, -1.242095947265625, -1.2014617919921875, -1.16082763671875, -1.1201934814453125, -1.079559326171875, -1.0389251708984375, -0.998291015625, -0.9576568603515625, -0.917022705078125, -0.8763885498046875, -0.83575439453125, -0.7951202392578125, -0.754486083984375, -0.7138519287109375, -0.6732177734375, -0.6325836181640625, -0.591949462890625, -0.5513153076171875, -0.51068115234375, -0.4700469970703125, -0.429412841796875, -0.3887786865234375, -0.34814453125, -0.3075103759765625, -0.266876220703125, -0.2262420654296875, -0.18560791015625, -0.1449737548828125, -0.104339599609375, -0.0637054443359375, -0.0230712890625, 0.0175628662109375, 0.058197021484375, 0.0988311767578125, 0.13946533203125, 0.1800994873046875, 0.220733642578125, 0.2613677978515625, 0.302001953125, 0.3426361083984375, 0.383270263671875, 0.4239044189453125, 0.46453857421875, 0.5051727294921875, 0.545806884765625, 0.5864410400390625, 0.6270751953125, 0.6677093505859375, 0.708343505859375, 0.7489776611328125, 0.78961181640625, 0.8302459716796875, 0.870880126953125, 0.9115142822265625, 0.9521484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 5.0, 8.0, 16.0, 12.0, 17.0, 14.0, 16.0, 35.0, 35.0, 36.0, 20.0, 50.0, 42.0, 49.0, 46.0, 54.0, 70.0, 62.0, 48.0, 52.0, 43.0, 39.0, 41.0, 30.0, 32.0, 18.0, 15.0, 19.0, 23.0, 15.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.18792724609375, -2.0906982421875, -1.99346923828125, -1.896240234375, -1.79901123046875, -1.7017822265625, -1.60455322265625, -1.50732421875, -1.41009521484375, -1.3128662109375, -1.21563720703125, -1.118408203125, -1.02117919921875, -0.9239501953125, -0.82672119140625, -0.7294921875, -0.63226318359375, -0.5350341796875, -0.43780517578125, -0.340576171875, -0.24334716796875, -0.1461181640625, -0.04888916015625, 0.04833984375, 0.14556884765625, 0.2427978515625, 0.34002685546875, 0.437255859375, 0.53448486328125, 0.6317138671875, 0.72894287109375, 0.826171875, 0.92340087890625, 1.0206298828125, 1.11785888671875, 1.215087890625, 1.31231689453125, 1.4095458984375, 1.50677490234375, 1.60400390625, 1.70123291015625, 1.7984619140625, 1.89569091796875, 1.992919921875, 2.09014892578125, 2.1873779296875, 2.28460693359375, 2.3818359375, 2.47906494140625, 2.5762939453125, 2.67352294921875, 2.770751953125, 2.86798095703125, 2.9652099609375, 3.06243896484375, 3.15966796875, 3.25689697265625, 3.3541259765625, 3.45135498046875, 3.548583984375, 3.64581298828125, 3.7430419921875, 3.84027099609375, 3.9375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 9.0, 27.0, 27.0, 49.0, 75.0, 119.0, 222.0, 439.0, 905.0, 1781.0, 3606.0, 7392.0, 14966.0, 31104.0, 64726.0, 124038.0, 202728.0, 232767.0, 172379.0, 97242.0, 48562.0, 23269.0, 11147.0, 5474.0, 2703.0, 1330.0, 675.0, 338.0, 150.0, 119.0, 61.0, 42.0, 19.0, 15.0, 5.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.25331878662109375, -0.2446746826171875, -0.23603057861328125, -0.227386474609375, -0.21874237060546875, -0.2100982666015625, -0.20145416259765625, -0.19281005859375, -0.18416595458984375, -0.1755218505859375, -0.16687774658203125, -0.158233642578125, -0.14958953857421875, -0.1409454345703125, -0.13230133056640625, -0.1236572265625, -0.11501312255859375, -0.1063690185546875, -0.09772491455078125, -0.089080810546875, -0.08043670654296875, -0.0717926025390625, -0.06314849853515625, -0.05450439453125, -0.04586029052734375, -0.0372161865234375, -0.02857208251953125, -0.019927978515625, -0.01128387451171875, -0.0026397705078125, 0.00600433349609375, 0.0146484375, 0.02329254150390625, 0.0319366455078125, 0.04058074951171875, 0.049224853515625, 0.05786895751953125, 0.0665130615234375, 0.07515716552734375, 0.08380126953125, 0.09244537353515625, 0.1010894775390625, 0.10973358154296875, 0.118377685546875, 0.12702178955078125, 0.1356658935546875, 0.14430999755859375, 0.1529541015625, 0.16159820556640625, 0.1702423095703125, 0.17888641357421875, 0.187530517578125, 0.19617462158203125, 0.2048187255859375, 0.21346282958984375, 0.22210693359375, 0.23075103759765625, 0.2393951416015625, 0.24803924560546875, 0.256683349609375, 0.26532745361328125, 0.2739715576171875, 0.28261566162109375, 0.291259765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 10.0, 12.0, 10.0, 12.0, 19.0, 14.0, 16.0, 21.0, 32.0, 34.0, 37.0, 34.0, 46.0, 55.0, 67.0, 56.0, 68.0, 67.0, 37.0, 63.0, 26.0, 46.0, 38.0, 36.0, 21.0, 13.0, 16.0, 24.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.369140625, -5.19140625, -5.013671875, -4.8359375, -4.658203125, -4.48046875, -4.302734375, -4.125, -3.947265625, -3.76953125, -3.591796875, -3.4140625, -3.236328125, -3.05859375, -2.880859375, -2.703125, -2.525390625, -2.34765625, -2.169921875, -1.9921875, -1.814453125, -1.63671875, -1.458984375, -1.28125, -1.103515625, -0.92578125, -0.748046875, -0.5703125, -0.392578125, -0.21484375, -0.037109375, 0.140625, 0.318359375, 0.49609375, 0.673828125, 0.8515625, 1.029296875, 1.20703125, 1.384765625, 1.5625, 1.740234375, 1.91796875, 2.095703125, 2.2734375, 2.451171875, 2.62890625, 2.806640625, 2.984375, 3.162109375, 3.33984375, 3.517578125, 3.6953125, 3.873046875, 4.05078125, 4.228515625, 4.40625, 4.583984375, 4.76171875, 4.939453125, 5.1171875, 5.294921875, 5.47265625, 5.650390625, 5.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 7.0, 9.0, 12.0, 18.0, 26.0, 28.0, 42.0, 78.0, 106.0, 159.0, 275.0, 440.0, 702.0, 1214.0, 2505.0, 6270.0, 21068.0, 132440.0, 647862.0, 194091.0, 27470.0, 7612.0, 2872.0, 1414.0, 738.0, 413.0, 252.0, 135.0, 108.0, 43.0, 43.0, 26.0, 28.0, 17.0, 12.0, 9.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08234214782714844, -0.07935714721679688, -0.07637214660644531, -0.07338714599609375, -0.07040214538574219, -0.06741714477539062, -0.06443214416503906, -0.0614471435546875, -0.05846214294433594, -0.055477142333984375, -0.05249214172363281, -0.04950714111328125, -0.04652214050292969, -0.043537139892578125, -0.04055213928222656, -0.037567138671875, -0.03458213806152344, -0.031597137451171875, -0.028612136840820312, -0.02562713623046875, -0.022642135620117188, -0.019657135009765625, -0.016672134399414062, -0.0136871337890625, -0.010702133178710938, -0.007717132568359375, -0.0047321319580078125, -0.00174713134765625, 0.0012378692626953125, 0.004222869873046875, 0.0072078704833984375, 0.01019287109375, 0.013177871704101562, 0.016162872314453125, 0.019147872924804688, 0.02213287353515625, 0.025117874145507812, 0.028102874755859375, 0.031087875366210938, 0.0340728759765625, 0.03705787658691406, 0.040042877197265625, 0.04302787780761719, 0.04601287841796875, 0.04899787902832031, 0.051982879638671875, 0.05496788024902344, 0.057952880859375, 0.06093788146972656, 0.06392288208007812, 0.06690788269042969, 0.06989288330078125, 0.07287788391113281, 0.07586288452148438, 0.07884788513183594, 0.0818328857421875, 0.08481788635253906, 0.08780288696289062, 0.09078788757324219, 0.09377288818359375, 0.09675788879394531, 0.09974288940429688, 0.10272789001464844, 0.105712890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 16.0, 16.0, 21.0, 29.0, 25.0, 47.0, 68.0, 76.0, 93.0, 121.0, 75.0, 83.0, 87.0, 60.0, 53.0, 30.0, 22.0, 18.0, 13.0, 12.0, 3.0, 8.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26173210144043e-05, -4.090741276741028e-05, -3.919750452041626e-05, -3.748759627342224e-05, -3.577768802642822e-05, -3.4067779779434204e-05, -3.2357871532440186e-05, -3.064796328544617e-05, -2.893805503845215e-05, -2.722814679145813e-05, -2.551823854446411e-05, -2.3808330297470093e-05, -2.2098422050476074e-05, -2.0388513803482056e-05, -1.8678605556488037e-05, -1.696869730949402e-05, -1.52587890625e-05, -1.3548880815505981e-05, -1.1838972568511963e-05, -1.0129064321517944e-05, -8.419156074523926e-06, -6.709247827529907e-06, -4.999339580535889e-06, -3.28943133354187e-06, -1.5795230865478516e-06, 1.30385160446167e-07, 1.8402934074401855e-06, 3.550201654434204e-06, 5.260109901428223e-06, 6.970018148422241e-06, 8.67992639541626e-06, 1.0389834642410278e-05, 1.2099742889404297e-05, 1.3809651136398315e-05, 1.5519559383392334e-05, 1.7229467630386353e-05, 1.893937587738037e-05, 2.064928412437439e-05, 2.2359192371368408e-05, 2.4069100618362427e-05, 2.5779008865356445e-05, 2.7488917112350464e-05, 2.9198825359344482e-05, 3.09087336063385e-05, 3.261864185333252e-05, 3.432855010032654e-05, 3.603845834732056e-05, 3.7748366594314575e-05, 3.9458274841308594e-05, 4.116818308830261e-05, 4.287809133529663e-05, 4.458799958229065e-05, 4.629790782928467e-05, 4.8007816076278687e-05, 4.9717724323272705e-05, 5.1427632570266724e-05, 5.313754081726074e-05, 5.484744906425476e-05, 5.655735731124878e-05, 5.82672655582428e-05, 5.9977173805236816e-05, 6.168708205223083e-05, 6.339699029922485e-05, 6.510689854621887e-05, 6.681680679321289e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 13.0, 30.0, 64.0, 187.0, 532.0, 1610.0, 5887.0, 182114.0, 845639.0, 9259.0, 2100.0, 669.0, 250.0, 93.0, 43.0, 13.0, 14.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30625152587890625, -0.2953643798828125, -0.28447723388671875, -0.273590087890625, -0.26270294189453125, -0.2518157958984375, -0.24092864990234375, -0.23004150390625, -0.21915435791015625, -0.2082672119140625, -0.19738006591796875, -0.186492919921875, -0.17560577392578125, -0.1647186279296875, -0.15383148193359375, -0.1429443359375, -0.13205718994140625, -0.1211700439453125, -0.11028289794921875, -0.099395751953125, -0.08850860595703125, -0.0776214599609375, -0.06673431396484375, -0.05584716796875, -0.04496002197265625, -0.0340728759765625, -0.02318572998046875, -0.012298583984375, -0.00141143798828125, 0.0094757080078125, 0.02036285400390625, 0.03125, 0.04213714599609375, 0.0530242919921875, 0.06391143798828125, 0.074798583984375, 0.08568572998046875, 0.0965728759765625, 0.10746002197265625, 0.11834716796875, 0.12923431396484375, 0.1401214599609375, 0.15100860595703125, 0.161895751953125, 0.17278289794921875, 0.1836700439453125, 0.19455718994140625, 0.2054443359375, 0.21633148193359375, 0.2272186279296875, 0.23810577392578125, 0.248992919921875, 0.25988006591796875, 0.2707672119140625, 0.28165435791015625, 0.29254150390625, 0.30342864990234375, 0.3143157958984375, 0.32520294189453125, 0.336090087890625, 0.34697723388671875, 0.3578643798828125, 0.36875152587890625, 0.379638671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 13.0, 17.0, 21.0, 47.0, 59.0, 104.0, 163.0, 180.0, 144.0, 78.0, 52.0, 28.0, 16.0, 11.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026056289672851562, -0.025135040283203125, -0.024213790893554688, -0.02329254150390625, -0.022371292114257812, -0.021450042724609375, -0.020528793334960938, -0.0196075439453125, -0.018686294555664062, -0.017765045166015625, -0.016843795776367188, -0.01592254638671875, -0.015001296997070312, -0.014080047607421875, -0.013158798217773438, -0.012237548828125, -0.011316299438476562, -0.010395050048828125, -0.009473800659179688, -0.00855255126953125, -0.0076313018798828125, -0.006710052490234375, -0.0057888031005859375, -0.0048675537109375, -0.0039463043212890625, -0.003025054931640625, -0.0021038055419921875, -0.00118255615234375, -0.0002613067626953125, 0.000659942626953125, 0.0015811920166015625, 0.00250244140625, 0.0034236907958984375, 0.004344940185546875, 0.0052661895751953125, 0.00618743896484375, 0.0071086883544921875, 0.008029937744140625, 0.008951187133789062, 0.0098724365234375, 0.010793685913085938, 0.011714935302734375, 0.012636184692382812, 0.01355743408203125, 0.014478683471679688, 0.015399932861328125, 0.016321182250976562, 0.017242431640625, 0.018163681030273438, 0.019084930419921875, 0.020006179809570312, 0.02092742919921875, 0.021848678588867188, 0.022769927978515625, 0.023691177368164062, 0.0246124267578125, 0.025533676147460938, 0.026454925537109375, 0.027376174926757812, 0.02829742431640625, 0.029218673706054688, 0.030139923095703125, 0.031061172485351562, 0.031982421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 15.0, 19.0, 19.0, 23.0, 29.0, 55.0, 73.0, 83.0, 72.0, 83.0, 77.0, 81.0, 81.0, 65.0, 66.0, 47.0, 37.0, 18.0, 12.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0147171020507812, -2.890411615371704, -2.766105890274048, -2.6418004035949707, -2.5174946784973145, -2.3931891918182373, -2.268883466720581, -2.144577980041504, -2.0202722549438477, -1.895966649055481, -1.7716610431671143, -1.6473554372787476, -1.5230498313903809, -1.3987443447113037, -1.2744386196136475, -1.1501331329345703, -1.0258275270462036, -0.9015219211578369, -0.7772163152694702, -0.6529107093811035, -0.5286051034927368, -0.4042995572090149, -0.2799939513206482, -0.1556883454322815, -0.031382739543914795, 0.09292285889387131, 0.2172284573316574, 0.3415340483188629, 0.4658396542072296, 0.5901452302932739, 0.7144508361816406, 0.8387564420700073, 0.963062047958374, 1.0873676538467407, 1.2116732597351074, 1.3359788656234741, 1.4602844715118408, 1.584589958190918, 1.7088956832885742, 1.8332011699676514, 1.9575068950653076, 2.0818123817443848, 2.206118106842041, 2.330423593521118, 2.4547293186187744, 2.5790348052978516, 2.703340530395508, 2.827646017074585, 2.951951503753662, 3.0762569904327393, 3.2005627155303955, 3.3248682022094727, 3.449173927307129, 3.573479413986206, 3.6977851390838623, 3.8220906257629395, 3.9463963508605957, 4.070702075958252, 4.19500732421875, 4.319313049316406, 4.4436187744140625, 4.567924499511719, 4.692229747772217, 4.816535472869873, 4.940841197967529]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 8.0, 10.0, 13.0, 11.0, 19.0, 19.0, 24.0, 23.0, 18.0, 28.0, 36.0, 30.0, 32.0, 42.0, 46.0, 49.0, 43.0, 47.0, 48.0, 58.0, 55.0, 43.0, 36.0, 33.0, 23.0, 25.0, 26.0, 26.0, 24.0, 14.0, 12.0, 9.0, 10.0, 10.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.269278049468994, -2.1899757385253906, -2.110673427581787, -2.0313708782196045, -1.952068567276001, -1.8727662563323975, -1.7934638261795044, -1.7141613960266113, -1.6348590850830078, -1.5555567741394043, -1.4762543439865112, -1.3969519138336182, -1.3176496028900146, -1.2383472919464111, -1.159044861793518, -1.079742431640625, -1.0004401206970215, -0.9211377501487732, -0.8418353796005249, -0.7625330090522766, -0.6832306385040283, -0.60392826795578, -0.5246258974075317, -0.44532352685928345, -0.36602115631103516, -0.28671878576278687, -0.20741641521453857, -0.12811404466629028, -0.04881167411804199, 0.0304906964302063, 0.10979306697845459, 0.18909543752670288, 0.26839780807495117, 0.34770017862319946, 0.42700254917144775, 0.506304919719696, 0.5856072902679443, 0.6649096608161926, 0.7442120313644409, 0.8235144019126892, 0.9028167724609375, 0.9821191430091858, 1.061421513557434, 1.1407239437103271, 1.2200262546539307, 1.2993285655975342, 1.3786309957504272, 1.4579334259033203, 1.5372357368469238, 1.6165380477905273, 1.6958404779434204, 1.7751429080963135, 1.854445219039917, 1.9337475299835205, 2.013050079345703, 2.0923523902893066, 2.17165470123291, 2.2509570121765137, 2.330259323120117, 2.4095618724823, 2.4888641834259033, 2.568166494369507, 2.6474690437316895, 2.726771354675293, 2.8060736656188965]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 7.0, 15.0, 19.0, 14.0, 37.0, 52.0, 66.0, 92.0, 136.0, 243.0, 411.0, 743.0, 1245.0, 2101.0, 4051.0, 7320.0, 14065.0, 29786.0, 64835.0, 137096.0, 248483.0, 255580.0, 147124.0, 69903.0, 32365.0, 15253.0, 7882.0, 4109.0, 2307.0, 1302.0, 744.0, 382.0, 275.0, 157.0, 121.0, 57.0, 39.0, 30.0, 21.0, 18.0, 17.0, 12.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0], "bins": [-2.14453125, -2.083343505859375, -2.02215576171875, -1.960968017578125, -1.8997802734375, -1.838592529296875, -1.77740478515625, -1.716217041015625, -1.655029296875, -1.593841552734375, -1.53265380859375, -1.471466064453125, -1.4102783203125, -1.349090576171875, -1.28790283203125, -1.226715087890625, -1.16552734375, -1.104339599609375, -1.04315185546875, -0.981964111328125, -0.9207763671875, -0.859588623046875, -0.79840087890625, -0.737213134765625, -0.676025390625, -0.614837646484375, -0.55364990234375, -0.492462158203125, -0.4312744140625, -0.370086669921875, -0.30889892578125, -0.247711181640625, -0.1865234375, -0.125335693359375, -0.06414794921875, -0.002960205078125, 0.0582275390625, 0.119415283203125, 0.18060302734375, 0.241790771484375, 0.302978515625, 0.364166259765625, 0.42535400390625, 0.486541748046875, 0.5477294921875, 0.608917236328125, 0.67010498046875, 0.731292724609375, 0.79248046875, 0.853668212890625, 0.91485595703125, 0.976043701171875, 1.0372314453125, 1.098419189453125, 1.15960693359375, 1.220794677734375, 1.281982421875, 1.343170166015625, 1.40435791015625, 1.465545654296875, 1.5267333984375, 1.587921142578125, 1.64910888671875, 1.710296630859375, 1.771484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 18.0, 11.0, 18.0, 15.0, 20.0, 14.0, 22.0, 30.0, 35.0, 30.0, 47.0, 41.0, 38.0, 40.0, 53.0, 50.0, 57.0, 47.0, 50.0, 44.0, 35.0, 43.0, 35.0, 16.0, 24.0, 27.0, 23.0, 18.0, 10.0, 8.0, 20.0, 15.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0859375, -4.92730712890625, -4.7686767578125, -4.61004638671875, -4.451416015625, -4.29278564453125, -4.1341552734375, -3.97552490234375, -3.81689453125, -3.65826416015625, -3.4996337890625, -3.34100341796875, -3.182373046875, -3.02374267578125, -2.8651123046875, -2.70648193359375, -2.5478515625, -2.38922119140625, -2.2305908203125, -2.07196044921875, -1.913330078125, -1.75469970703125, -1.5960693359375, -1.43743896484375, -1.27880859375, -1.12017822265625, -0.9615478515625, -0.80291748046875, -0.644287109375, -0.48565673828125, -0.3270263671875, -0.16839599609375, -0.009765625, 0.14886474609375, 0.3074951171875, 0.46612548828125, 0.624755859375, 0.78338623046875, 0.9420166015625, 1.10064697265625, 1.25927734375, 1.41790771484375, 1.5765380859375, 1.73516845703125, 1.893798828125, 2.05242919921875, 2.2110595703125, 2.36968994140625, 2.5283203125, 2.68695068359375, 2.8455810546875, 3.00421142578125, 3.162841796875, 3.32147216796875, 3.4801025390625, 3.63873291015625, 3.79736328125, 3.95599365234375, 4.1146240234375, 4.27325439453125, 4.431884765625, 4.59051513671875, 4.7491455078125, 4.90777587890625, 5.06640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 13.0, 9.0, 10.0, 14.0, 24.0, 21.0, 30.0, 32.0, 56.0, 60.0, 98.0, 153.0, 231.0, 633.0, 26660.0, 1009278.0, 9996.0, 475.0, 206.0, 129.0, 79.0, 52.0, 57.0, 48.0, 36.0, 22.0, 26.0, 22.0, 12.0, 3.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.078125, -18.470703125, -17.86328125, -17.255859375, -16.6484375, -16.041015625, -15.43359375, -14.826171875, -14.21875, -13.611328125, -13.00390625, -12.396484375, -11.7890625, -11.181640625, -10.57421875, -9.966796875, -9.359375, -8.751953125, -8.14453125, -7.537109375, -6.9296875, -6.322265625, -5.71484375, -5.107421875, -4.5, -3.892578125, -3.28515625, -2.677734375, -2.0703125, -1.462890625, -0.85546875, -0.248046875, 0.359375, 0.966796875, 1.57421875, 2.181640625, 2.7890625, 3.396484375, 4.00390625, 4.611328125, 5.21875, 5.826171875, 6.43359375, 7.041015625, 7.6484375, 8.255859375, 8.86328125, 9.470703125, 10.078125, 10.685546875, 11.29296875, 11.900390625, 12.5078125, 13.115234375, 13.72265625, 14.330078125, 14.9375, 15.544921875, 16.15234375, 16.759765625, 17.3671875, 17.974609375, 18.58203125, 19.189453125, 19.796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 15.0, 17.0, 17.0, 18.0, 15.0, 20.0, 25.0, 24.0, 28.0, 34.0, 35.0, 35.0, 41.0, 45.0, 49.0, 55.0, 46.0, 52.0, 45.0, 42.0, 40.0, 29.0, 38.0, 33.0, 32.0, 20.0, 27.0, 16.0, 20.0, 12.0, 8.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.38665771484375, -4.2342529296875, -4.08184814453125, -3.929443359375, -3.77703857421875, -3.6246337890625, -3.47222900390625, -3.31982421875, -3.16741943359375, -3.0150146484375, -2.86260986328125, -2.710205078125, -2.55780029296875, -2.4053955078125, -2.25299072265625, -2.1005859375, -1.94818115234375, -1.7957763671875, -1.64337158203125, -1.490966796875, -1.33856201171875, -1.1861572265625, -1.03375244140625, -0.88134765625, -0.72894287109375, -0.5765380859375, -0.42413330078125, -0.271728515625, -0.11932373046875, 0.0330810546875, 0.18548583984375, 0.337890625, 0.49029541015625, 0.6427001953125, 0.79510498046875, 0.947509765625, 1.09991455078125, 1.2523193359375, 1.40472412109375, 1.55712890625, 1.70953369140625, 1.8619384765625, 2.01434326171875, 2.166748046875, 2.31915283203125, 2.4715576171875, 2.62396240234375, 2.7763671875, 2.92877197265625, 3.0811767578125, 3.23358154296875, 3.385986328125, 3.53839111328125, 3.6907958984375, 3.84320068359375, 3.99560546875, 4.14801025390625, 4.3004150390625, 4.45281982421875, 4.605224609375, 4.75762939453125, 4.9100341796875, 5.06243896484375, 5.21484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 7.0, 11.0, 15.0, 17.0, 31.0, 41.0, 58.0, 127.0, 342.0, 1225.0, 9220.0, 465741.0, 558655.0, 11094.0, 1267.0, 337.0, 124.0, 65.0, 35.0, 31.0, 15.0, 16.0, 13.0, 9.0, 1.0, 6.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.404296875, -3.298004150390625, -3.19171142578125, -3.085418701171875, -2.9791259765625, -2.872833251953125, -2.76654052734375, -2.660247802734375, -2.553955078125, -2.447662353515625, -2.34136962890625, -2.235076904296875, -2.1287841796875, -2.022491455078125, -1.91619873046875, -1.809906005859375, -1.70361328125, -1.597320556640625, -1.49102783203125, -1.384735107421875, -1.2784423828125, -1.172149658203125, -1.06585693359375, -0.959564208984375, -0.853271484375, -0.746978759765625, -0.64068603515625, -0.534393310546875, -0.4281005859375, -0.321807861328125, -0.21551513671875, -0.109222412109375, -0.0029296875, 0.103363037109375, 0.20965576171875, 0.315948486328125, 0.4222412109375, 0.528533935546875, 0.63482666015625, 0.741119384765625, 0.847412109375, 0.953704833984375, 1.05999755859375, 1.166290283203125, 1.2725830078125, 1.378875732421875, 1.48516845703125, 1.591461181640625, 1.69775390625, 1.804046630859375, 1.91033935546875, 2.016632080078125, 2.1229248046875, 2.229217529296875, 2.33551025390625, 2.441802978515625, 2.548095703125, 2.654388427734375, 2.76068115234375, 2.866973876953125, 2.9732666015625, 3.079559326171875, 3.18585205078125, 3.292144775390625, 3.3984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 19.0, 11.0, 34.0, 39.0, 39.0, 56.0, 80.0, 71.0, 74.0, 79.0, 81.0, 77.0, 72.0, 61.0, 42.0, 37.0, 19.0, 22.0, 19.0, 6.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002384185791015625, -0.00023208186030387878, -0.00022574514150619507, -0.00021940842270851135, -0.00021307170391082764, -0.00020673498511314392, -0.0002003982663154602, -0.0001940615475177765, -0.00018772482872009277, -0.00018138810992240906, -0.00017505139112472534, -0.00016871467232704163, -0.0001623779535293579, -0.0001560412347316742, -0.00014970451593399048, -0.00014336779713630676, -0.00013703107833862305, -0.00013069435954093933, -0.00012435764074325562, -0.0001180209219455719, -0.00011168420314788818, -0.00010534748435020447, -9.901076555252075e-05, -9.267404675483704e-05, -8.633732795715332e-05, -8.00006091594696e-05, -7.366389036178589e-05, -6.732717156410217e-05, -6.099045276641846e-05, -5.465373396873474e-05, -4.8317015171051025e-05, -4.198029637336731e-05, -3.5643577575683594e-05, -2.9306858777999878e-05, -2.2970139980316162e-05, -1.6633421182632446e-05, -1.029670238494873e-05, -3.959983587265015e-06, 2.376735210418701e-06, 8.713454008102417e-06, 1.5050172805786133e-05, 2.138689160346985e-05, 2.7723610401153564e-05, 3.406032919883728e-05, 4.0397047996520996e-05, 4.673376679420471e-05, 5.307048559188843e-05, 5.9407204389572144e-05, 6.574392318725586e-05, 7.208064198493958e-05, 7.841736078262329e-05, 8.475407958030701e-05, 9.109079837799072e-05, 9.742751717567444e-05, 0.00010376423597335815, 0.00011010095477104187, 0.00011643767356872559, 0.0001227743923664093, 0.00012911111116409302, 0.00013544782996177673, 0.00014178454875946045, 0.00014812126755714417, 0.00015445798635482788, 0.0001607947051525116, 0.0001671314239501953]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 15.0, 23.0, 41.0, 56.0, 115.0, 266.0, 841.0, 3937.0, 70290.0, 905479.0, 62335.0, 3783.0, 818.0, 270.0, 109.0, 44.0, 51.0, 24.0, 15.0, 6.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2265625, -3.12408447265625, -3.0216064453125, -2.91912841796875, -2.816650390625, -2.71417236328125, -2.6116943359375, -2.50921630859375, -2.40673828125, -2.30426025390625, -2.2017822265625, -2.09930419921875, -1.996826171875, -1.89434814453125, -1.7918701171875, -1.68939208984375, -1.5869140625, -1.48443603515625, -1.3819580078125, -1.27947998046875, -1.177001953125, -1.07452392578125, -0.9720458984375, -0.86956787109375, -0.76708984375, -0.66461181640625, -0.5621337890625, -0.45965576171875, -0.357177734375, -0.25469970703125, -0.1522216796875, -0.04974365234375, 0.052734375, 0.15521240234375, 0.2576904296875, 0.36016845703125, 0.462646484375, 0.56512451171875, 0.6676025390625, 0.77008056640625, 0.87255859375, 0.97503662109375, 1.0775146484375, 1.17999267578125, 1.282470703125, 1.38494873046875, 1.4874267578125, 1.58990478515625, 1.6923828125, 1.79486083984375, 1.8973388671875, 1.99981689453125, 2.102294921875, 2.20477294921875, 2.3072509765625, 2.40972900390625, 2.51220703125, 2.61468505859375, 2.7171630859375, 2.81964111328125, 2.922119140625, 3.02459716796875, 3.1270751953125, 3.22955322265625, 3.33203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 26.0, 41.0, 66.0, 96.0, 123.0, 144.0, 156.0, 105.0, 81.0, 47.0, 26.0, 23.0, 21.0, 9.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.986328125, -0.95526123046875, -0.9241943359375, -0.89312744140625, -0.862060546875, -0.83099365234375, -0.7999267578125, -0.76885986328125, -0.73779296875, -0.70672607421875, -0.6756591796875, -0.64459228515625, -0.613525390625, -0.58245849609375, -0.5513916015625, -0.52032470703125, -0.4892578125, -0.45819091796875, -0.4271240234375, -0.39605712890625, -0.364990234375, -0.33392333984375, -0.3028564453125, -0.27178955078125, -0.24072265625, -0.20965576171875, -0.1785888671875, -0.14752197265625, -0.116455078125, -0.08538818359375, -0.0543212890625, -0.02325439453125, 0.0078125, 0.03887939453125, 0.0699462890625, 0.10101318359375, 0.132080078125, 0.16314697265625, 0.1942138671875, 0.22528076171875, 0.25634765625, 0.28741455078125, 0.3184814453125, 0.34954833984375, 0.380615234375, 0.41168212890625, 0.4427490234375, 0.47381591796875, 0.5048828125, 0.53594970703125, 0.5670166015625, 0.59808349609375, 0.629150390625, 0.66021728515625, 0.6912841796875, 0.72235107421875, 0.75341796875, 0.78448486328125, 0.8155517578125, 0.84661865234375, 0.877685546875, 0.90875244140625, 0.9398193359375, 0.97088623046875, 1.001953125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 16.0, 23.0, 78.0, 162.0, 246.0, 208.0, 185.0, 65.0, 21.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.61861038208008, -35.89997863769531, -35.18135070800781, -34.46271896362305, -33.74409103393555, -33.02545928955078, -32.30683135986328, -31.588199615478516, -30.869569778442383, -30.15093994140625, -29.432310104370117, -28.713680267333984, -27.99504852294922, -27.276418685913086, -26.557788848876953, -25.83915901184082, -25.120529174804688, -24.401899337768555, -23.683269500732422, -22.964637756347656, -22.246007919311523, -21.52737808227539, -20.808748245239258, -20.090118408203125, -19.37148666381836, -18.652856826782227, -17.934226989746094, -17.215595245361328, -16.496965408325195, -15.778335571289062, -15.05970573425293, -14.341075897216797, -13.622445106506348, -12.903815269470215, -12.185184478759766, -11.466554641723633, -10.7479248046875, -10.029294967651367, -9.310664176940918, -8.592034339904785, -7.873404026031494, -7.154773712158203, -6.43614387512207, -5.717513561248779, -4.998883247375488, -4.2802534103393555, -3.5616230964660645, -2.8429932594299316, -2.1243629455566406, -1.4057328701019287, -0.6871026754379272, 0.03152751922607422, 0.7501575946807861, 1.468787670135498, 2.187417984008789, 2.906047821044922, 3.624678134918213, 4.343308448791504, 5.061938285827637, 5.780568599700928, 6.499198913574219, 7.217828750610352, 7.936459064483643, 8.655088424682617, 9.373719215393066]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 17.0, 10.0, 15.0, 16.0, 18.0, 26.0, 27.0, 29.0, 33.0, 45.0, 34.0, 54.0, 44.0, 47.0, 44.0, 47.0, 50.0, 51.0, 42.0, 45.0, 44.0, 45.0, 41.0, 31.0, 24.0, 23.0, 21.0, 16.0, 6.0, 8.0, 9.0, 7.0, 11.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.641238689422607, -6.403675556182861, -6.166112899780273, -5.928549766540527, -5.690986633300781, -5.453423976898193, -5.215860843658447, -4.978298187255859, -4.740735054016113, -4.503171920776367, -4.265609264373779, -4.028046131134033, -3.790483236312866, -3.552920341491699, -3.315357208251953, -3.077794313430786, -2.840231418609619, -2.602668523788452, -2.365105628967285, -2.127542495727539, -1.889979600906372, -1.652416706085205, -1.4148536920547485, -1.177290678024292, -0.939727783203125, -0.7021648287773132, -0.46460187435150146, -0.2270389199256897, 0.01052403450012207, 0.24808692932128906, 0.4856499433517456, 0.7232129573822021, 0.9607763290405273, 1.1983392238616943, 1.4359022378921509, 1.6734652519226074, 1.9110281467437744, 2.1485910415649414, 2.3861541748046875, 2.6237170696258545, 2.8612799644470215, 3.0988428592681885, 3.3364057540893555, 3.5739688873291016, 3.8115317821502686, 4.0490946769714355, 4.286657810211182, 4.5242204666137695, 4.761783599853516, 4.999346733093262, 5.23690938949585, 5.474472522735596, 5.712035179138184, 5.94959831237793, 6.187161445617676, 6.424724578857422, 6.66228723526001, 6.899850368499756, 7.137413024902344, 7.37497615814209, 7.612539291381836, 7.850101947784424, 8.087664604187012, 8.325227737426758, 8.562790870666504]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 19.0, 16.0, 35.0, 45.0, 48.0, 67.0, 125.0, 197.0, 258.0, 577.0, 1721.0, 9056.0, 81838.0, 870989.0, 2450739.0, 701835.0, 66051.0, 7794.0, 1552.0, 501.0, 241.0, 189.0, 115.0, 72.0, 52.0, 38.0, 24.0, 17.0, 15.0, 15.0, 6.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.707763671875, -7.47021484375, -7.232666015625, -6.9951171875, -6.757568359375, -6.52001953125, -6.282470703125, -6.044921875, -5.807373046875, -5.56982421875, -5.332275390625, -5.0947265625, -4.857177734375, -4.61962890625, -4.382080078125, -4.14453125, -3.906982421875, -3.66943359375, -3.431884765625, -3.1943359375, -2.956787109375, -2.71923828125, -2.481689453125, -2.244140625, -2.006591796875, -1.76904296875, -1.531494140625, -1.2939453125, -1.056396484375, -0.81884765625, -0.581298828125, -0.34375, -0.106201171875, 0.13134765625, 0.368896484375, 0.6064453125, 0.843994140625, 1.08154296875, 1.319091796875, 1.556640625, 1.794189453125, 2.03173828125, 2.269287109375, 2.5068359375, 2.744384765625, 2.98193359375, 3.219482421875, 3.45703125, 3.694580078125, 3.93212890625, 4.169677734375, 4.4072265625, 4.644775390625, 4.88232421875, 5.119873046875, 5.357421875, 5.594970703125, 5.83251953125, 6.070068359375, 6.3076171875, 6.545166015625, 6.78271484375, 7.020263671875, 7.2578125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 7.0, 4.0, 8.0, 7.0, 5.0, 10.0, 9.0, 19.0, 13.0, 18.0, 19.0, 20.0, 20.0, 40.0, 24.0, 25.0, 33.0, 51.0, 47.0, 40.0, 38.0, 55.0, 39.0, 39.0, 43.0, 42.0, 51.0, 32.0, 39.0, 28.0, 29.0, 25.0, 29.0, 18.0, 17.0, 9.0, 12.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3828125, -3.272735595703125, -3.16265869140625, -3.052581787109375, -2.9425048828125, -2.832427978515625, -2.72235107421875, -2.612274169921875, -2.502197265625, -2.392120361328125, -2.28204345703125, -2.171966552734375, -2.0618896484375, -1.951812744140625, -1.84173583984375, -1.731658935546875, -1.62158203125, -1.511505126953125, -1.40142822265625, -1.291351318359375, -1.1812744140625, -1.071197509765625, -0.96112060546875, -0.851043701171875, -0.740966796875, -0.630889892578125, -0.52081298828125, -0.410736083984375, -0.3006591796875, -0.190582275390625, -0.08050537109375, 0.029571533203125, 0.1396484375, 0.249725341796875, 0.35980224609375, 0.469879150390625, 0.5799560546875, 0.690032958984375, 0.80010986328125, 0.910186767578125, 1.020263671875, 1.130340576171875, 1.24041748046875, 1.350494384765625, 1.4605712890625, 1.570648193359375, 1.68072509765625, 1.790802001953125, 1.90087890625, 2.010955810546875, 2.12103271484375, 2.231109619140625, 2.3411865234375, 2.451263427734375, 2.56134033203125, 2.671417236328125, 2.781494140625, 2.891571044921875, 3.00164794921875, 3.111724853515625, 3.2218017578125, 3.331878662109375, 3.44195556640625, 3.552032470703125, 3.662109375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 14.0, 10.0, 18.0, 24.0, 36.0, 57.0, 99.0, 163.0, 292.0, 580.0, 1585.0, 10450.0, 490817.0, 3602586.0, 81371.0, 4194.0, 975.0, 409.0, 218.0, 134.0, 69.0, 58.0, 44.0, 24.0, 14.0, 9.0, 9.0, 7.0, 11.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.6640625, -15.275390625, -14.88671875, -14.498046875, -14.109375, -13.720703125, -13.33203125, -12.943359375, -12.5546875, -12.166015625, -11.77734375, -11.388671875, -11.0, -10.611328125, -10.22265625, -9.833984375, -9.4453125, -9.056640625, -8.66796875, -8.279296875, -7.890625, -7.501953125, -7.11328125, -6.724609375, -6.3359375, -5.947265625, -5.55859375, -5.169921875, -4.78125, -4.392578125, -4.00390625, -3.615234375, -3.2265625, -2.837890625, -2.44921875, -2.060546875, -1.671875, -1.283203125, -0.89453125, -0.505859375, -0.1171875, 0.271484375, 0.66015625, 1.048828125, 1.4375, 1.826171875, 2.21484375, 2.603515625, 2.9921875, 3.380859375, 3.76953125, 4.158203125, 4.546875, 4.935546875, 5.32421875, 5.712890625, 6.1015625, 6.490234375, 6.87890625, 7.267578125, 7.65625, 8.044921875, 8.43359375, 8.822265625, 9.2109375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 5.0, 12.0, 20.0, 25.0, 26.0, 39.0, 43.0, 61.0, 88.0, 133.0, 160.0, 196.0, 296.0, 356.0, 371.0, 395.0, 391.0, 348.0, 245.0, 206.0, 166.0, 117.0, 97.0, 68.0, 46.0, 32.0, 35.0, 17.0, 18.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.529296875, -1.4757843017578125, -1.422271728515625, -1.3687591552734375, -1.31524658203125, -1.2617340087890625, -1.208221435546875, -1.1547088623046875, -1.1011962890625, -1.0476837158203125, -0.994171142578125, -0.9406585693359375, -0.88714599609375, -0.8336334228515625, -0.780120849609375, -0.7266082763671875, -0.673095703125, -0.6195831298828125, -0.566070556640625, -0.5125579833984375, -0.45904541015625, -0.4055328369140625, -0.352020263671875, -0.2985076904296875, -0.2449951171875, -0.1914825439453125, -0.137969970703125, -0.0844573974609375, -0.03094482421875, 0.0225677490234375, 0.076080322265625, 0.1295928955078125, 0.18310546875, 0.2366180419921875, 0.290130615234375, 0.3436431884765625, 0.39715576171875, 0.4506683349609375, 0.504180908203125, 0.5576934814453125, 0.6112060546875, 0.6647186279296875, 0.718231201171875, 0.7717437744140625, 0.82525634765625, 0.8787689208984375, 0.932281494140625, 0.9857940673828125, 1.039306640625, 1.0928192138671875, 1.146331787109375, 1.1998443603515625, 1.25335693359375, 1.3068695068359375, 1.360382080078125, 1.4138946533203125, 1.4674072265625, 1.5209197998046875, 1.574432373046875, 1.6279449462890625, 1.68145751953125, 1.7349700927734375, 1.788482666015625, 1.8419952392578125, 1.8955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 13.0, 39.0, 58.0, 83.0, 80.0, 139.0, 148.0, 144.0, 109.0, 83.0, 49.0, 25.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.708285331726074, -4.360116481781006, -4.0119476318359375, -3.6637792587280273, -3.315610408782959, -2.9674415588378906, -2.6192729473114014, -2.271104335784912, -1.9229354858398438, -1.574766755104065, -1.2265980243682861, -0.8784292936325073, -0.5302605628967285, -0.1820918321609497, 0.1660768985748291, 0.5142455101013184, 0.8624143600463867, 1.2105830907821655, 1.5587518215179443, 1.9069205522537231, 2.255089282989502, 2.6032581329345703, 2.9514267444610596, 3.299595355987549, 3.647764205932617, 3.9959330558776855, 4.344101905822754, 4.692270278930664, 5.040439128875732, 5.388607978820801, 5.736776351928711, 6.084945201873779, 6.433113098144531, 6.7812819480896, 7.129450798034668, 7.477619171142578, 7.8257880210876465, 8.173956871032715, 8.522125244140625, 8.870294570922852, 9.218462944030762, 9.566631317138672, 9.914800643920898, 10.262969017028809, 10.611137390136719, 10.959306716918945, 11.307475090026855, 11.655643463134766, 12.003812789916992, 12.351981163024902, 12.700150489807129, 13.048318862915039, 13.396488189697266, 13.744656562805176, 14.092824935913086, 14.440994262695312, 14.789162635803223, 15.137331008911133, 15.48550033569336, 15.83366870880127, 16.18183708190918, 16.530006408691406, 16.878175735473633, 17.226343154907227, 17.574512481689453]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 5.0, 10.0, 11.0, 17.0, 16.0, 20.0, 18.0, 15.0, 30.0, 25.0, 27.0, 31.0, 26.0, 27.0, 38.0, 38.0, 31.0, 49.0, 33.0, 38.0, 43.0, 38.0, 40.0, 30.0, 49.0, 37.0, 34.0, 21.0, 28.0, 27.0, 18.0, 13.0, 13.0, 13.0, 17.0, 13.0, 7.0, 11.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.094571113586426, -3.9765985012054443, -3.858625650405884, -3.7406530380249023, -3.622680187225342, -3.5047075748443604, -3.3867347240448, -3.2687621116638184, -3.150789260864258, -3.0328166484832764, -2.914843797683716, -2.7968711853027344, -2.678898334503174, -2.5609257221221924, -2.442952871322632, -2.3249802589416504, -2.20700740814209, -2.0890347957611084, -1.9710619449615479, -1.8530892133712769, -1.7351164817810059, -1.6171438694000244, -1.4991710186004639, -1.3811984062194824, -1.263225793838501, -1.14525306224823, -1.027280330657959, -0.909307599067688, -0.791334867477417, -0.6733621954917908, -0.5553894639015198, -0.4374167323112488, -0.319443941116333, -0.201471209526062, -0.08349849283695221, 0.03447422385215759, 0.1524469554424286, 0.2704196572303772, 0.3883923888206482, 0.5063651204109192, 0.6243378520011902, 0.7423105835914612, 0.8602833151817322, 0.9782559871673584, 1.0962287187576294, 1.2142014503479004, 1.3321741819381714, 1.4501469135284424, 1.5681196451187134, 1.6860923767089844, 1.8040651082992554, 1.9220378398895264, 2.040010452270508, 2.1579833030700684, 2.27595591545105, 2.3939287662506104, 2.511901378631592, 2.6298739910125732, 2.747846841812134, 2.8658194541931152, 2.983792304992676, 3.1017649173736572, 3.2197377681732178, 3.337710380554199, 3.4556832313537598]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 17.0, 8.0, 31.0, 70.0, 113.0, 293.0, 817.0, 2616.0, 28090.0, 904667.0, 105867.0, 4161.0, 1130.0, 383.0, 140.0, 77.0, 30.0, 12.0, 9.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6875, -1.60577392578125, -1.5240478515625, -1.44232177734375, -1.360595703125, -1.27886962890625, -1.1971435546875, -1.11541748046875, -1.03369140625, -0.95196533203125, -0.8702392578125, -0.78851318359375, -0.706787109375, -0.62506103515625, -0.5433349609375, -0.46160888671875, -0.3798828125, -0.29815673828125, -0.2164306640625, -0.13470458984375, -0.052978515625, 0.02874755859375, 0.1104736328125, 0.19219970703125, 0.27392578125, 0.35565185546875, 0.4373779296875, 0.51910400390625, 0.600830078125, 0.68255615234375, 0.7642822265625, 0.84600830078125, 0.927734375, 1.00946044921875, 1.0911865234375, 1.17291259765625, 1.254638671875, 1.33636474609375, 1.4180908203125, 1.49981689453125, 1.58154296875, 1.66326904296875, 1.7449951171875, 1.82672119140625, 1.908447265625, 1.99017333984375, 2.0718994140625, 2.15362548828125, 2.2353515625, 2.31707763671875, 2.3988037109375, 2.48052978515625, 2.562255859375, 2.64398193359375, 2.7257080078125, 2.80743408203125, 2.88916015625, 2.97088623046875, 3.0526123046875, 3.13433837890625, 3.216064453125, 3.29779052734375, 3.3795166015625, 3.46124267578125, 3.54296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 21.0, 37.0, 30.0, 46.0, 57.0, 85.0, 75.0, 110.0, 100.0, 106.0, 102.0, 62.0, 60.0, 26.0, 36.0, 16.0, 8.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.72906494140625, -2.5479736328125, -2.36688232421875, -2.185791015625, -2.00469970703125, -1.8236083984375, -1.64251708984375, -1.46142578125, -1.28033447265625, -1.0992431640625, -0.91815185546875, -0.737060546875, -0.55596923828125, -0.3748779296875, -0.19378662109375, -0.0126953125, 0.16839599609375, 0.3494873046875, 0.53057861328125, 0.711669921875, 0.89276123046875, 1.0738525390625, 1.25494384765625, 1.43603515625, 1.61712646484375, 1.7982177734375, 1.97930908203125, 2.160400390625, 2.34149169921875, 2.5225830078125, 2.70367431640625, 2.884765625, 3.06585693359375, 3.2469482421875, 3.42803955078125, 3.609130859375, 3.79022216796875, 3.9713134765625, 4.15240478515625, 4.33349609375, 4.51458740234375, 4.6956787109375, 4.87677001953125, 5.057861328125, 5.23895263671875, 5.4200439453125, 5.60113525390625, 5.7822265625, 5.96331787109375, 6.1444091796875, 6.32550048828125, 6.506591796875, 6.68768310546875, 6.8687744140625, 7.04986572265625, 7.23095703125, 7.41204833984375, 7.5931396484375, 7.77423095703125, 7.955322265625, 8.13641357421875, 8.3175048828125, 8.49859619140625, 8.6796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 11.0, 17.0, 34.0, 43.0, 81.0, 174.0, 351.0, 717.0, 1593.0, 3718.0, 8812.0, 20570.0, 48460.0, 107675.0, 208792.0, 273954.0, 196187.0, 99365.0, 44586.0, 18920.0, 8165.0, 3406.0, 1532.0, 676.0, 340.0, 156.0, 98.0, 44.0, 30.0, 23.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.39208984375, -0.3816184997558594, -0.37114715576171875, -0.3606758117675781, -0.3502044677734375, -0.3397331237792969, -0.32926177978515625, -0.3187904357910156, -0.308319091796875, -0.2978477478027344, -0.28737640380859375, -0.2769050598144531, -0.2664337158203125, -0.2559623718261719, -0.24549102783203125, -0.23501968383789062, -0.22454833984375, -0.21407699584960938, -0.20360565185546875, -0.19313430786132812, -0.1826629638671875, -0.17219161987304688, -0.16172027587890625, -0.15124893188476562, -0.140777587890625, -0.13030624389648438, -0.11983489990234375, -0.10936355590820312, -0.0988922119140625, -0.08842086791992188, -0.07794952392578125, -0.06747817993164062, -0.0570068359375, -0.046535491943359375, -0.03606414794921875, -0.025592803955078125, -0.0151214599609375, -0.004650115966796875, 0.00582122802734375, 0.016292572021484375, 0.026763916015625, 0.037235260009765625, 0.04770660400390625, 0.058177947998046875, 0.0686492919921875, 0.07912063598632812, 0.08959197998046875, 0.10006332397460938, 0.11053466796875, 0.12100601196289062, 0.13147735595703125, 0.14194869995117188, 0.1524200439453125, 0.16289138793945312, 0.17336273193359375, 0.18383407592773438, 0.194305419921875, 0.20477676391601562, 0.21524810791015625, 0.22571945190429688, 0.2361907958984375, 0.24666213989257812, 0.25713348388671875, 0.2676048278808594, 0.278076171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 12.0, 18.0, 17.0, 27.0, 41.0, 47.0, 45.0, 49.0, 75.0, 77.0, 73.0, 85.0, 69.0, 71.0, 47.0, 62.0, 29.0, 22.0, 37.0, 22.0, 18.0, 19.0, 16.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2952880859375, -8.051513671875, -7.8077392578125, -7.56396484375, -7.3201904296875, -7.076416015625, -6.8326416015625, -6.5888671875, -6.3450927734375, -6.101318359375, -5.8575439453125, -5.61376953125, -5.3699951171875, -5.126220703125, -4.8824462890625, -4.638671875, -4.3948974609375, -4.151123046875, -3.9073486328125, -3.66357421875, -3.4197998046875, -3.176025390625, -2.9322509765625, -2.6884765625, -2.4447021484375, -2.200927734375, -1.9571533203125, -1.71337890625, -1.4696044921875, -1.225830078125, -0.9820556640625, -0.73828125, -0.4945068359375, -0.250732421875, -0.0069580078125, 0.23681640625, 0.4805908203125, 0.724365234375, 0.9681396484375, 1.2119140625, 1.4556884765625, 1.699462890625, 1.9432373046875, 2.18701171875, 2.4307861328125, 2.674560546875, 2.9183349609375, 3.162109375, 3.4058837890625, 3.649658203125, 3.8934326171875, 4.13720703125, 4.3809814453125, 4.624755859375, 4.8685302734375, 5.1123046875, 5.3560791015625, 5.599853515625, 5.8436279296875, 6.08740234375, 6.3311767578125, 6.574951171875, 6.8187255859375, 7.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 7.0, 22.0, 32.0, 63.0, 73.0, 101.0, 177.0, 222.0, 330.0, 557.0, 1045.0, 1970.0, 4215.0, 9830.0, 26109.0, 78896.0, 246837.0, 411647.0, 176697.0, 55720.0, 19348.0, 7522.0, 3274.0, 1599.0, 869.0, 490.0, 301.0, 214.0, 136.0, 83.0, 36.0, 38.0, 21.0, 12.0, 10.0, 8.0, 8.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05169677734375, -0.04999351501464844, -0.048290252685546875, -0.04658699035644531, -0.04488372802734375, -0.04318046569824219, -0.041477203369140625, -0.03977394104003906, -0.0380706787109375, -0.03636741638183594, -0.034664154052734375, -0.03296089172363281, -0.03125762939453125, -0.029554367065429688, -0.027851104736328125, -0.026147842407226562, -0.024444580078125, -0.022741317749023438, -0.021038055419921875, -0.019334793090820312, -0.01763153076171875, -0.015928268432617188, -0.014225006103515625, -0.012521743774414062, -0.0108184814453125, -0.009115219116210938, -0.007411956787109375, -0.0057086944580078125, -0.00400543212890625, -0.0023021697998046875, -0.000598907470703125, 0.0011043548583984375, 0.0028076171875, 0.0045108795166015625, 0.006214141845703125, 0.007917404174804688, 0.00962066650390625, 0.011323928833007812, 0.013027191162109375, 0.014730453491210938, 0.0164337158203125, 0.018136978149414062, 0.019840240478515625, 0.021543502807617188, 0.02324676513671875, 0.024950027465820312, 0.026653289794921875, 0.028356552124023438, 0.030059814453125, 0.03176307678222656, 0.033466339111328125, 0.03516960144042969, 0.03687286376953125, 0.03857612609863281, 0.040279388427734375, 0.04198265075683594, 0.0436859130859375, 0.04538917541503906, 0.047092437744140625, 0.04879570007324219, 0.05049896240234375, 0.05220222473144531, 0.053905487060546875, 0.05560874938964844, 0.05731201171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 8.0, 8.0, 15.0, 20.0, 28.0, 46.0, 49.0, 72.0, 71.0, 100.0, 108.0, 85.0, 92.0, 81.0, 46.0, 44.0, 39.0, 27.0, 15.0, 13.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.802776336669922e-05, -3.6121346056461334e-05, -3.421492874622345e-05, -3.2308511435985565e-05, -3.040209412574768e-05, -2.8495676815509796e-05, -2.658925950527191e-05, -2.4682842195034027e-05, -2.2776424884796143e-05, -2.0870007574558258e-05, -1.8963590264320374e-05, -1.705717295408249e-05, -1.5150755643844604e-05, -1.324433833360672e-05, -1.1337921023368835e-05, -9.431503713130951e-06, -7.525086402893066e-06, -5.618669092655182e-06, -3.7122517824172974e-06, -1.8058344721794128e-06, 1.0058283805847168e-07, 2.007000148296356e-06, 3.913417458534241e-06, 5.819834768772125e-06, 7.72625207901001e-06, 9.632669389247894e-06, 1.1539086699485779e-05, 1.3445504009723663e-05, 1.5351921319961548e-05, 1.7258338630199432e-05, 1.9164755940437317e-05, 2.10711732506752e-05, 2.2977590560913086e-05, 2.488400787115097e-05, 2.6790425181388855e-05, 2.869684249162674e-05, 3.0603259801864624e-05, 3.250967711210251e-05, 3.441609442234039e-05, 3.632251173257828e-05, 3.822892904281616e-05, 4.013534635305405e-05, 4.204176366329193e-05, 4.3948180973529816e-05, 4.58545982837677e-05, 4.7761015594005585e-05, 4.966743290424347e-05, 5.1573850214481354e-05, 5.348026752471924e-05, 5.538668483495712e-05, 5.729310214519501e-05, 5.919951945543289e-05, 6.110593676567078e-05, 6.301235407590866e-05, 6.491877138614655e-05, 6.682518869638443e-05, 6.873160600662231e-05, 7.06380233168602e-05, 7.254444062709808e-05, 7.445085793733597e-05, 7.635727524757385e-05, 7.826369255781174e-05, 8.017010986804962e-05, 8.20765271782875e-05, 8.398294448852539e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 10.0, 5.0, 10.0, 13.0, 19.0, 28.0, 51.0, 90.0, 185.0, 472.0, 1119.0, 3595.0, 17202.0, 168866.0, 738138.0, 102299.0, 12152.0, 2619.0, 920.0, 354.0, 171.0, 88.0, 49.0, 26.0, 20.0, 13.0, 12.0, 5.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134765625, -0.1311626434326172, -0.12755966186523438, -0.12395668029785156, -0.12035369873046875, -0.11675071716308594, -0.11314773559570312, -0.10954475402832031, -0.1059417724609375, -0.10233879089355469, -0.09873580932617188, -0.09513282775878906, -0.09152984619140625, -0.08792686462402344, -0.08432388305664062, -0.08072090148925781, -0.077117919921875, -0.07351493835449219, -0.06991195678710938, -0.06630897521972656, -0.06270599365234375, -0.05910301208496094, -0.055500030517578125, -0.05189704895019531, -0.0482940673828125, -0.04469108581542969, -0.041088104248046875, -0.03748512268066406, -0.03388214111328125, -0.030279159545898438, -0.026676177978515625, -0.023073196411132812, -0.01947021484375, -0.015867233276367188, -0.012264251708984375, -0.008661270141601562, -0.00505828857421875, -0.0014553070068359375, 0.002147674560546875, 0.0057506561279296875, 0.0093536376953125, 0.012956619262695312, 0.016559600830078125, 0.020162582397460938, 0.02376556396484375, 0.027368545532226562, 0.030971527099609375, 0.03457450866699219, 0.038177490234375, 0.04178047180175781, 0.045383453369140625, 0.04898643493652344, 0.05258941650390625, 0.05619239807128906, 0.059795379638671875, 0.06339836120605469, 0.0670013427734375, 0.07060432434082031, 0.07420730590820312, 0.07781028747558594, 0.08141326904296875, 0.08501625061035156, 0.08861923217773438, 0.09222221374511719, 0.0958251953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 14.0, 12.0, 12.0, 30.0, 21.0, 36.0, 38.0, 73.0, 70.0, 87.0, 64.0, 63.0, 80.0, 65.0, 58.0, 66.0, 40.0, 30.0, 30.0, 16.0, 10.0, 8.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.017303466796875, -0.01683521270751953, -0.016366958618164062, -0.015898704528808594, -0.015430450439453125, -0.014962196350097656, -0.014493942260742188, -0.014025688171386719, -0.01355743408203125, -0.013089179992675781, -0.012620925903320312, -0.012152671813964844, -0.011684417724609375, -0.011216163635253906, -0.010747909545898438, -0.010279655456542969, -0.0098114013671875, -0.009343147277832031, -0.008874893188476562, -0.008406639099121094, -0.007938385009765625, -0.007470130920410156, -0.0070018768310546875, -0.006533622741699219, -0.00606536865234375, -0.005597114562988281, -0.0051288604736328125, -0.004660606384277344, -0.004192352294921875, -0.0037240982055664062, -0.0032558441162109375, -0.0027875900268554688, -0.0023193359375, -0.0018510818481445312, -0.0013828277587890625, -0.0009145736694335938, -0.000446319580078125, 2.193450927734375e-05, 0.0004901885986328125, 0.0009584426879882812, 0.00142669677734375, 0.0018949508666992188, 0.0023632049560546875, 0.0028314590454101562, 0.003299713134765625, 0.0037679672241210938, 0.0042362213134765625, 0.004704475402832031, 0.0051727294921875, 0.005640983581542969, 0.0061092376708984375, 0.006577491760253906, 0.007045745849609375, 0.007513999938964844, 0.007982254028320312, 0.008450508117675781, 0.00891876220703125, 0.009387016296386719, 0.009855270385742188, 0.010323524475097656, 0.010791778564453125, 0.011260032653808594, 0.011728286743164062, 0.012196540832519531, 0.012664794921875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 45.0, 81.0, 169.0, 215.0, 231.0, 153.0, 61.0, 27.0, 10.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.830513000488281, -12.50902271270752, -12.187532424926758, -11.866042137145996, -11.544551849365234, -11.223062515258789, -10.901571273803711, -10.580081939697266, -10.258591651916504, -9.937101364135742, -9.61561107635498, -9.294120788574219, -8.972630500793457, -8.651140213012695, -8.32965087890625, -8.008160591125488, -7.686669826507568, -7.365179538726807, -7.043689250946045, -6.722199440002441, -6.40070915222168, -6.079218864440918, -5.757728576660156, -5.4362382888793945, -5.114748001098633, -4.793257713317871, -4.471767425537109, -4.150277137756348, -3.828787326812744, -3.5072970390319824, -3.1858067512512207, -2.864316701889038, -2.5428271293640137, -2.221336841583252, -1.8998467922210693, -1.5783565044403076, -1.2568663358688354, -0.9353761672973633, -0.6138858795166016, -0.29239583015441895, 0.029094457626342773, 0.35058465600013733, 0.6720748543739319, 0.9935650825500488, 1.315055251121521, 1.6365454196929932, 1.9580357074737549, 2.2795257568359375, 2.601016044616699, 2.922506332397461, 3.2439963817596436, 3.5654866695404053, 3.886976718902588, 4.20846700668335, 4.529957294464111, 4.851447105407715, 5.172937393188477, 5.494427680969238, 5.81591796875, 6.137408256530762, 6.458898067474365, 6.780388355255127, 7.101878643035889, 7.423368453979492, 7.744859218597412]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 15.0, 21.0, 36.0, 46.0, 65.0, 84.0, 84.0, 97.0, 106.0, 102.0, 110.0, 60.0, 64.0, 39.0, 33.0, 16.0, 9.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646125316619873, -2.4611449241638184, -2.2761645317077637, -2.091184139251709, -1.9062037467956543, -1.7212233543395996, -1.536242961883545, -1.3512625694274902, -1.1662821769714355, -0.9813017845153809, -0.7963213920593262, -0.6113409996032715, -0.4263606071472168, -0.2413802146911621, -0.05639982223510742, 0.12858057022094727, 0.31356096267700195, 0.49854135513305664, 0.6835217475891113, 0.868502140045166, 1.0534825325012207, 1.2384629249572754, 1.42344331741333, 1.6084237098693848, 1.7934041023254395, 1.9783844947814941, 2.163364887237549, 2.3483452796936035, 2.533325672149658, 2.718306064605713, 2.9032864570617676, 3.0882668495178223, 3.273247718811035, 3.45822811126709, 3.6432085037231445, 3.828188896179199, 4.013169288635254, 4.198149681091309, 4.383130073547363, 4.568110466003418, 4.753090858459473, 4.938071250915527, 5.123051643371582, 5.308032035827637, 5.493012428283691, 5.677992820739746, 5.862973213195801, 6.0479536056518555, 6.23293399810791, 6.417914390563965, 6.6028947830200195, 6.787875175476074, 6.972855567932129, 7.157835960388184, 7.342816352844238, 7.527796745300293, 7.712777137756348, 7.897757530212402, 8.082737922668457, 8.267718315124512, 8.452698707580566, 8.637679100036621, 8.822659492492676, 9.00763988494873, 9.192620277404785]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 13.0, 22.0, 56.0, 126.0, 290.0, 856.0, 3460.0, 17119.0, 96817.0, 401822.0, 406692.0, 99025.0, 17410.0, 3447.0, 871.0, 297.0, 119.0, 50.0, 32.0, 15.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.24530029296875, -6.0765380859375, -5.90777587890625, -5.739013671875, -5.57025146484375, -5.4014892578125, -5.23272705078125, -5.06396484375, -4.89520263671875, -4.7264404296875, -4.55767822265625, -4.388916015625, -4.22015380859375, -4.0513916015625, -3.88262939453125, -3.7138671875, -3.54510498046875, -3.3763427734375, -3.20758056640625, -3.038818359375, -2.87005615234375, -2.7012939453125, -2.53253173828125, -2.36376953125, -2.19500732421875, -2.0262451171875, -1.85748291015625, -1.688720703125, -1.51995849609375, -1.3511962890625, -1.18243408203125, -1.013671875, -0.84490966796875, -0.6761474609375, -0.50738525390625, -0.338623046875, -0.16986083984375, -0.0010986328125, 0.16766357421875, 0.33642578125, 0.50518798828125, 0.6739501953125, 0.84271240234375, 1.011474609375, 1.18023681640625, 1.3489990234375, 1.51776123046875, 1.6865234375, 1.85528564453125, 2.0240478515625, 2.19281005859375, 2.361572265625, 2.53033447265625, 2.6990966796875, 2.86785888671875, 3.03662109375, 3.20538330078125, 3.3741455078125, 3.54290771484375, 3.711669921875, 3.88043212890625, 4.0491943359375, 4.21795654296875, 4.38671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 6.0, 11.0, 16.0, 12.0, 34.0, 38.0, 60.0, 61.0, 73.0, 75.0, 91.0, 85.0, 88.0, 80.0, 75.0, 61.0, 42.0, 37.0, 17.0, 21.0, 14.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.78289794921875, -3.4993896484375, -3.21588134765625, -2.932373046875, -2.64886474609375, -2.3653564453125, -2.08184814453125, -1.79833984375, -1.51483154296875, -1.2313232421875, -0.94781494140625, -0.664306640625, -0.38079833984375, -0.0972900390625, 0.18621826171875, 0.4697265625, 0.75323486328125, 1.0367431640625, 1.32025146484375, 1.603759765625, 1.88726806640625, 2.1707763671875, 2.45428466796875, 2.73779296875, 3.02130126953125, 3.3048095703125, 3.58831787109375, 3.871826171875, 4.15533447265625, 4.4388427734375, 4.72235107421875, 5.005859375, 5.28936767578125, 5.5728759765625, 5.85638427734375, 6.139892578125, 6.42340087890625, 6.7069091796875, 6.99041748046875, 7.27392578125, 7.55743408203125, 7.8409423828125, 8.12445068359375, 8.407958984375, 8.69146728515625, 8.9749755859375, 9.25848388671875, 9.5419921875, 9.82550048828125, 10.1090087890625, 10.39251708984375, 10.676025390625, 10.95953369140625, 11.2430419921875, 11.52655029296875, 11.81005859375, 12.09356689453125, 12.3770751953125, 12.66058349609375, 12.944091796875, 13.22760009765625, 13.5111083984375, 13.79461669921875, 14.078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 7.0, 10.0, 6.0, 11.0, 14.0, 7.0, 24.0, 26.0, 41.0, 41.0, 52.0, 72.0, 78.0, 93.0, 128.0, 155.0, 180.0, 327.0, 642.0, 9142.0, 467108.0, 556577.0, 11726.0, 768.0, 321.0, 220.0, 151.0, 118.0, 91.0, 74.0, 62.0, 49.0, 44.0, 32.0, 35.0, 21.0, 27.0, 14.0, 15.0, 7.0, 6.0, 3.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.2109375, -10.837646484375, -10.46435546875, -10.091064453125, -9.7177734375, -9.344482421875, -8.97119140625, -8.597900390625, -8.224609375, -7.851318359375, -7.47802734375, -7.104736328125, -6.7314453125, -6.358154296875, -5.98486328125, -5.611572265625, -5.23828125, -4.864990234375, -4.49169921875, -4.118408203125, -3.7451171875, -3.371826171875, -2.99853515625, -2.625244140625, -2.251953125, -1.878662109375, -1.50537109375, -1.132080078125, -0.7587890625, -0.385498046875, -0.01220703125, 0.361083984375, 0.734375, 1.107666015625, 1.48095703125, 1.854248046875, 2.2275390625, 2.600830078125, 2.97412109375, 3.347412109375, 3.720703125, 4.093994140625, 4.46728515625, 4.840576171875, 5.2138671875, 5.587158203125, 5.96044921875, 6.333740234375, 6.70703125, 7.080322265625, 7.45361328125, 7.826904296875, 8.2001953125, 8.573486328125, 8.94677734375, 9.320068359375, 9.693359375, 10.066650390625, 10.43994140625, 10.813232421875, 11.1865234375, 11.559814453125, 11.93310546875, 12.306396484375, 12.6796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 10.0, 7.0, 10.0, 15.0, 13.0, 16.0, 20.0, 22.0, 17.0, 29.0, 30.0, 36.0, 33.0, 32.0, 26.0, 41.0, 31.0, 45.0, 38.0, 45.0, 42.0, 45.0, 31.0, 38.0, 26.0, 31.0, 34.0, 33.0, 31.0, 20.0, 13.0, 24.0, 18.0, 9.0, 8.0, 11.0, 8.0, 11.0, 5.0, 5.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.9765625, -3.84600830078125, -3.7154541015625, -3.58489990234375, -3.454345703125, -3.32379150390625, -3.1932373046875, -3.06268310546875, -2.93212890625, -2.80157470703125, -2.6710205078125, -2.54046630859375, -2.409912109375, -2.27935791015625, -2.1488037109375, -2.01824951171875, -1.8876953125, -1.75714111328125, -1.6265869140625, -1.49603271484375, -1.365478515625, -1.23492431640625, -1.1043701171875, -0.97381591796875, -0.84326171875, -0.71270751953125, -0.5821533203125, -0.45159912109375, -0.321044921875, -0.19049072265625, -0.0599365234375, 0.07061767578125, 0.201171875, 0.33172607421875, 0.4622802734375, 0.59283447265625, 0.723388671875, 0.85394287109375, 0.9844970703125, 1.11505126953125, 1.24560546875, 1.37615966796875, 1.5067138671875, 1.63726806640625, 1.767822265625, 1.89837646484375, 2.0289306640625, 2.15948486328125, 2.2900390625, 2.42059326171875, 2.5511474609375, 2.68170166015625, 2.812255859375, 2.94281005859375, 3.0733642578125, 3.20391845703125, 3.33447265625, 3.46502685546875, 3.5955810546875, 3.72613525390625, 3.856689453125, 3.98724365234375, 4.1177978515625, 4.24835205078125, 4.37890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 7.0, 18.0, 28.0, 32.0, 57.0, 133.0, 208.0, 468.0, 1879.0, 18322.0, 618599.0, 395138.0, 11337.0, 1443.0, 411.0, 189.0, 108.0, 55.0, 45.0, 21.0, 15.0, 3.0, 9.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.572540283203125, -2.46929931640625, -2.366058349609375, -2.2628173828125, -2.159576416015625, -2.05633544921875, -1.953094482421875, -1.849853515625, -1.746612548828125, -1.64337158203125, -1.540130615234375, -1.4368896484375, -1.333648681640625, -1.23040771484375, -1.127166748046875, -1.02392578125, -0.920684814453125, -0.81744384765625, -0.714202880859375, -0.6109619140625, -0.507720947265625, -0.40447998046875, -0.301239013671875, -0.197998046875, -0.094757080078125, 0.00848388671875, 0.111724853515625, 0.2149658203125, 0.318206787109375, 0.42144775390625, 0.524688720703125, 0.6279296875, 0.731170654296875, 0.83441162109375, 0.937652587890625, 1.0408935546875, 1.144134521484375, 1.24737548828125, 1.350616455078125, 1.453857421875, 1.557098388671875, 1.66033935546875, 1.763580322265625, 1.8668212890625, 1.970062255859375, 2.07330322265625, 2.176544189453125, 2.27978515625, 2.383026123046875, 2.48626708984375, 2.589508056640625, 2.6927490234375, 2.795989990234375, 2.89923095703125, 3.002471923828125, 3.105712890625, 3.208953857421875, 3.31219482421875, 3.415435791015625, 3.5186767578125, 3.621917724609375, 3.72515869140625, 3.828399658203125, 3.931640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 3.0, 9.0, 10.0, 16.0, 9.0, 16.0, 37.0, 32.0, 54.0, 44.0, 68.0, 57.0, 93.0, 92.0, 69.0, 64.0, 56.0, 61.0, 44.0, 32.0, 29.0, 22.0, 21.0, 6.0, 12.0, 7.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016260147094726562, -0.00015597790479660034, -0.00014935433864593506, -0.00014273077249526978, -0.0001361072063446045, -0.0001294836401939392, -0.00012286007404327393, -0.00011623650789260864, -0.00010961294174194336, -0.00010298937559127808, -9.636580944061279e-05, -8.974224328994751e-05, -8.311867713928223e-05, -7.649511098861694e-05, -6.987154483795166e-05, -6.324797868728638e-05, -5.6624412536621094e-05, -5.000084638595581e-05, -4.337728023529053e-05, -3.6753714084625244e-05, -3.013014793395996e-05, -2.3506581783294678e-05, -1.6883015632629395e-05, -1.0259449481964111e-05, -3.635883331298828e-06, 2.987682819366455e-06, 9.611248970031738e-06, 1.623481512069702e-05, 2.2858381271362305e-05, 2.9481947422027588e-05, 3.610551357269287e-05, 4.2729079723358154e-05, 4.935264587402344e-05, 5.597621202468872e-05, 6.2599778175354e-05, 6.922334432601929e-05, 7.584691047668457e-05, 8.247047662734985e-05, 8.909404277801514e-05, 9.571760892868042e-05, 0.0001023411750793457, 0.00010896474123001099, 0.00011558830738067627, 0.00012221187353134155, 0.00012883543968200684, 0.00013545900583267212, 0.0001420825719833374, 0.00014870613813400269, 0.00015532970428466797, 0.00016195327043533325, 0.00016857683658599854, 0.00017520040273666382, 0.0001818239688873291, 0.00018844753503799438, 0.00019507110118865967, 0.00020169466733932495, 0.00020831823348999023, 0.00021494179964065552, 0.0002215653657913208, 0.00022818893194198608, 0.00023481249809265137, 0.00024143606424331665, 0.00024805963039398193, 0.0002546831965446472, 0.0002613067626953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 9.0, 4.0, 8.0, 9.0, 13.0, 15.0, 25.0, 37.0, 50.0, 83.0, 114.0, 167.0, 429.0, 1408.0, 8125.0, 161767.0, 807209.0, 62546.0, 4748.0, 971.0, 324.0, 163.0, 97.0, 61.0, 40.0, 29.0, 25.0, 23.0, 11.0, 6.0, 5.0, 8.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.091796875, -3.0018310546875, -2.911865234375, -2.8218994140625, -2.73193359375, -2.6419677734375, -2.552001953125, -2.4620361328125, -2.3720703125, -2.2821044921875, -2.192138671875, -2.1021728515625, -2.01220703125, -1.9222412109375, -1.832275390625, -1.7423095703125, -1.65234375, -1.5623779296875, -1.472412109375, -1.3824462890625, -1.29248046875, -1.2025146484375, -1.112548828125, -1.0225830078125, -0.9326171875, -0.8426513671875, -0.752685546875, -0.6627197265625, -0.57275390625, -0.4827880859375, -0.392822265625, -0.3028564453125, -0.212890625, -0.1229248046875, -0.032958984375, 0.0570068359375, 0.14697265625, 0.2369384765625, 0.326904296875, 0.4168701171875, 0.5068359375, 0.5968017578125, 0.686767578125, 0.7767333984375, 0.86669921875, 0.9566650390625, 1.046630859375, 1.1365966796875, 1.2265625, 1.3165283203125, 1.406494140625, 1.4964599609375, 1.58642578125, 1.6763916015625, 1.766357421875, 1.8563232421875, 1.9462890625, 2.0362548828125, 2.126220703125, 2.2161865234375, 2.30615234375, 2.3961181640625, 2.486083984375, 2.5760498046875, 2.666015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 11.0, 10.0, 7.0, 15.0, 24.0, 28.0, 34.0, 48.0, 54.0, 66.0, 74.0, 71.0, 85.0, 83.0, 78.0, 69.0, 48.0, 46.0, 32.0, 25.0, 24.0, 11.0, 9.0, 7.0, 15.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66162109375, -0.641815185546875, -0.62200927734375, -0.602203369140625, -0.5823974609375, -0.562591552734375, -0.54278564453125, -0.522979736328125, -0.503173828125, -0.483367919921875, -0.46356201171875, -0.443756103515625, -0.4239501953125, -0.404144287109375, -0.38433837890625, -0.364532470703125, -0.3447265625, -0.324920654296875, -0.30511474609375, -0.285308837890625, -0.2655029296875, -0.245697021484375, -0.22589111328125, -0.206085205078125, -0.186279296875, -0.166473388671875, -0.14666748046875, -0.126861572265625, -0.1070556640625, -0.087249755859375, -0.06744384765625, -0.047637939453125, -0.02783203125, -0.008026123046875, 0.01177978515625, 0.031585693359375, 0.0513916015625, 0.071197509765625, 0.09100341796875, 0.110809326171875, 0.130615234375, 0.150421142578125, 0.17022705078125, 0.190032958984375, 0.2098388671875, 0.229644775390625, 0.24945068359375, 0.269256591796875, 0.2890625, 0.308868408203125, 0.32867431640625, 0.348480224609375, 0.3682861328125, 0.388092041015625, 0.40789794921875, 0.427703857421875, 0.447509765625, 0.467315673828125, 0.48712158203125, 0.506927490234375, 0.5267333984375, 0.546539306640625, 0.56634521484375, 0.586151123046875, 0.60595703125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 18.0, 41.0, 58.0, 105.0, 117.0, 171.0, 175.0, 129.0, 81.0, 55.0, 32.0, 18.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.838399410247803, -4.357330322265625, -3.8762612342834473, -3.3951919078826904, -2.9141228199005127, -2.433053731918335, -1.9519844055175781, -1.4709153175354004, -0.9898462295532227, -0.5087770819664001, -0.027707934379577637, 0.45336127281188965, 0.9344303607940674, 1.4154994487762451, 1.896568775177002, 2.3776378631591797, 2.8587069511413574, 3.339776039123535, 3.820845127105713, 4.301914215087891, 4.782983779907227, 5.264052391052246, 5.745121955871582, 6.22619104385376, 6.7072601318359375, 7.188329219818115, 7.669398307800293, 8.150467872619629, 8.631536483764648, 9.112606048583984, 9.59367561340332, 10.07474422454834, 10.55581283569336, 11.036882400512695, 11.517951011657715, 11.99902057647705, 12.48008918762207, 12.961158752441406, 13.442228317260742, 13.923296928405762, 14.404365539550781, 14.885435104370117, 15.366503715515137, 15.847573280334473, 16.328641891479492, 16.809711456298828, 17.290781021118164, 17.7718505859375, 18.252918243408203, 18.73398780822754, 19.215057373046875, 19.696125030517578, 20.177194595336914, 20.65826416015625, 21.139333724975586, 21.620403289794922, 22.101472854614258, 22.582542419433594, 23.06361198425293, 23.544679641723633, 24.02574920654297, 24.506818771362305, 24.98788833618164, 25.468955993652344, 25.95002555847168]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 9.0, 8.0, 15.0, 18.0, 24.0, 20.0, 31.0, 40.0, 30.0, 40.0, 39.0, 43.0, 63.0, 60.0, 58.0, 56.0, 51.0, 44.0, 65.0, 38.0, 47.0, 36.0, 35.0, 34.0, 15.0, 16.0, 14.0, 14.0, 6.0, 13.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.641651153564453, -6.327957630157471, -6.014264106750488, -5.700570583343506, -5.386877059936523, -5.073183536529541, -4.759490013122559, -4.445796489715576, -4.132102966308594, -3.8184094429016113, -3.504715919494629, -3.1910223960876465, -2.877328872680664, -2.5636353492736816, -2.249941825866699, -1.9362483024597168, -1.6225547790527344, -1.308861255645752, -0.9951677322387695, -0.6814742088317871, -0.3677806854248047, -0.054087162017822266, 0.25960636138916016, 0.5732998847961426, 0.886993408203125, 1.2006869316101074, 1.5143804550170898, 1.8280739784240723, 2.1417675018310547, 2.455461025238037, 2.7691545486450195, 3.082848072052002, 3.3965415954589844, 3.710235118865967, 4.023928642272949, 4.337622165679932, 4.651315689086914, 4.9650092124938965, 5.278702735900879, 5.592396259307861, 5.906089782714844, 6.219783306121826, 6.533476829528809, 6.847170352935791, 7.160863876342773, 7.474557399749756, 7.788250923156738, 8.101943969726562, 8.415637969970703, 8.729331970214844, 9.043025016784668, 9.356718063354492, 9.670412063598633, 9.984106063842773, 10.297799110412598, 10.611492156982422, 10.925186157226562, 11.238880157470703, 11.552573204040527, 11.866266250610352, 12.179960250854492, 12.493654251098633, 12.807347297668457, 13.121040344238281, 13.434734344482422]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 20.0, 40.0, 46.0, 83.0, 127.0, 150.0, 272.0, 515.0, 1453.0, 10023.0, 178537.0, 2205923.0, 1683057.0, 105000.0, 6636.0, 1109.0, 492.0, 266.0, 169.0, 122.0, 87.0, 57.0, 38.0, 14.0, 15.0, 10.0, 6.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.528076171875, -5.23583984375, -4.943603515625, -4.6513671875, -4.359130859375, -4.06689453125, -3.774658203125, -3.482421875, -3.190185546875, -2.89794921875, -2.605712890625, -2.3134765625, -2.021240234375, -1.72900390625, -1.436767578125, -1.14453125, -0.852294921875, -0.56005859375, -0.267822265625, 0.0244140625, 0.316650390625, 0.60888671875, 0.901123046875, 1.193359375, 1.485595703125, 1.77783203125, 2.070068359375, 2.3623046875, 2.654541015625, 2.94677734375, 3.239013671875, 3.53125, 3.823486328125, 4.11572265625, 4.407958984375, 4.7001953125, 4.992431640625, 5.28466796875, 5.576904296875, 5.869140625, 6.161376953125, 6.45361328125, 6.745849609375, 7.0380859375, 7.330322265625, 7.62255859375, 7.914794921875, 8.20703125, 8.499267578125, 8.79150390625, 9.083740234375, 9.3759765625, 9.668212890625, 9.96044921875, 10.252685546875, 10.544921875, 10.837158203125, 11.12939453125, 11.421630859375, 11.7138671875, 12.006103515625, 12.29833984375, 12.590576171875, 12.8828125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 3.0, 2.0, 7.0, 9.0, 10.0, 12.0, 17.0, 17.0, 16.0, 15.0, 22.0, 29.0, 22.0, 40.0, 32.0, 37.0, 29.0, 31.0, 40.0, 34.0, 38.0, 43.0, 38.0, 43.0, 41.0, 50.0, 43.0, 33.0, 38.0, 27.0, 22.0, 25.0, 21.0, 14.0, 19.0, 16.0, 6.0, 8.0, 9.0, 9.0, 5.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.28125, -3.173004150390625, -3.06475830078125, -2.956512451171875, -2.8482666015625, -2.740020751953125, -2.63177490234375, -2.523529052734375, -2.415283203125, -2.307037353515625, -2.19879150390625, -2.090545654296875, -1.9822998046875, -1.874053955078125, -1.76580810546875, -1.657562255859375, -1.54931640625, -1.441070556640625, -1.33282470703125, -1.224578857421875, -1.1163330078125, -1.008087158203125, -0.89984130859375, -0.791595458984375, -0.683349609375, -0.575103759765625, -0.46685791015625, -0.358612060546875, -0.2503662109375, -0.142120361328125, -0.03387451171875, 0.074371337890625, 0.1826171875, 0.290863037109375, 0.39910888671875, 0.507354736328125, 0.6156005859375, 0.723846435546875, 0.83209228515625, 0.940338134765625, 1.048583984375, 1.156829833984375, 1.26507568359375, 1.373321533203125, 1.4815673828125, 1.589813232421875, 1.69805908203125, 1.806304931640625, 1.91455078125, 2.022796630859375, 2.13104248046875, 2.239288330078125, 2.3475341796875, 2.455780029296875, 2.56402587890625, 2.672271728515625, 2.780517578125, 2.888763427734375, 2.99700927734375, 3.105255126953125, 3.2135009765625, 3.321746826171875, 3.42999267578125, 3.538238525390625, 3.646484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 10.0, 19.0, 12.0, 28.0, 32.0, 38.0, 84.0, 135.0, 224.0, 531.0, 1574.0, 22504.0, 4022832.0, 142668.0, 2254.0, 650.0, 265.0, 151.0, 76.0, 60.0, 35.0, 14.0, 19.0, 15.0, 12.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-24.515625, -23.927001953125, -23.33837890625, -22.749755859375, -22.1611328125, -21.572509765625, -20.98388671875, -20.395263671875, -19.806640625, -19.218017578125, -18.62939453125, -18.040771484375, -17.4521484375, -16.863525390625, -16.27490234375, -15.686279296875, -15.09765625, -14.509033203125, -13.92041015625, -13.331787109375, -12.7431640625, -12.154541015625, -11.56591796875, -10.977294921875, -10.388671875, -9.800048828125, -9.21142578125, -8.622802734375, -8.0341796875, -7.445556640625, -6.85693359375, -6.268310546875, -5.6796875, -5.091064453125, -4.50244140625, -3.913818359375, -3.3251953125, -2.736572265625, -2.14794921875, -1.559326171875, -0.970703125, -0.382080078125, 0.20654296875, 0.795166015625, 1.3837890625, 1.972412109375, 2.56103515625, 3.149658203125, 3.73828125, 4.326904296875, 4.91552734375, 5.504150390625, 6.0927734375, 6.681396484375, 7.27001953125, 7.858642578125, 8.447265625, 9.035888671875, 9.62451171875, 10.213134765625, 10.8017578125, 11.390380859375, 11.97900390625, 12.567626953125, 13.15625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 15.0, 20.0, 51.0, 61.0, 119.0, 205.0, 359.0, 598.0, 770.0, 695.0, 465.0, 288.0, 187.0, 95.0, 50.0, 32.0, 25.0, 13.0, 12.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.403289794921875, -1.30853271484375, -1.213775634765625, -1.1190185546875, -1.024261474609375, -0.92950439453125, -0.834747314453125, -0.739990234375, -0.645233154296875, -0.55047607421875, -0.455718994140625, -0.3609619140625, -0.266204833984375, -0.17144775390625, -0.076690673828125, 0.01806640625, 0.112823486328125, 0.20758056640625, 0.302337646484375, 0.3970947265625, 0.491851806640625, 0.58660888671875, 0.681365966796875, 0.776123046875, 0.870880126953125, 0.96563720703125, 1.060394287109375, 1.1551513671875, 1.249908447265625, 1.34466552734375, 1.439422607421875, 1.5341796875, 1.628936767578125, 1.72369384765625, 1.818450927734375, 1.9132080078125, 2.007965087890625, 2.10272216796875, 2.197479248046875, 2.292236328125, 2.386993408203125, 2.48175048828125, 2.576507568359375, 2.6712646484375, 2.766021728515625, 2.86077880859375, 2.955535888671875, 3.05029296875, 3.145050048828125, 3.23980712890625, 3.334564208984375, 3.4293212890625, 3.524078369140625, 3.61883544921875, 3.713592529296875, 3.808349609375, 3.903106689453125, 3.99786376953125, 4.092620849609375, 4.1873779296875, 4.282135009765625, 4.37689208984375, 4.471649169921875, 4.56640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 8.0, 11.0, 21.0, 32.0, 36.0, 40.0, 61.0, 71.0, 83.0, 103.0, 94.0, 81.0, 75.0, 73.0, 67.0, 45.0, 39.0, 21.0, 20.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.012707233428955, -3.792933702468872, -3.573160171508789, -3.353386402130127, -3.133613109588623, -2.913839340209961, -2.694065809249878, -2.474292278289795, -2.254518747329712, -2.034745216369629, -1.814971685409546, -1.5951980352401733, -1.3754245042800903, -1.1556509733200073, -0.9358773231506348, -0.7161037921905518, -0.49633026123046875, -0.27655670046806335, -0.05678313970565796, 0.16299045085906982, 0.38276398181915283, 0.6025375127792358, 0.8223111629486084, 1.0420846939086914, 1.2618582248687744, 1.4816317558288574, 1.7014052867889404, 1.921178936958313, 2.1409525871276855, 2.3607258796691895, 2.5804996490478516, 2.8002731800079346, 3.020047187805176, 3.239820718765259, 3.459594249725342, 3.679368019104004, 3.899141311645508, 4.11891508102417, 4.338688850402832, 4.558462142944336, 4.77823543548584, 4.998009204864502, 5.217782497406006, 5.437556266784668, 5.657329559326172, 5.877103328704834, 6.096877098083496, 6.316650390625, 6.536424160003662, 6.756197929382324, 6.975971221923828, 7.19574499130249, 7.415518283843994, 7.635292053222656, 7.85506534576416, 8.074838638305664, 8.294612884521484, 8.514386177062988, 8.734160423278809, 8.953933715820312, 9.173707008361816, 9.39348030090332, 9.61325454711914, 9.833027839660645, 10.052801132202148]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 11.0, 12.0, 14.0, 18.0, 18.0, 8.0, 21.0, 25.0, 21.0, 20.0, 22.0, 27.0, 23.0, 29.0, 29.0, 34.0, 44.0, 40.0, 39.0, 43.0, 39.0, 33.0, 45.0, 46.0, 32.0, 34.0, 37.0, 34.0, 21.0, 23.0, 18.0, 19.0, 17.0, 14.0, 11.0, 10.0, 11.0, 9.0, 4.0, 6.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9131927490234375, -3.800863027572632, -3.688533306121826, -3.5762035846710205, -3.463873863220215, -3.351544141769409, -3.2392144203186035, -3.126884698867798, -3.014554977416992, -2.9022252559661865, -2.789895534515381, -2.677565813064575, -2.5652360916137695, -2.452906370162964, -2.340576648712158, -2.2282469272613525, -2.115917205810547, -2.003587484359741, -1.8912577629089355, -1.7789280414581299, -1.6665983200073242, -1.5542685985565186, -1.441938877105713, -1.3296091556549072, -1.2172791957855225, -1.1049494743347168, -0.9926197528839111, -0.8802900314331055, -0.7679603099822998, -0.6556305289268494, -0.5433008074760437, -0.43097108602523804, -0.31864142417907715, -0.20631170272827148, -0.09398196637630463, 0.01834776997566223, 0.1306774914264679, 0.24300724267959595, 0.3553369641304016, 0.4676666855812073, 0.5799964070320129, 0.6923261284828186, 0.8046558499336243, 0.9169856309890747, 1.0293153524398804, 1.141645073890686, 1.2539747953414917, 1.3663045167922974, 1.478634238243103, 1.5909639596939087, 1.7032936811447144, 1.81562340259552, 1.9279531240463257, 2.040282964706421, 2.1526126861572266, 2.2649424076080322, 2.377272129058838, 2.4896018505096436, 2.601931571960449, 2.714261293411255, 2.8265910148620605, 2.938920736312866, 3.051250457763672, 3.1635801792144775, 3.275909900665283]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 22.0, 22.0, 25.0, 32.0, 44.0, 69.0, 105.0, 150.0, 192.0, 259.0, 451.0, 822.0, 1790.0, 4943.0, 17049.0, 67077.0, 241275.0, 425730.0, 209385.0, 56270.0, 14697.0, 4423.0, 1676.0, 753.0, 428.0, 262.0, 172.0, 107.0, 86.0, 74.0, 49.0, 25.0, 18.0, 22.0, 6.0, 9.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6367874145507812, -0.6143951416015625, -0.5920028686523438, -0.569610595703125, -0.5472183227539062, -0.5248260498046875, -0.5024337768554688, -0.48004150390625, -0.45764923095703125, -0.4352569580078125, -0.41286468505859375, -0.390472412109375, -0.36808013916015625, -0.3456878662109375, -0.32329559326171875, -0.3009033203125, -0.27851104736328125, -0.2561187744140625, -0.23372650146484375, -0.211334228515625, -0.18894195556640625, -0.1665496826171875, -0.14415740966796875, -0.12176513671875, -0.09937286376953125, -0.0769805908203125, -0.05458831787109375, -0.032196044921875, -0.00980377197265625, 0.0125885009765625, 0.03498077392578125, 0.057373046875, 0.07976531982421875, 0.1021575927734375, 0.12454986572265625, 0.146942138671875, 0.16933441162109375, 0.1917266845703125, 0.21411895751953125, 0.23651123046875, 0.25890350341796875, 0.2812957763671875, 0.30368804931640625, 0.326080322265625, 0.34847259521484375, 0.3708648681640625, 0.39325714111328125, 0.4156494140625, 0.43804168701171875, 0.4604339599609375, 0.48282623291015625, 0.505218505859375, 0.5276107788085938, 0.5500030517578125, 0.5723953247070312, 0.59478759765625, 0.6171798706054688, 0.6395721435546875, 0.6619644165039062, 0.684356689453125, 0.7067489624023438, 0.7291412353515625, 0.7515335083007812, 0.77392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 4.0, 5.0, 6.0, 18.0, 12.0, 21.0, 20.0, 19.0, 22.0, 26.0, 32.0, 35.0, 32.0, 46.0, 45.0, 41.0, 43.0, 53.0, 62.0, 44.0, 49.0, 44.0, 41.0, 34.0, 47.0, 30.0, 32.0, 27.0, 25.0, 19.0, 15.0, 10.0, 7.0, 9.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.486328125, -3.39398193359375, -3.3016357421875, -3.20928955078125, -3.116943359375, -3.02459716796875, -2.9322509765625, -2.83990478515625, -2.74755859375, -2.65521240234375, -2.5628662109375, -2.47052001953125, -2.378173828125, -2.28582763671875, -2.1934814453125, -2.10113525390625, -2.0087890625, -1.91644287109375, -1.8240966796875, -1.73175048828125, -1.639404296875, -1.54705810546875, -1.4547119140625, -1.36236572265625, -1.27001953125, -1.17767333984375, -1.0853271484375, -0.99298095703125, -0.900634765625, -0.80828857421875, -0.7159423828125, -0.62359619140625, -0.53125, -0.43890380859375, -0.3465576171875, -0.25421142578125, -0.161865234375, -0.06951904296875, 0.0228271484375, 0.11517333984375, 0.20751953125, 0.29986572265625, 0.3922119140625, 0.48455810546875, 0.576904296875, 0.66925048828125, 0.7615966796875, 0.85394287109375, 0.9462890625, 1.03863525390625, 1.1309814453125, 1.22332763671875, 1.315673828125, 1.40802001953125, 1.5003662109375, 1.59271240234375, 1.68505859375, 1.77740478515625, 1.8697509765625, 1.96209716796875, 2.054443359375, 2.14678955078125, 2.2391357421875, 2.33148193359375, 2.423828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 25.0, 31.0, 43.0, 77.0, 151.0, 301.0, 623.0, 1415.0, 2884.0, 6109.0, 13227.0, 28220.0, 58832.0, 115219.0, 192442.0, 233742.0, 183379.0, 107140.0, 54753.0, 26394.0, 12384.0, 5718.0, 2790.0, 1302.0, 617.0, 320.0, 156.0, 91.0, 43.0, 34.0, 21.0, 8.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.34423828125, -0.3342437744140625, -0.324249267578125, -0.3142547607421875, -0.30426025390625, -0.2942657470703125, -0.284271240234375, -0.2742767333984375, -0.2642822265625, -0.2542877197265625, -0.244293212890625, -0.2342987060546875, -0.22430419921875, -0.2143096923828125, -0.204315185546875, -0.1943206787109375, -0.184326171875, -0.1743316650390625, -0.164337158203125, -0.1543426513671875, -0.14434814453125, -0.1343536376953125, -0.124359130859375, -0.1143646240234375, -0.1043701171875, -0.0943756103515625, -0.084381103515625, -0.0743865966796875, -0.06439208984375, -0.0543975830078125, -0.044403076171875, -0.0344085693359375, -0.0244140625, -0.0144195556640625, -0.004425048828125, 0.0055694580078125, 0.01556396484375, 0.0255584716796875, 0.035552978515625, 0.0455474853515625, 0.0555419921875, 0.0655364990234375, 0.075531005859375, 0.0855255126953125, 0.09552001953125, 0.1055145263671875, 0.115509033203125, 0.1255035400390625, 0.135498046875, 0.1454925537109375, 0.155487060546875, 0.1654815673828125, 0.17547607421875, 0.1854705810546875, 0.195465087890625, 0.2054595947265625, 0.2154541015625, 0.2254486083984375, 0.235443115234375, 0.2454376220703125, 0.25543212890625, 0.2654266357421875, 0.275421142578125, 0.2854156494140625, 0.29541015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 6.0, 2.0, 5.0, 7.0, 7.0, 5.0, 12.0, 11.0, 18.0, 22.0, 28.0, 30.0, 32.0, 26.0, 25.0, 45.0, 39.0, 25.0, 34.0, 47.0, 41.0, 47.0, 32.0, 50.0, 29.0, 44.0, 37.0, 22.0, 40.0, 35.0, 33.0, 32.0, 19.0, 18.0, 15.0, 14.0, 7.0, 13.0, 7.0, 7.0, 5.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6171875, -4.46002197265625, -4.3028564453125, -4.14569091796875, -3.988525390625, -3.83135986328125, -3.6741943359375, -3.51702880859375, -3.35986328125, -3.20269775390625, -3.0455322265625, -2.88836669921875, -2.731201171875, -2.57403564453125, -2.4168701171875, -2.25970458984375, -2.1025390625, -1.94537353515625, -1.7882080078125, -1.63104248046875, -1.473876953125, -1.31671142578125, -1.1595458984375, -1.00238037109375, -0.84521484375, -0.68804931640625, -0.5308837890625, -0.37371826171875, -0.216552734375, -0.05938720703125, 0.0977783203125, 0.25494384765625, 0.412109375, 0.56927490234375, 0.7264404296875, 0.88360595703125, 1.040771484375, 1.19793701171875, 1.3551025390625, 1.51226806640625, 1.66943359375, 1.82659912109375, 1.9837646484375, 2.14093017578125, 2.298095703125, 2.45526123046875, 2.6124267578125, 2.76959228515625, 2.9267578125, 3.08392333984375, 3.2410888671875, 3.39825439453125, 3.555419921875, 3.71258544921875, 3.8697509765625, 4.02691650390625, 4.18408203125, 4.34124755859375, 4.4984130859375, 4.65557861328125, 4.812744140625, 4.96990966796875, 5.1270751953125, 5.28424072265625, 5.44140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 3.0, 9.0, 8.0, 17.0, 30.0, 44.0, 76.0, 111.0, 178.0, 287.0, 497.0, 815.0, 1613.0, 2979.0, 5959.0, 13825.0, 36361.0, 108812.0, 296404.0, 350445.0, 147977.0, 48731.0, 17778.0, 7648.0, 3568.0, 1834.0, 990.0, 583.0, 328.0, 224.0, 147.0, 93.0, 58.0, 32.0, 27.0, 17.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0611572265625, -0.059416770935058594, -0.05767631530761719, -0.05593585968017578, -0.054195404052734375, -0.05245494842529297, -0.05071449279785156, -0.048974037170410156, -0.04723358154296875, -0.045493125915527344, -0.04375267028808594, -0.04201221466064453, -0.040271759033203125, -0.03853130340576172, -0.03679084777832031, -0.035050392150878906, -0.0333099365234375, -0.031569480895996094, -0.029829025268554688, -0.02808856964111328, -0.026348114013671875, -0.02460765838623047, -0.022867202758789062, -0.021126747131347656, -0.01938629150390625, -0.017645835876464844, -0.015905380249023438, -0.014164924621582031, -0.012424468994140625, -0.010684013366699219, -0.008943557739257812, -0.007203102111816406, -0.005462646484375, -0.0037221908569335938, -0.0019817352294921875, -0.00024127960205078125, 0.001499176025390625, 0.0032396316528320312, 0.0049800872802734375, 0.006720542907714844, 0.00846099853515625, 0.010201454162597656, 0.011941909790039062, 0.013682365417480469, 0.015422821044921875, 0.01716327667236328, 0.018903732299804688, 0.020644187927246094, 0.0223846435546875, 0.024125099182128906, 0.025865554809570312, 0.02760601043701172, 0.029346466064453125, 0.03108692169189453, 0.03282737731933594, 0.034567832946777344, 0.03630828857421875, 0.038048744201660156, 0.03978919982910156, 0.04152965545654297, 0.043270111083984375, 0.04501056671142578, 0.04675102233886719, 0.048491477966308594, 0.05023193359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 13.0, 18.0, 18.0, 24.0, 29.0, 37.0, 71.0, 105.0, 111.0, 118.0, 124.0, 89.0, 68.0, 50.0, 27.0, 26.0, 18.0, 16.0, 9.0, 9.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010859966278076172, -0.00010605063289403915, -0.00010350160300731659, -0.00010095257312059402, -9.840354323387146e-05, -9.58545133471489e-05, -9.330548346042633e-05, -9.075645357370377e-05, -8.82074236869812e-05, -8.565839380025864e-05, -8.310936391353607e-05, -8.056033402681351e-05, -7.801130414009094e-05, -7.546227425336838e-05, -7.291324436664581e-05, -7.036421447992325e-05, -6.781518459320068e-05, -6.526615470647812e-05, -6.271712481975555e-05, -6.016809493303299e-05, -5.7619065046310425e-05, -5.507003515958786e-05, -5.2521005272865295e-05, -4.997197538614273e-05, -4.7422945499420166e-05, -4.48739156126976e-05, -4.232488572597504e-05, -3.977585583925247e-05, -3.722682595252991e-05, -3.467779606580734e-05, -3.212876617908478e-05, -2.9579736292362213e-05, -2.703070640563965e-05, -2.4481676518917084e-05, -2.193264663219452e-05, -1.9383616745471954e-05, -1.683458685874939e-05, -1.4285556972026825e-05, -1.173652708530426e-05, -9.187497198581696e-06, -6.638467311859131e-06, -4.089437425136566e-06, -1.5404075384140015e-06, 1.0086223483085632e-06, 3.557652235031128e-06, 6.106682121753693e-06, 8.655712008476257e-06, 1.1204741895198822e-05, 1.3753771781921387e-05, 1.630280166864395e-05, 1.8851831555366516e-05, 2.140086144208908e-05, 2.3949891328811646e-05, 2.649892121553421e-05, 2.9047951102256775e-05, 3.159698098897934e-05, 3.4146010875701904e-05, 3.669504076242447e-05, 3.9244070649147034e-05, 4.17931005358696e-05, 4.434213042259216e-05, 4.689116030931473e-05, 4.944019019603729e-05, 5.198922008275986e-05, 5.453824996948242e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 24.0, 11.0, 17.0, 31.0, 50.0, 93.0, 221.0, 687.0, 3211.0, 25030.0, 370956.0, 599088.0, 42810.0, 4749.0, 980.0, 286.0, 116.0, 56.0, 29.0, 24.0, 18.0, 13.0, 15.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11509895324707031, -0.11069107055664062, -0.10628318786621094, -0.10187530517578125, -0.09746742248535156, -0.09305953979492188, -0.08865165710449219, -0.0842437744140625, -0.07983589172363281, -0.07542800903320312, -0.07102012634277344, -0.06661224365234375, -0.06220436096191406, -0.057796478271484375, -0.05338859558105469, -0.048980712890625, -0.04457283020019531, -0.040164947509765625, -0.03575706481933594, -0.03134918212890625, -0.026941299438476562, -0.022533416748046875, -0.018125534057617188, -0.0137176513671875, -0.009309768676757812, -0.004901885986328125, -0.0004940032958984375, 0.00391387939453125, 0.008321762084960938, 0.012729644775390625, 0.017137527465820312, 0.02154541015625, 0.025953292846679688, 0.030361175537109375, 0.03476905822753906, 0.03917694091796875, 0.04358482360839844, 0.047992706298828125, 0.05240058898925781, 0.0568084716796875, 0.06121635437011719, 0.06562423706054688, 0.07003211975097656, 0.07444000244140625, 0.07884788513183594, 0.08325576782226562, 0.08766365051269531, 0.092071533203125, 0.09647941589355469, 0.10088729858398438, 0.10529518127441406, 0.10970306396484375, 0.11411094665527344, 0.11851882934570312, 0.12292671203613281, 0.1273345947265625, 0.1317424774169922, 0.13615036010742188, 0.14055824279785156, 0.14496612548828125, 0.14937400817871094, 0.15378189086914062, 0.1581897735595703, 0.16259765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 21.0, 12.0, 35.0, 53.0, 48.0, 60.0, 76.0, 88.0, 76.0, 91.0, 86.0, 72.0, 40.0, 48.0, 40.0, 30.0, 20.0, 15.0, 18.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156402587890625, -0.015057086944580078, -0.014473915100097656, -0.013890743255615234, -0.013307571411132812, -0.01272439956665039, -0.012141227722167969, -0.011558055877685547, -0.010974884033203125, -0.010391712188720703, -0.009808540344238281, -0.00922536849975586, -0.008642196655273438, -0.008059024810791016, -0.007475852966308594, -0.006892681121826172, -0.00630950927734375, -0.005726337432861328, -0.005143165588378906, -0.004559993743896484, -0.0039768218994140625, -0.0033936500549316406, -0.0028104782104492188, -0.002227306365966797, -0.001644134521484375, -0.0010609626770019531, -0.00047779083251953125, 0.00010538101196289062, 0.0006885528564453125, 0.0012717247009277344, 0.0018548965454101562, 0.002438068389892578, 0.003021240234375, 0.003604412078857422, 0.004187583923339844, 0.004770755767822266, 0.0053539276123046875, 0.005937099456787109, 0.006520271301269531, 0.007103443145751953, 0.007686614990234375, 0.008269786834716797, 0.008852958679199219, 0.00943613052368164, 0.010019302368164062, 0.010602474212646484, 0.011185646057128906, 0.011768817901611328, 0.01235198974609375, 0.012935161590576172, 0.013518333435058594, 0.014101505279541016, 0.014684677124023438, 0.01526784896850586, 0.01585102081298828, 0.016434192657470703, 0.017017364501953125, 0.017600536346435547, 0.01818370819091797, 0.01876688003540039, 0.019350051879882812, 0.019933223724365234, 0.020516395568847656, 0.021099567413330078, 0.0216827392578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 16.0, 30.0, 42.0, 86.0, 122.0, 153.0, 144.0, 132.0, 114.0, 92.0, 39.0, 21.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.160707473754883, -9.941709518432617, -9.722711563110352, -9.50371265411377, -9.284714698791504, -9.065716743469238, -8.846718788146973, -8.627720832824707, -8.408721923828125, -8.18972396850586, -7.9707255363464355, -7.75172758102417, -7.532729148864746, -7.3137311935424805, -7.094733238220215, -6.875734806060791, -6.656737327575684, -6.437739372253418, -6.218740940093994, -5.9997429847717285, -5.780744552612305, -5.561746597290039, -5.342748641967773, -5.12375020980835, -4.904751777648926, -4.68575382232666, -4.466755390167236, -4.247757434844971, -4.028759002685547, -3.8097610473632812, -3.5907628536224365, -3.371764659881592, -3.152766704559326, -2.9337685108184814, -2.7147703170776367, -2.495772361755371, -2.2767741680145264, -2.0577759742736816, -1.838777780532837, -1.6197797060012817, -1.400781512260437, -1.1817833185195923, -0.9627852439880371, -0.7437870502471924, -0.5247889161109924, -0.3057907819747925, -0.08679258823394775, 0.13220548629760742, 0.35120368003845215, 0.5702018141746521, 0.789199948310852, 1.0081981420516968, 1.227196216583252, 1.4461944103240967, 1.6651926040649414, 1.8841906785964966, 2.103188991546631, 2.3221871852874756, 2.5411853790283203, 2.760183334350586, 2.9791815280914307, 3.1981797218322754, 3.41717791557312, 3.636176109313965, 3.8551740646362305]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 17.0, 9.0, 17.0, 24.0, 19.0, 28.0, 28.0, 31.0, 29.0, 40.0, 35.0, 52.0, 52.0, 50.0, 67.0, 60.0, 57.0, 59.0, 49.0, 53.0, 45.0, 40.0, 27.0, 27.0, 18.0, 14.0, 18.0, 10.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.067600250244141, -3.964730739593506, -3.861861228942871, -3.7589914798736572, -3.6561219692230225, -3.5532524585723877, -3.450382709503174, -3.347513198852539, -3.2446436882019043, -3.1417741775512695, -3.0389046669006348, -2.936034917831421, -2.833165407180786, -2.7302958965301514, -2.6274261474609375, -2.5245566368103027, -2.421687126159668, -2.318817615509033, -2.2159481048583984, -2.1130783557891846, -2.01020884513855, -1.907339334487915, -1.8044697046279907, -1.7016000747680664, -1.5987305641174316, -1.4958610534667969, -1.3929914236068726, -1.2901217937469482, -1.1872522830963135, -1.0843827724456787, -0.9815131425857544, -0.8786435723304749, -0.7757737636566162, -0.6729041934013367, -0.5700346231460571, -0.4671650528907776, -0.36429548263549805, -0.2614259123802185, -0.15855634212493896, -0.055686771869659424, 0.04718279838562012, 0.15005236864089966, 0.2529219388961792, 0.35579150915145874, 0.4586610794067383, 0.5615306496620178, 0.6644002199172974, 0.7672697901725769, 0.8701393604278564, 0.973008930683136, 1.0758785009384155, 1.1787481307983398, 1.2816176414489746, 1.3844871520996094, 1.4873567819595337, 1.590226411819458, 1.6930959224700928, 1.7959654331207275, 1.8988350629806519, 2.001704692840576, 2.104574203491211, 2.2074437141418457, 2.3103132247924805, 2.4131829738616943, 2.516052484512329]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 3.0, 10.0, 7.0, 11.0, 21.0, 24.0, 30.0, 47.0, 64.0, 157.0, 662.0, 4649.0, 58897.0, 504056.0, 431860.0, 43327.0, 3703.0, 583.0, 177.0, 70.0, 47.0, 28.0, 21.0, 25.0, 15.0, 12.0, 7.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.25592041015625, -8.0196533203125, -7.78338623046875, -7.547119140625, -7.31085205078125, -7.0745849609375, -6.83831787109375, -6.60205078125, -6.36578369140625, -6.1295166015625, -5.89324951171875, -5.656982421875, -5.42071533203125, -5.1844482421875, -4.94818115234375, -4.7119140625, -4.47564697265625, -4.2393798828125, -4.00311279296875, -3.766845703125, -3.53057861328125, -3.2943115234375, -3.05804443359375, -2.82177734375, -2.58551025390625, -2.3492431640625, -2.11297607421875, -1.876708984375, -1.64044189453125, -1.4041748046875, -1.16790771484375, -0.931640625, -0.69537353515625, -0.4591064453125, -0.22283935546875, 0.013427734375, 0.24969482421875, 0.4859619140625, 0.72222900390625, 0.95849609375, 1.19476318359375, 1.4310302734375, 1.66729736328125, 1.903564453125, 2.13983154296875, 2.3760986328125, 2.61236572265625, 2.8486328125, 3.08489990234375, 3.3211669921875, 3.55743408203125, 3.793701171875, 4.02996826171875, 4.2662353515625, 4.50250244140625, 4.73876953125, 4.97503662109375, 5.2113037109375, 5.44757080078125, 5.683837890625, 5.92010498046875, 6.1563720703125, 6.39263916015625, 6.62890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 11.0, 12.0, 21.0, 27.0, 27.0, 26.0, 25.0, 21.0, 34.0, 37.0, 42.0, 44.0, 47.0, 47.0, 47.0, 46.0, 46.0, 57.0, 54.0, 38.0, 39.0, 29.0, 35.0, 27.0, 25.0, 24.0, 17.0, 15.0, 12.0, 4.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -5.02825927734375, -4.8729248046875, -4.71759033203125, -4.562255859375, -4.40692138671875, -4.2515869140625, -4.09625244140625, -3.94091796875, -3.78558349609375, -3.6302490234375, -3.47491455078125, -3.319580078125, -3.16424560546875, -3.0089111328125, -2.85357666015625, -2.6982421875, -2.54290771484375, -2.3875732421875, -2.23223876953125, -2.076904296875, -1.92156982421875, -1.7662353515625, -1.61090087890625, -1.45556640625, -1.30023193359375, -1.1448974609375, -0.98956298828125, -0.834228515625, -0.67889404296875, -0.5235595703125, -0.36822509765625, -0.212890625, -0.05755615234375, 0.0977783203125, 0.25311279296875, 0.408447265625, 0.56378173828125, 0.7191162109375, 0.87445068359375, 1.02978515625, 1.18511962890625, 1.3404541015625, 1.49578857421875, 1.651123046875, 1.80645751953125, 1.9617919921875, 2.11712646484375, 2.2724609375, 2.42779541015625, 2.5831298828125, 2.73846435546875, 2.893798828125, 3.04913330078125, 3.2044677734375, 3.35980224609375, 3.51513671875, 3.67047119140625, 3.8258056640625, 3.98114013671875, 4.136474609375, 4.29180908203125, 4.4471435546875, 4.60247802734375, 4.7578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 10.0, 9.0, 9.0, 10.0, 21.0, 20.0, 34.0, 45.0, 57.0, 82.0, 92.0, 142.0, 150.0, 228.0, 288.0, 570.0, 3701.0, 209477.0, 801207.0, 29750.0, 1144.0, 439.0, 292.0, 177.0, 147.0, 111.0, 63.0, 68.0, 55.0, 45.0, 38.0, 23.0, 10.0, 10.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.2572021484375, -10.897216796875, -10.5372314453125, -10.17724609375, -9.8172607421875, -9.457275390625, -9.0972900390625, -8.7373046875, -8.3773193359375, -8.017333984375, -7.6573486328125, -7.29736328125, -6.9373779296875, -6.577392578125, -6.2174072265625, -5.857421875, -5.4974365234375, -5.137451171875, -4.7774658203125, -4.41748046875, -4.0574951171875, -3.697509765625, -3.3375244140625, -2.9775390625, -2.6175537109375, -2.257568359375, -1.8975830078125, -1.53759765625, -1.1776123046875, -0.817626953125, -0.4576416015625, -0.09765625, 0.2623291015625, 0.622314453125, 0.9822998046875, 1.34228515625, 1.7022705078125, 2.062255859375, 2.4222412109375, 2.7822265625, 3.1422119140625, 3.502197265625, 3.8621826171875, 4.22216796875, 4.5821533203125, 4.942138671875, 5.3021240234375, 5.662109375, 6.0220947265625, 6.382080078125, 6.7420654296875, 7.10205078125, 7.4620361328125, 7.822021484375, 8.1820068359375, 8.5419921875, 8.9019775390625, 9.261962890625, 9.6219482421875, 9.98193359375, 10.3419189453125, 10.701904296875, 11.0618896484375, 11.421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 13.0, 7.0, 7.0, 14.0, 11.0, 9.0, 18.0, 18.0, 21.0, 16.0, 28.0, 21.0, 36.0, 42.0, 31.0, 45.0, 37.0, 41.0, 48.0, 44.0, 53.0, 27.0, 42.0, 42.0, 33.0, 45.0, 37.0, 31.0, 28.0, 30.0, 18.0, 19.0, 18.0, 13.0, 13.0, 8.0, 5.0, 3.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.42706298828125, -4.2760009765625, -4.12493896484375, -3.973876953125, -3.82281494140625, -3.6717529296875, -3.52069091796875, -3.36962890625, -3.21856689453125, -3.0675048828125, -2.91644287109375, -2.765380859375, -2.61431884765625, -2.4632568359375, -2.31219482421875, -2.1611328125, -2.01007080078125, -1.8590087890625, -1.70794677734375, -1.556884765625, -1.40582275390625, -1.2547607421875, -1.10369873046875, -0.95263671875, -0.80157470703125, -0.6505126953125, -0.49945068359375, -0.348388671875, -0.19732666015625, -0.0462646484375, 0.10479736328125, 0.255859375, 0.40692138671875, 0.5579833984375, 0.70904541015625, 0.860107421875, 1.01116943359375, 1.1622314453125, 1.31329345703125, 1.46435546875, 1.61541748046875, 1.7664794921875, 1.91754150390625, 2.068603515625, 2.21966552734375, 2.3707275390625, 2.52178955078125, 2.6728515625, 2.82391357421875, 2.9749755859375, 3.12603759765625, 3.277099609375, 3.42816162109375, 3.5792236328125, 3.73028564453125, 3.88134765625, 4.03240966796875, 4.1834716796875, 4.33453369140625, 4.485595703125, 4.63665771484375, 4.7877197265625, 4.93878173828125, 5.08984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 13.0, 15.0, 23.0, 44.0, 100.0, 233.0, 373.0, 1159.0, 9158.0, 488528.0, 537224.0, 9615.0, 1294.0, 374.0, 177.0, 89.0, 48.0, 30.0, 15.0, 8.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.76953125, -4.62506103515625, -4.4805908203125, -4.33612060546875, -4.191650390625, -4.04718017578125, -3.9027099609375, -3.75823974609375, -3.61376953125, -3.46929931640625, -3.3248291015625, -3.18035888671875, -3.035888671875, -2.89141845703125, -2.7469482421875, -2.60247802734375, -2.4580078125, -2.31353759765625, -2.1690673828125, -2.02459716796875, -1.880126953125, -1.73565673828125, -1.5911865234375, -1.44671630859375, -1.30224609375, -1.15777587890625, -1.0133056640625, -0.86883544921875, -0.724365234375, -0.57989501953125, -0.4354248046875, -0.29095458984375, -0.146484375, -0.00201416015625, 0.1424560546875, 0.28692626953125, 0.431396484375, 0.57586669921875, 0.7203369140625, 0.86480712890625, 1.00927734375, 1.15374755859375, 1.2982177734375, 1.44268798828125, 1.587158203125, 1.73162841796875, 1.8760986328125, 2.02056884765625, 2.1650390625, 2.30950927734375, 2.4539794921875, 2.59844970703125, 2.742919921875, 2.88739013671875, 3.0318603515625, 3.17633056640625, 3.32080078125, 3.46527099609375, 3.6097412109375, 3.75421142578125, 3.898681640625, 4.04315185546875, 4.1876220703125, 4.33209228515625, 4.4765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 11.0, 19.0, 30.0, 54.0, 107.0, 152.0, 167.0, 168.0, 104.0, 88.0, 44.0, 18.0, 19.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034332275390625, -0.00032749027013778687, -0.00031165778636932373, -0.0002958253026008606, -0.00027999281883239746, -0.0002641603350639343, -0.0002483278512954712, -0.00023249536752700806, -0.00021666288375854492, -0.0002008303999900818, -0.00018499791622161865, -0.00016916543245315552, -0.00015333294868469238, -0.00013750046491622925, -0.00012166798114776611, -0.00010583549737930298, -9.000301361083984e-05, -7.417052984237671e-05, -5.8338046073913574e-05, -4.250556230545044e-05, -2.6673078536987305e-05, -1.084059476852417e-05, 4.991888999938965e-06, 2.08243727684021e-05, 3.6656856536865234e-05, 5.248934030532837e-05, 6.83218240737915e-05, 8.415430784225464e-05, 9.998679161071777e-05, 0.00011581927537918091, 0.00013165175914764404, 0.00014748424291610718, 0.0001633167266845703, 0.00017914921045303345, 0.00019498169422149658, 0.00021081417798995972, 0.00022664666175842285, 0.00024247914552688599, 0.0002583116292953491, 0.00027414411306381226, 0.0002899765968322754, 0.0003058090806007385, 0.00032164156436920166, 0.0003374740481376648, 0.00035330653190612793, 0.00036913901567459106, 0.0003849714994430542, 0.00040080398321151733, 0.00041663646697998047, 0.0004324689507484436, 0.00044830143451690674, 0.0004641339182853699, 0.000479966402053833, 0.0004957988858222961, 0.0005116313695907593, 0.0005274638533592224, 0.0005432963371276855, 0.0005591288208961487, 0.0005749613046646118, 0.000590793788433075, 0.0006066262722015381, 0.0006224587559700012, 0.0006382912397384644, 0.0006541237235069275, 0.0006699562072753906]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 13.0, 14.0, 18.0, 42.0, 77.0, 108.0, 195.0, 583.0, 4027.0, 144940.0, 882042.0, 14351.0, 1375.0, 351.0, 146.0, 90.0, 45.0, 28.0, 26.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.27642822265625, -5.1075439453125, -4.93865966796875, -4.769775390625, -4.60089111328125, -4.4320068359375, -4.26312255859375, -4.09423828125, -3.92535400390625, -3.7564697265625, -3.58758544921875, -3.418701171875, -3.24981689453125, -3.0809326171875, -2.91204833984375, -2.7431640625, -2.57427978515625, -2.4053955078125, -2.23651123046875, -2.067626953125, -1.89874267578125, -1.7298583984375, -1.56097412109375, -1.39208984375, -1.22320556640625, -1.0543212890625, -0.88543701171875, -0.716552734375, -0.54766845703125, -0.3787841796875, -0.20989990234375, -0.041015625, 0.12786865234375, 0.2967529296875, 0.46563720703125, 0.634521484375, 0.80340576171875, 0.9722900390625, 1.14117431640625, 1.31005859375, 1.47894287109375, 1.6478271484375, 1.81671142578125, 1.985595703125, 2.15447998046875, 2.3233642578125, 2.49224853515625, 2.6611328125, 2.83001708984375, 2.9989013671875, 3.16778564453125, 3.336669921875, 3.50555419921875, 3.6744384765625, 3.84332275390625, 4.01220703125, 4.18109130859375, 4.3499755859375, 4.51885986328125, 4.687744140625, 4.85662841796875, 5.0255126953125, 5.19439697265625, 5.36328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 35.0, 41.0, 61.0, 75.0, 102.0, 112.0, 120.0, 111.0, 89.0, 66.0, 48.0, 25.0, 17.0, 10.0, 11.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9593582153320312, -0.9250640869140625, -0.8907699584960938, -0.856475830078125, -0.8221817016601562, -0.7878875732421875, -0.7535934448242188, -0.71929931640625, -0.6850051879882812, -0.6507110595703125, -0.6164169311523438, -0.582122802734375, -0.5478286743164062, -0.5135345458984375, -0.47924041748046875, -0.4449462890625, -0.41065216064453125, -0.3763580322265625, -0.34206390380859375, -0.307769775390625, -0.27347564697265625, -0.2391815185546875, -0.20488739013671875, -0.17059326171875, -0.13629913330078125, -0.1020050048828125, -0.06771087646484375, -0.033416748046875, 0.00087738037109375, 0.0351715087890625, 0.06946563720703125, 0.103759765625, 0.13805389404296875, 0.1723480224609375, 0.20664215087890625, 0.240936279296875, 0.27523040771484375, 0.3095245361328125, 0.34381866455078125, 0.37811279296875, 0.41240692138671875, 0.4467010498046875, 0.48099517822265625, 0.515289306640625, 0.5495834350585938, 0.5838775634765625, 0.6181716918945312, 0.6524658203125, 0.6867599487304688, 0.7210540771484375, 0.7553482055664062, 0.789642333984375, 0.8239364624023438, 0.8582305908203125, 0.8925247192382812, 0.92681884765625, 0.9611129760742188, 0.9954071044921875, 1.0297012329101562, 1.063995361328125, 1.0982894897460938, 1.1325836181640625, 1.1668777465820312, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 16.0, 14.0, 11.0, 16.0, 30.0, 38.0, 50.0, 66.0, 59.0, 76.0, 86.0, 94.0, 86.0, 82.0, 69.0, 51.0, 44.0, 38.0, 25.0, 9.0, 11.0, 12.0, 5.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.144302368164062, -9.90947437286377, -9.674646377563477, -9.439818382263184, -9.20499038696289, -8.970162391662598, -8.735334396362305, -8.500506401062012, -8.265678405761719, -8.030850410461426, -7.796022415161133, -7.56119441986084, -7.326366424560547, -7.091538429260254, -6.856710433959961, -6.621882915496826, -6.387055397033691, -6.152227401733398, -5.9173994064331055, -5.6825714111328125, -5.4477434158325195, -5.212915420532227, -4.978087425231934, -4.743259906768799, -4.508431434631348, -4.273603439331055, -4.038775444030762, -3.8039474487304688, -3.569119691848755, -3.334291696548462, -3.099463701248169, -2.864635944366455, -2.629807949066162, -2.394979953765869, -2.160151958465576, -1.9253240823745728, -1.6904962062835693, -1.4556682109832764, -1.2208402156829834, -0.98601233959198, -0.751184344291687, -0.5163564085960388, -0.28152844309806824, -0.046700477600097656, 0.18812745809555054, 0.42295539379119873, 0.6577833890914917, 0.8926112651824951, 1.127439260482788, 1.362267255783081, 1.5970951318740845, 1.8319231271743774, 2.066751003265381, 2.301578998565674, 2.536406993865967, 2.7712349891662598, 3.0060629844665527, 3.2408909797668457, 3.4757189750671387, 3.7105469703674316, 3.9453747272491455, 4.180202484130859, 4.415030479431152, 4.649858474731445, 4.884686470031738]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 3.0, 8.0, 9.0, 9.0, 9.0, 17.0, 12.0, 14.0, 15.0, 16.0, 24.0, 24.0, 19.0, 23.0, 30.0, 30.0, 28.0, 36.0, 35.0, 30.0, 37.0, 37.0, 48.0, 38.0, 36.0, 45.0, 37.0, 34.0, 48.0, 32.0, 21.0, 27.0, 34.0, 24.0, 22.0, 14.0, 15.0, 10.0, 12.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59603214263916, -7.35667085647583, -7.117309093475342, -6.877947807312012, -6.638586044311523, -6.399224758148193, -6.159863471984863, -5.920501708984375, -5.681139945983887, -5.441778659820557, -5.202416896820068, -4.963055610656738, -4.72369384765625, -4.48433256149292, -4.24497127532959, -4.005609512329102, -3.7662482261657715, -3.5268867015838623, -3.287525177001953, -3.048163890838623, -2.8088021278381348, -2.5694408416748047, -2.3300793170928955, -2.0907177925109863, -1.8513562679290771, -1.611994743347168, -1.3726332187652588, -1.1332718133926392, -0.89391028881073, -0.6545487642288208, -0.41518735885620117, -0.175825834274292, 0.06353569030761719, 0.302897185087204, 0.5422586798667908, 0.7816201448440552, 1.0209816694259644, 1.2603431940078735, 1.4997045993804932, 1.7390661239624023, 1.9784276485443115, 2.2177891731262207, 2.45715069770813, 2.696512222290039, 2.935873508453369, 3.1752352714538574, 3.4145965576171875, 3.6539580821990967, 3.893319606781006, 4.132680892944336, 4.372042655944824, 4.611403942108154, 4.850765705108643, 5.090126991271973, 5.329488754272461, 5.568850040435791, 5.808211326599121, 6.047572612762451, 6.2869343757629395, 6.5262956619262695, 6.765657424926758, 7.005018711090088, 7.244379997253418, 7.483741760253906, 7.7231035232543945]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 9.0, 12.0, 13.0, 22.0, 27.0, 44.0, 41.0, 67.0, 96.0, 114.0, 159.0, 235.0, 364.0, 897.0, 4041.0, 36543.0, 520048.0, 2663959.0, 891779.0, 66961.0, 6225.0, 1182.0, 450.0, 258.0, 199.0, 131.0, 88.0, 72.0, 56.0, 35.0, 22.0, 26.0, 13.0, 23.0, 14.0, 11.0, 8.0, 5.0, 7.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.1328125, -7.89080810546875, -7.6488037109375, -7.40679931640625, -7.164794921875, -6.92279052734375, -6.6807861328125, -6.43878173828125, -6.19677734375, -5.95477294921875, -5.7127685546875, -5.47076416015625, -5.228759765625, -4.98675537109375, -4.7447509765625, -4.50274658203125, -4.2607421875, -4.01873779296875, -3.7767333984375, -3.53472900390625, -3.292724609375, -3.05072021484375, -2.8087158203125, -2.56671142578125, -2.32470703125, -2.08270263671875, -1.8406982421875, -1.59869384765625, -1.356689453125, -1.11468505859375, -0.8726806640625, -0.63067626953125, -0.388671875, -0.14666748046875, 0.0953369140625, 0.33734130859375, 0.579345703125, 0.82135009765625, 1.0633544921875, 1.30535888671875, 1.54736328125, 1.78936767578125, 2.0313720703125, 2.27337646484375, 2.515380859375, 2.75738525390625, 2.9993896484375, 3.24139404296875, 3.4833984375, 3.72540283203125, 3.9674072265625, 4.20941162109375, 4.451416015625, 4.69342041015625, 4.9354248046875, 5.17742919921875, 5.41943359375, 5.66143798828125, 5.9034423828125, 6.14544677734375, 6.387451171875, 6.62945556640625, 6.8714599609375, 7.11346435546875, 7.35546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 6.0, 13.0, 13.0, 9.0, 17.0, 16.0, 16.0, 30.0, 25.0, 28.0, 22.0, 32.0, 29.0, 37.0, 30.0, 27.0, 48.0, 41.0, 42.0, 38.0, 56.0, 45.0, 49.0, 54.0, 36.0, 39.0, 30.0, 31.0, 23.0, 21.0, 20.0, 15.0, 10.0, 13.0, 5.0, 9.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.507537841796875, -3.38812255859375, -3.268707275390625, -3.1492919921875, -3.029876708984375, -2.91046142578125, -2.791046142578125, -2.671630859375, -2.552215576171875, -2.43280029296875, -2.313385009765625, -2.1939697265625, -2.074554443359375, -1.95513916015625, -1.835723876953125, -1.71630859375, -1.596893310546875, -1.47747802734375, -1.358062744140625, -1.2386474609375, -1.119232177734375, -0.99981689453125, -0.880401611328125, -0.760986328125, -0.641571044921875, -0.52215576171875, -0.402740478515625, -0.2833251953125, -0.163909912109375, -0.04449462890625, 0.074920654296875, 0.1943359375, 0.313751220703125, 0.43316650390625, 0.552581787109375, 0.6719970703125, 0.791412353515625, 0.91082763671875, 1.030242919921875, 1.149658203125, 1.269073486328125, 1.38848876953125, 1.507904052734375, 1.6273193359375, 1.746734619140625, 1.86614990234375, 1.985565185546875, 2.10498046875, 2.224395751953125, 2.34381103515625, 2.463226318359375, 2.5826416015625, 2.702056884765625, 2.82147216796875, 2.940887451171875, 3.060302734375, 3.179718017578125, 3.29913330078125, 3.418548583984375, 3.5379638671875, 3.657379150390625, 3.77679443359375, 3.896209716796875, 4.015625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 16.0, 29.0, 39.0, 70.0, 102.0, 269.0, 490.0, 1132.0, 3714.0, 107628.0, 3957419.0, 117314.0, 3872.0, 1122.0, 471.0, 221.0, 147.0, 69.0, 45.0, 27.0, 17.0, 20.0, 11.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.544677734375, -9.12060546875, -8.696533203125, -8.2724609375, -7.848388671875, -7.42431640625, -7.000244140625, -6.576171875, -6.152099609375, -5.72802734375, -5.303955078125, -4.8798828125, -4.455810546875, -4.03173828125, -3.607666015625, -3.18359375, -2.759521484375, -2.33544921875, -1.911376953125, -1.4873046875, -1.063232421875, -0.63916015625, -0.215087890625, 0.208984375, 0.633056640625, 1.05712890625, 1.481201171875, 1.9052734375, 2.329345703125, 2.75341796875, 3.177490234375, 3.6015625, 4.025634765625, 4.44970703125, 4.873779296875, 5.2978515625, 5.721923828125, 6.14599609375, 6.570068359375, 6.994140625, 7.418212890625, 7.84228515625, 8.266357421875, 8.6904296875, 9.114501953125, 9.53857421875, 9.962646484375, 10.38671875, 10.810791015625, 11.23486328125, 11.658935546875, 12.0830078125, 12.507080078125, 12.93115234375, 13.355224609375, 13.779296875, 14.203369140625, 14.62744140625, 15.051513671875, 15.4755859375, 15.899658203125, 16.32373046875, 16.747802734375, 17.171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 9.0, 16.0, 24.0, 22.0, 39.0, 58.0, 83.0, 130.0, 178.0, 284.0, 385.0, 461.0, 555.0, 472.0, 430.0, 290.0, 220.0, 141.0, 97.0, 55.0, 31.0, 28.0, 19.0, 13.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.66796875, -2.606658935546875, -2.54534912109375, -2.484039306640625, -2.4227294921875, -2.361419677734375, -2.30010986328125, -2.238800048828125, -2.177490234375, -2.116180419921875, -2.05487060546875, -1.993560791015625, -1.9322509765625, -1.870941162109375, -1.80963134765625, -1.748321533203125, -1.68701171875, -1.625701904296875, -1.56439208984375, -1.503082275390625, -1.4417724609375, -1.380462646484375, -1.31915283203125, -1.257843017578125, -1.196533203125, -1.135223388671875, -1.07391357421875, -1.012603759765625, -0.9512939453125, -0.889984130859375, -0.82867431640625, -0.767364501953125, -0.7060546875, -0.644744873046875, -0.58343505859375, -0.522125244140625, -0.4608154296875, -0.399505615234375, -0.33819580078125, -0.276885986328125, -0.215576171875, -0.154266357421875, -0.09295654296875, -0.031646728515625, 0.0296630859375, 0.090972900390625, 0.15228271484375, 0.213592529296875, 0.27490234375, 0.336212158203125, 0.39752197265625, 0.458831787109375, 0.5201416015625, 0.581451416015625, 0.64276123046875, 0.704071044921875, 0.765380859375, 0.826690673828125, 0.88800048828125, 0.949310302734375, 1.0106201171875, 1.071929931640625, 1.13323974609375, 1.194549560546875, 1.255859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 15.0, 37.0, 55.0, 116.0, 163.0, 180.0, 173.0, 119.0, 72.0, 45.0, 13.0, 13.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.672292709350586, -13.251670837402344, -12.831049919128418, -12.410428047180176, -11.989806175231934, -11.569185256958008, -11.148563385009766, -10.727941513061523, -10.307319641113281, -9.886697769165039, -9.466076850891113, -9.045454978942871, -8.624833106994629, -8.204212188720703, -7.783590316772461, -7.362968444824219, -6.942347049713135, -6.521725654602051, -6.101103782653809, -5.680482387542725, -5.259860515594482, -4.839239120483398, -4.418617248535156, -3.9979958534240723, -3.577374219894409, -3.156752586364746, -2.736130952835083, -2.31550931930542, -1.8948878049850464, -1.4742662906646729, -1.0536446571350098, -0.6330230236053467, -0.2124013900756836, 0.2082202136516571, 0.6288418173789978, 1.0494633913040161, 1.4700850248336792, 1.8907065391540527, 2.311328172683716, 2.731949806213379, 3.152571439743042, 3.573193073272705, 3.993814706802368, 4.414436340332031, 4.835057735443115, 5.255679130554199, 5.676301002502441, 6.096922874450684, 6.517544269561768, 6.938165664672852, 7.358787536621094, 7.779408931732178, 8.200030326843262, 8.620652198791504, 9.041274070739746, 9.461894989013672, 9.882516860961914, 10.303138732910156, 10.723759651184082, 11.144381523132324, 11.565003395080566, 11.985624313354492, 12.406246185302734, 12.826868057250977, 13.247489929199219]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 4.0, 11.0, 17.0, 22.0, 17.0, 18.0, 24.0, 29.0, 20.0, 23.0, 29.0, 36.0, 36.0, 29.0, 40.0, 37.0, 49.0, 46.0, 56.0, 42.0, 40.0, 46.0, 36.0, 49.0, 28.0, 36.0, 23.0, 30.0, 20.0, 19.0, 18.0, 16.0, 7.0, 5.0, 10.0, 10.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.525993824005127, -3.3983798027038574, -3.270765781402588, -3.1431517601013184, -3.015537738800049, -2.8879237174987793, -2.7603094577789307, -2.632695436477661, -2.5050814151763916, -2.377467393875122, -2.2498533725738525, -2.122239351272583, -1.994625210762024, -1.8670111894607544, -1.7393970489501953, -1.6117830276489258, -1.4841690063476562, -1.3565549850463867, -1.2289409637451172, -1.101326823234558, -0.9737128019332886, -0.846098780632019, -0.7184846997261047, -0.5908706188201904, -0.4632565975189209, -0.335642546415329, -0.20802849531173706, -0.08041444420814514, 0.04719960689544678, 0.1748136281967163, 0.3024277091026306, 0.4300417900085449, 0.5576558113098145, 0.685269832611084, 0.8128839135169983, 0.9404979944229126, 1.0681120157241821, 1.1957260370254517, 1.3233401775360107, 1.4509541988372803, 1.5785682201385498, 1.7061822414398193, 1.8337962627410889, 1.961410403251648, 2.089024543762207, 2.2166385650634766, 2.344252586364746, 2.4718666076660156, 2.599480628967285, 2.7270946502685547, 2.854708671569824, 2.9823226928710938, 3.1099367141723633, 3.237550735473633, 3.3651649951934814, 3.492779016494751, 3.6203930377960205, 3.74800705909729, 3.8756210803985596, 4.003235340118408, 4.130849361419678, 4.258463382720947, 4.386077404022217, 4.513691425323486, 4.641305446624756]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 10.0, 11.0, 12.0, 21.0, 30.0, 47.0, 73.0, 118.0, 172.0, 323.0, 532.0, 1059.0, 2108.0, 4655.0, 11643.0, 30944.0, 83954.0, 208795.0, 329231.0, 225459.0, 92658.0, 33966.0, 12675.0, 5124.0, 2335.0, 1112.0, 596.0, 342.0, 197.0, 123.0, 70.0, 62.0, 35.0, 18.0, 14.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61328125, -0.595001220703125, -0.57672119140625, -0.558441162109375, -0.5401611328125, -0.521881103515625, -0.50360107421875, -0.485321044921875, -0.467041015625, -0.448760986328125, -0.43048095703125, -0.412200927734375, -0.3939208984375, -0.375640869140625, -0.35736083984375, -0.339080810546875, -0.32080078125, -0.302520751953125, -0.28424072265625, -0.265960693359375, -0.2476806640625, -0.229400634765625, -0.21112060546875, -0.192840576171875, -0.174560546875, -0.156280517578125, -0.13800048828125, -0.119720458984375, -0.1014404296875, -0.083160400390625, -0.06488037109375, -0.046600341796875, -0.0283203125, -0.010040283203125, 0.00823974609375, 0.026519775390625, 0.0447998046875, 0.063079833984375, 0.08135986328125, 0.099639892578125, 0.117919921875, 0.136199951171875, 0.15447998046875, 0.172760009765625, 0.1910400390625, 0.209320068359375, 0.22760009765625, 0.245880126953125, 0.26416015625, 0.282440185546875, 0.30072021484375, 0.319000244140625, 0.3372802734375, 0.355560302734375, 0.37384033203125, 0.392120361328125, 0.410400390625, 0.428680419921875, 0.44696044921875, 0.465240478515625, 0.4835205078125, 0.501800537109375, 0.52008056640625, 0.538360595703125, 0.556640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 13.0, 21.0, 20.0, 29.0, 19.0, 30.0, 39.0, 34.0, 36.0, 42.0, 50.0, 54.0, 41.0, 61.0, 53.0, 61.0, 58.0, 48.0, 49.0, 40.0, 42.0, 29.0, 17.0, 15.0, 15.0, 17.0, 16.0, 10.0, 9.0, 1.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57379150390625, -2.4639892578125, -2.35418701171875, -2.244384765625, -2.13458251953125, -2.0247802734375, -1.91497802734375, -1.80517578125, -1.69537353515625, -1.5855712890625, -1.47576904296875, -1.365966796875, -1.25616455078125, -1.1463623046875, -1.03656005859375, -0.9267578125, -0.81695556640625, -0.7071533203125, -0.59735107421875, -0.487548828125, -0.37774658203125, -0.2679443359375, -0.15814208984375, -0.04833984375, 0.06146240234375, 0.1712646484375, 0.28106689453125, 0.390869140625, 0.50067138671875, 0.6104736328125, 0.72027587890625, 0.830078125, 0.93988037109375, 1.0496826171875, 1.15948486328125, 1.269287109375, 1.37908935546875, 1.4888916015625, 1.59869384765625, 1.70849609375, 1.81829833984375, 1.9281005859375, 2.03790283203125, 2.147705078125, 2.25750732421875, 2.3673095703125, 2.47711181640625, 2.5869140625, 2.69671630859375, 2.8065185546875, 2.91632080078125, 3.026123046875, 3.13592529296875, 3.2457275390625, 3.35552978515625, 3.46533203125, 3.57513427734375, 3.6849365234375, 3.79473876953125, 3.904541015625, 4.01434326171875, 4.1241455078125, 4.23394775390625, 4.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 13.0, 20.0, 31.0, 50.0, 100.0, 185.0, 440.0, 934.0, 2126.0, 4938.0, 10851.0, 23727.0, 51615.0, 103441.0, 178520.0, 233081.0, 200045.0, 122063.0, 62455.0, 29608.0, 13504.0, 5959.0, 2700.0, 1161.0, 494.0, 237.0, 100.0, 65.0, 28.0, 17.0, 10.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319091796875, -0.3079490661621094, -0.29680633544921875, -0.2856636047363281, -0.2745208740234375, -0.2633781433105469, -0.25223541259765625, -0.24109268188476562, -0.229949951171875, -0.21880722045898438, -0.20766448974609375, -0.19652175903320312, -0.1853790283203125, -0.17423629760742188, -0.16309356689453125, -0.15195083618164062, -0.14080810546875, -0.12966537475585938, -0.11852264404296875, -0.10737991333007812, -0.0962371826171875, -0.08509445190429688, -0.07395172119140625, -0.06280899047851562, -0.051666259765625, -0.040523529052734375, -0.02938079833984375, -0.018238067626953125, -0.0070953369140625, 0.004047393798828125, 0.01519012451171875, 0.026332855224609375, 0.0374755859375, 0.048618316650390625, 0.05976104736328125, 0.07090377807617188, 0.0820465087890625, 0.09318923950195312, 0.10433197021484375, 0.11547470092773438, 0.126617431640625, 0.13776016235351562, 0.14890289306640625, 0.16004562377929688, 0.1711883544921875, 0.18233108520507812, 0.19347381591796875, 0.20461654663085938, 0.21575927734375, 0.22690200805664062, 0.23804473876953125, 0.24918746948242188, 0.2603302001953125, 0.2714729309082031, 0.28261566162109375, 0.2937583923339844, 0.304901123046875, 0.3160438537597656, 0.32718658447265625, 0.3383293151855469, 0.3494720458984375, 0.3606147766113281, 0.37175750732421875, 0.3829002380371094, 0.39404296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 4.0, 10.0, 11.0, 11.0, 17.0, 18.0, 22.0, 20.0, 27.0, 32.0, 34.0, 54.0, 61.0, 34.0, 37.0, 46.0, 46.0, 47.0, 57.0, 50.0, 39.0, 36.0, 49.0, 39.0, 31.0, 26.0, 25.0, 11.0, 22.0, 10.0, 13.0, 12.0, 12.0, 7.0, 2.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.22265625, -6.0350341796875, -5.847412109375, -5.6597900390625, -5.47216796875, -5.2845458984375, -5.096923828125, -4.9093017578125, -4.7216796875, -4.5340576171875, -4.346435546875, -4.1588134765625, -3.97119140625, -3.7835693359375, -3.595947265625, -3.4083251953125, -3.220703125, -3.0330810546875, -2.845458984375, -2.6578369140625, -2.47021484375, -2.2825927734375, -2.094970703125, -1.9073486328125, -1.7197265625, -1.5321044921875, -1.344482421875, -1.1568603515625, -0.96923828125, -0.7816162109375, -0.593994140625, -0.4063720703125, -0.21875, -0.0311279296875, 0.156494140625, 0.3441162109375, 0.53173828125, 0.7193603515625, 0.906982421875, 1.0946044921875, 1.2822265625, 1.4698486328125, 1.657470703125, 1.8450927734375, 2.03271484375, 2.2203369140625, 2.407958984375, 2.5955810546875, 2.783203125, 2.9708251953125, 3.158447265625, 3.3460693359375, 3.53369140625, 3.7213134765625, 3.908935546875, 4.0965576171875, 4.2841796875, 4.4718017578125, 4.659423828125, 4.8470458984375, 5.03466796875, 5.2222900390625, 5.409912109375, 5.5975341796875, 5.78515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 12.0, 13.0, 28.0, 30.0, 58.0, 112.0, 172.0, 251.0, 441.0, 597.0, 1071.0, 2083.0, 4085.0, 8684.0, 21257.0, 62843.0, 215208.0, 444229.0, 194137.0, 56897.0, 19597.0, 8229.0, 3901.0, 1929.0, 1113.0, 556.0, 353.0, 236.0, 147.0, 96.0, 58.0, 45.0, 25.0, 17.0, 13.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08323097229003906, -0.08058547973632812, -0.07793998718261719, -0.07529449462890625, -0.07264900207519531, -0.07000350952148438, -0.06735801696777344, -0.0647125244140625, -0.06206703186035156, -0.059421539306640625, -0.05677604675292969, -0.05413055419921875, -0.05148506164550781, -0.048839569091796875, -0.04619407653808594, -0.043548583984375, -0.04090309143066406, -0.038257598876953125, -0.03561210632324219, -0.03296661376953125, -0.030321121215820312, -0.027675628662109375, -0.025030136108398438, -0.0223846435546875, -0.019739151000976562, -0.017093658447265625, -0.014448165893554688, -0.01180267333984375, -0.009157180786132812, -0.006511688232421875, -0.0038661956787109375, -0.001220703125, 0.0014247894287109375, 0.004070281982421875, 0.0067157745361328125, 0.00936126708984375, 0.012006759643554688, 0.014652252197265625, 0.017297744750976562, 0.0199432373046875, 0.022588729858398438, 0.025234222412109375, 0.027879714965820312, 0.03052520751953125, 0.03317070007324219, 0.035816192626953125, 0.03846168518066406, 0.041107177734375, 0.04375267028808594, 0.046398162841796875, 0.04904365539550781, 0.05168914794921875, 0.05433464050292969, 0.056980133056640625, 0.05962562561035156, 0.0622711181640625, 0.06491661071777344, 0.06756210327148438, 0.07020759582519531, 0.07285308837890625, 0.07549858093261719, 0.07814407348632812, 0.08078956604003906, 0.08343505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 20.0, 33.0, 41.0, 59.0, 81.0, 154.0, 134.0, 126.0, 93.0, 72.0, 48.0, 31.0, 16.0, 19.0, 13.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001087188720703125, -0.00010549649596214294, -0.00010227411985397339, -9.905174374580383e-05, -9.582936763763428e-05, -9.260699152946472e-05, -8.938461542129517e-05, -8.616223931312561e-05, -8.293986320495605e-05, -7.97174870967865e-05, -7.649511098861694e-05, -7.327273488044739e-05, -7.005035877227783e-05, -6.682798266410828e-05, -6.360560655593872e-05, -6.0383230447769165e-05, -5.716085433959961e-05, -5.3938478231430054e-05, -5.07161021232605e-05, -4.749372601509094e-05, -4.427134990692139e-05, -4.104897379875183e-05, -3.7826597690582275e-05, -3.460422158241272e-05, -3.1381845474243164e-05, -2.815946936607361e-05, -2.4937093257904053e-05, -2.1714717149734497e-05, -1.849234104156494e-05, -1.5269964933395386e-05, -1.204758882522583e-05, -8.825212717056274e-06, -5.602836608886719e-06, -2.380460500717163e-06, 8.419156074523926e-07, 4.064291715621948e-06, 7.286667823791504e-06, 1.050904393196106e-05, 1.3731420040130615e-05, 1.695379614830017e-05, 2.0176172256469727e-05, 2.3398548364639282e-05, 2.6620924472808838e-05, 2.9843300580978394e-05, 3.306567668914795e-05, 3.6288052797317505e-05, 3.951042890548706e-05, 4.2732805013656616e-05, 4.595518112182617e-05, 4.917755722999573e-05, 5.239993333816528e-05, 5.562230944633484e-05, 5.8844685554504395e-05, 6.206706166267395e-05, 6.52894377708435e-05, 6.851181387901306e-05, 7.173418998718262e-05, 7.495656609535217e-05, 7.817894220352173e-05, 8.140131831169128e-05, 8.462369441986084e-05, 8.78460705280304e-05, 9.106844663619995e-05, 9.429082274436951e-05, 9.751319885253906e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 5.0, 7.0, 7.0, 15.0, 10.0, 16.0, 33.0, 32.0, 51.0, 86.0, 155.0, 361.0, 816.0, 2411.0, 7835.0, 35408.0, 291620.0, 615082.0, 75236.0, 13468.0, 3643.0, 1285.0, 447.0, 202.0, 109.0, 52.0, 40.0, 34.0, 23.0, 15.0, 11.0, 6.0, 10.0, 1.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1688232421875, -0.16415977478027344, -0.15949630737304688, -0.1548328399658203, -0.15016937255859375, -0.1455059051513672, -0.14084243774414062, -0.13617897033691406, -0.1315155029296875, -0.12685203552246094, -0.12218856811523438, -0.11752510070800781, -0.11286163330078125, -0.10819816589355469, -0.10353469848632812, -0.09887123107910156, -0.094207763671875, -0.08954429626464844, -0.08488082885742188, -0.08021736145019531, -0.07555389404296875, -0.07089042663574219, -0.06622695922851562, -0.06156349182128906, -0.0569000244140625, -0.05223655700683594, -0.047573089599609375, -0.04290962219238281, -0.03824615478515625, -0.03358268737792969, -0.028919219970703125, -0.024255752563476562, -0.01959228515625, -0.014928817749023438, -0.010265350341796875, -0.0056018829345703125, -0.00093841552734375, 0.0037250518798828125, 0.008388519287109375, 0.013051986694335938, 0.0177154541015625, 0.022378921508789062, 0.027042388916015625, 0.03170585632324219, 0.03636932373046875, 0.04103279113769531, 0.045696258544921875, 0.05035972595214844, 0.055023193359375, 0.05968666076660156, 0.06435012817382812, 0.06901359558105469, 0.07367706298828125, 0.07834053039550781, 0.08300399780273438, 0.08766746520996094, 0.0923309326171875, 0.09699440002441406, 0.10165786743164062, 0.10632133483886719, 0.11098480224609375, 0.11564826965332031, 0.12031173706054688, 0.12497520446777344, 0.129638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 10.0, 8.0, 18.0, 9.0, 9.0, 25.0, 27.0, 32.0, 38.0, 57.0, 55.0, 51.0, 82.0, 81.0, 84.0, 67.0, 69.0, 49.0, 47.0, 46.0, 27.0, 26.0, 17.0, 11.0, 1.0, 12.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.030487060546875, -0.029604673385620117, -0.028722286224365234, -0.02783989906311035, -0.02695751190185547, -0.026075124740600586, -0.025192737579345703, -0.02431035041809082, -0.023427963256835938, -0.022545576095581055, -0.021663188934326172, -0.02078080177307129, -0.019898414611816406, -0.019016027450561523, -0.01813364028930664, -0.017251253128051758, -0.016368865966796875, -0.015486478805541992, -0.01460409164428711, -0.013721704483032227, -0.012839317321777344, -0.011956930160522461, -0.011074542999267578, -0.010192155838012695, -0.009309768676757812, -0.00842738151550293, -0.007544994354248047, -0.006662607192993164, -0.005780220031738281, -0.0048978328704833984, -0.004015445709228516, -0.003133058547973633, -0.00225067138671875, -0.0013682842254638672, -0.0004858970642089844, 0.00039649009704589844, 0.0012788772583007812, 0.002161264419555664, 0.003043651580810547, 0.00392603874206543, 0.0048084259033203125, 0.005690813064575195, 0.006573200225830078, 0.007455587387084961, 0.008337974548339844, 0.009220361709594727, 0.01010274887084961, 0.010985136032104492, 0.011867523193359375, 0.012749910354614258, 0.01363229751586914, 0.014514684677124023, 0.015397071838378906, 0.01627945899963379, 0.017161846160888672, 0.018044233322143555, 0.018926620483398438, 0.01980900764465332, 0.020691394805908203, 0.021573781967163086, 0.02245616912841797, 0.02333855628967285, 0.024220943450927734, 0.025103330612182617, 0.0259857177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 9.0, 45.0, 219.0, 450.0, 238.0, 49.0, 7.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.95737838745117, -35.32083511352539, -34.68429183959961, -34.04774475097656, -33.41120147705078, -32.774658203125, -32.13811492919922, -31.501569747924805, -30.865026473999023, -30.228483200073242, -29.591938018798828, -28.955394744873047, -28.318849563598633, -27.68230628967285, -27.045761108398438, -26.409217834472656, -25.772674560546875, -25.136131286621094, -24.49958610534668, -23.8630428314209, -23.226497650146484, -22.589954376220703, -21.953411102294922, -21.316865921020508, -20.680320739746094, -20.043777465820312, -19.4072322845459, -18.770689010620117, -18.134143829345703, -17.497600555419922, -16.86105728149414, -16.224512100219727, -15.587968826293945, -14.951424598693848, -14.31488037109375, -13.678337097167969, -13.041792869567871, -12.405248641967773, -11.768704414367676, -11.132160186767578, -10.495616912841797, -9.8590726852417, -9.222528457641602, -8.58598518371582, -7.949440956115723, -7.312896728515625, -6.676352500915527, -6.039808750152588, -5.40326452255249, -4.766720294952393, -4.130176544189453, -3.4936323165893555, -2.857088327407837, -2.2205443382263184, -1.5840001106262207, -0.9474563598632812, -0.3109121322631836, 0.32563191652297974, 0.9621759653091431, 1.5987200736999512, 2.2352640628814697, 2.8718080520629883, 3.508352279663086, 4.144896030426025, 4.781440258026123]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 7.0, 8.0, 9.0, 21.0, 16.0, 20.0, 25.0, 26.0, 24.0, 24.0, 29.0, 37.0, 38.0, 30.0, 34.0, 41.0, 50.0, 48.0, 60.0, 45.0, 42.0, 49.0, 37.0, 43.0, 31.0, 33.0, 20.0, 28.0, 24.0, 22.0, 16.0, 11.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5625016689300537, -2.472991943359375, -2.3834822177886963, -2.2939724922180176, -2.204462766647339, -2.11495304107666, -2.0254435539245605, -1.9359337091445923, -1.8464239835739136, -1.7569142580032349, -1.6674045324325562, -1.577894926071167, -1.4883852005004883, -1.3988754749298096, -1.3093657493591309, -1.2198560237884521, -1.1303462982177734, -1.0408365726470947, -0.951326847076416, -0.8618171811103821, -0.7723074555397034, -0.6827977299690247, -0.5932880640029907, -0.503778338432312, -0.4142686128616333, -0.3247588872909546, -0.23524919152259827, -0.14573949575424194, -0.05622977018356323, 0.03327995538711548, 0.12278962135314941, 0.21229934692382812, 0.30180931091308594, 0.39131903648376465, 0.48082873225212097, 0.5703384280204773, 0.659848153591156, 0.7493578791618347, 0.8388675451278687, 0.9283772706985474, 1.017886996269226, 1.1073967218399048, 1.1969064474105835, 1.2864160537719727, 1.3759257793426514, 1.46543550491333, 1.5549452304840088, 1.6444549560546875, 1.7339646816253662, 1.823474407196045, 1.9129841327667236, 2.0024938583374023, 2.092003583908081, 2.1815133094787598, 2.2710227966308594, 2.360532760620117, 2.450042247772217, 2.5395519733428955, 2.629061698913574, 2.718571424484253, 2.8080811500549316, 2.8975908756256104, 2.987100601196289, 3.0766100883483887, 3.1661200523376465]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 8.0, 9.0, 17.0, 12.0, 14.0, 19.0, 15.0, 25.0, 52.0, 86.0, 124.0, 309.0, 900.0, 3274.0, 17087.0, 104966.0, 432315.0, 387381.0, 84145.0, 13590.0, 2783.0, 761.0, 267.0, 134.0, 82.0, 37.0, 26.0, 23.0, 9.0, 7.0, 13.0, 14.0, 13.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.08984375, -4.93048095703125, -4.7711181640625, -4.61175537109375, -4.452392578125, -4.29302978515625, -4.1336669921875, -3.97430419921875, -3.81494140625, -3.65557861328125, -3.4962158203125, -3.33685302734375, -3.177490234375, -3.01812744140625, -2.8587646484375, -2.69940185546875, -2.5400390625, -2.38067626953125, -2.2213134765625, -2.06195068359375, -1.902587890625, -1.74322509765625, -1.5838623046875, -1.42449951171875, -1.26513671875, -1.10577392578125, -0.9464111328125, -0.78704833984375, -0.627685546875, -0.46832275390625, -0.3089599609375, -0.14959716796875, 0.009765625, 0.16912841796875, 0.3284912109375, 0.48785400390625, 0.647216796875, 0.80657958984375, 0.9659423828125, 1.12530517578125, 1.28466796875, 1.44403076171875, 1.6033935546875, 1.76275634765625, 1.922119140625, 2.08148193359375, 2.2408447265625, 2.40020751953125, 2.5595703125, 2.71893310546875, 2.8782958984375, 3.03765869140625, 3.197021484375, 3.35638427734375, 3.5157470703125, 3.67510986328125, 3.83447265625, 3.99383544921875, 4.1531982421875, 4.31256103515625, 4.471923828125, 4.63128662109375, 4.7906494140625, 4.95001220703125, 5.109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 3.0, 12.0, 6.0, 1.0, 6.0, 15.0, 16.0, 19.0, 20.0, 22.0, 21.0, 22.0, 31.0, 27.0, 29.0, 34.0, 48.0, 42.0, 38.0, 46.0, 55.0, 40.0, 51.0, 47.0, 40.0, 36.0, 30.0, 24.0, 32.0, 33.0, 34.0, 18.0, 22.0, 12.0, 12.0, 12.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.265625, -4.116455078125, -3.96728515625, -3.818115234375, -3.6689453125, -3.519775390625, -3.37060546875, -3.221435546875, -3.072265625, -2.923095703125, -2.77392578125, -2.624755859375, -2.4755859375, -2.326416015625, -2.17724609375, -2.028076171875, -1.87890625, -1.729736328125, -1.58056640625, -1.431396484375, -1.2822265625, -1.133056640625, -0.98388671875, -0.834716796875, -0.685546875, -0.536376953125, -0.38720703125, -0.238037109375, -0.0888671875, 0.060302734375, 0.20947265625, 0.358642578125, 0.5078125, 0.656982421875, 0.80615234375, 0.955322265625, 1.1044921875, 1.253662109375, 1.40283203125, 1.552001953125, 1.701171875, 1.850341796875, 1.99951171875, 2.148681640625, 2.2978515625, 2.447021484375, 2.59619140625, 2.745361328125, 2.89453125, 3.043701171875, 3.19287109375, 3.342041015625, 3.4912109375, 3.640380859375, 3.78955078125, 3.938720703125, 4.087890625, 4.237060546875, 4.38623046875, 4.535400390625, 4.6845703125, 4.833740234375, 4.98291015625, 5.132080078125, 5.28125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 13.0, 16.0, 12.0, 12.0, 15.0, 17.0, 21.0, 27.0, 38.0, 54.0, 66.0, 86.0, 131.0, 231.0, 307.0, 589.0, 3251.0, 136368.0, 845836.0, 58041.0, 1884.0, 520.0, 271.0, 163.0, 132.0, 119.0, 68.0, 60.0, 33.0, 33.0, 21.0, 16.0, 21.0, 13.0, 7.0, 12.0, 6.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 5.0, 3.0, 0.0, 1.0], "bins": [-11.1171875, -10.8031005859375, -10.489013671875, -10.1749267578125, -9.86083984375, -9.5467529296875, -9.232666015625, -8.9185791015625, -8.6044921875, -8.2904052734375, -7.976318359375, -7.6622314453125, -7.34814453125, -7.0340576171875, -6.719970703125, -6.4058837890625, -6.091796875, -5.7777099609375, -5.463623046875, -5.1495361328125, -4.83544921875, -4.5213623046875, -4.207275390625, -3.8931884765625, -3.5791015625, -3.2650146484375, -2.950927734375, -2.6368408203125, -2.32275390625, -2.0086669921875, -1.694580078125, -1.3804931640625, -1.06640625, -0.7523193359375, -0.438232421875, -0.1241455078125, 0.18994140625, 0.5040283203125, 0.818115234375, 1.1322021484375, 1.4462890625, 1.7603759765625, 2.074462890625, 2.3885498046875, 2.70263671875, 3.0167236328125, 3.330810546875, 3.6448974609375, 3.958984375, 4.2730712890625, 4.587158203125, 4.9012451171875, 5.21533203125, 5.5294189453125, 5.843505859375, 6.1575927734375, 6.4716796875, 6.7857666015625, 7.099853515625, 7.4139404296875, 7.72802734375, 8.0421142578125, 8.356201171875, 8.6702880859375, 8.984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 11.0, 5.0, 12.0, 4.0, 11.0, 21.0, 23.0, 31.0, 30.0, 27.0, 44.0, 52.0, 41.0, 55.0, 40.0, 50.0, 43.0, 45.0, 39.0, 43.0, 43.0, 43.0, 33.0, 35.0, 24.0, 34.0, 19.0, 13.0, 13.0, 18.0, 14.0, 10.0, 9.0, 6.0, 10.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.8828125, -5.71270751953125, -5.5426025390625, -5.37249755859375, -5.202392578125, -5.03228759765625, -4.8621826171875, -4.69207763671875, -4.52197265625, -4.35186767578125, -4.1817626953125, -4.01165771484375, -3.841552734375, -3.67144775390625, -3.5013427734375, -3.33123779296875, -3.1611328125, -2.99102783203125, -2.8209228515625, -2.65081787109375, -2.480712890625, -2.31060791015625, -2.1405029296875, -1.97039794921875, -1.80029296875, -1.63018798828125, -1.4600830078125, -1.28997802734375, -1.119873046875, -0.94976806640625, -0.7796630859375, -0.60955810546875, -0.439453125, -0.26934814453125, -0.0992431640625, 0.07086181640625, 0.240966796875, 0.41107177734375, 0.5811767578125, 0.75128173828125, 0.92138671875, 1.09149169921875, 1.2615966796875, 1.43170166015625, 1.601806640625, 1.77191162109375, 1.9420166015625, 2.11212158203125, 2.2822265625, 2.45233154296875, 2.6224365234375, 2.79254150390625, 2.962646484375, 3.13275146484375, 3.3028564453125, 3.47296142578125, 3.64306640625, 3.81317138671875, 3.9832763671875, 4.15338134765625, 4.323486328125, 4.49359130859375, 4.6636962890625, 4.83380126953125, 5.00390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 4.0, 9.0, 9.0, 9.0, 22.0, 49.0, 101.0, 270.0, 946.0, 7025.0, 631672.0, 401533.0, 5591.0, 860.0, 214.0, 100.0, 48.0, 34.0, 16.0, 10.0, 5.0, 7.0, 2.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.77734375, -6.60333251953125, -6.4293212890625, -6.25531005859375, -6.081298828125, -5.90728759765625, -5.7332763671875, -5.55926513671875, -5.38525390625, -5.21124267578125, -5.0372314453125, -4.86322021484375, -4.689208984375, -4.51519775390625, -4.3411865234375, -4.16717529296875, -3.9931640625, -3.81915283203125, -3.6451416015625, -3.47113037109375, -3.297119140625, -3.12310791015625, -2.9490966796875, -2.77508544921875, -2.60107421875, -2.42706298828125, -2.2530517578125, -2.07904052734375, -1.905029296875, -1.73101806640625, -1.5570068359375, -1.38299560546875, -1.208984375, -1.03497314453125, -0.8609619140625, -0.68695068359375, -0.512939453125, -0.33892822265625, -0.1649169921875, 0.00909423828125, 0.18310546875, 0.35711669921875, 0.5311279296875, 0.70513916015625, 0.879150390625, 1.05316162109375, 1.2271728515625, 1.40118408203125, 1.5751953125, 1.74920654296875, 1.9232177734375, 2.09722900390625, 2.271240234375, 2.44525146484375, 2.6192626953125, 2.79327392578125, 2.96728515625, 3.14129638671875, 3.3153076171875, 3.48931884765625, 3.663330078125, 3.83734130859375, 4.0113525390625, 4.18536376953125, 4.359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 19.0, 40.0, 53.0, 95.0, 112.0, 133.0, 140.0, 123.0, 85.0, 60.0, 39.0, 23.0, 17.0, 10.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004935264587402344, -0.00047988444566726685, -0.0004662424325942993, -0.0004526004195213318, -0.00043895840644836426, -0.00042531639337539673, -0.0004116743803024292, -0.00039803236722946167, -0.00038439035415649414, -0.0003707483410835266, -0.0003571063280105591, -0.00034346431493759155, -0.000329822301864624, -0.0003161802887916565, -0.00030253827571868896, -0.00028889626264572144, -0.0002752542495727539, -0.0002616122364997864, -0.00024797022342681885, -0.00023432821035385132, -0.0002206861972808838, -0.00020704418420791626, -0.00019340217113494873, -0.0001797601580619812, -0.00016611814498901367, -0.00015247613191604614, -0.0001388341188430786, -0.00012519210577011108, -0.00011155009269714355, -9.790807962417603e-05, -8.42660665512085e-05, -7.062405347824097e-05, -5.698204040527344e-05, -4.334002733230591e-05, -2.969801425933838e-05, -1.605600118637085e-05, -2.4139881134033203e-06, 1.1228024959564209e-05, 2.4870038032531738e-05, 3.851205110549927e-05, 5.21540641784668e-05, 6.579607725143433e-05, 7.943809032440186e-05, 9.308010339736938e-05, 0.00010672211647033691, 0.00012036412954330444, 0.00013400614261627197, 0.0001476481556892395, 0.00016129016876220703, 0.00017493218183517456, 0.0001885741949081421, 0.00020221620798110962, 0.00021585822105407715, 0.00022950023412704468, 0.0002431422472000122, 0.00025678426027297974, 0.00027042627334594727, 0.0002840682864189148, 0.0002977102994918823, 0.00031135231256484985, 0.0003249943256378174, 0.0003386363387107849, 0.00035227835178375244, 0.00036592036485671997, 0.0003795623779296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 20.0, 24.0, 54.0, 96.0, 174.0, 590.0, 3552.0, 199169.0, 836393.0, 7009.0, 943.0, 273.0, 98.0, 50.0, 27.0, 24.0, 13.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.752227783203125, -3.54547119140625, -3.338714599609375, -3.1319580078125, -2.925201416015625, -2.71844482421875, -2.511688232421875, -2.304931640625, -2.098175048828125, -1.89141845703125, -1.684661865234375, -1.4779052734375, -1.271148681640625, -1.06439208984375, -0.857635498046875, -0.65087890625, -0.444122314453125, -0.23736572265625, -0.030609130859375, 0.1761474609375, 0.382904052734375, 0.58966064453125, 0.796417236328125, 1.003173828125, 1.209930419921875, 1.41668701171875, 1.623443603515625, 1.8302001953125, 2.036956787109375, 2.24371337890625, 2.450469970703125, 2.6572265625, 2.863983154296875, 3.07073974609375, 3.277496337890625, 3.4842529296875, 3.691009521484375, 3.89776611328125, 4.104522705078125, 4.311279296875, 4.518035888671875, 4.72479248046875, 4.931549072265625, 5.1383056640625, 5.345062255859375, 5.55181884765625, 5.758575439453125, 5.96533203125, 6.172088623046875, 6.37884521484375, 6.585601806640625, 6.7923583984375, 6.999114990234375, 7.20587158203125, 7.412628173828125, 7.619384765625, 7.826141357421875, 8.03289794921875, 8.239654541015625, 8.4464111328125, 8.653167724609375, 8.85992431640625, 9.066680908203125, 9.2734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 8.0, 14.0, 27.0, 41.0, 60.0, 108.0, 109.0, 158.0, 151.0, 109.0, 73.0, 50.0, 34.0, 15.0, 17.0, 9.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.6135177612304688, -1.5766448974609375, -1.5397720336914062, -1.502899169921875, -1.4660263061523438, -1.4291534423828125, -1.3922805786132812, -1.35540771484375, -1.3185348510742188, -1.2816619873046875, -1.2447891235351562, -1.207916259765625, -1.1710433959960938, -1.1341705322265625, -1.0972976684570312, -1.0604248046875, -1.0235519409179688, -0.9866790771484375, -0.9498062133789062, -0.912933349609375, -0.8760604858398438, -0.8391876220703125, -0.8023147583007812, -0.76544189453125, -0.7285690307617188, -0.6916961669921875, -0.6548233032226562, -0.617950439453125, -0.5810775756835938, -0.5442047119140625, -0.5073318481445312, -0.470458984375, -0.43358612060546875, -0.3967132568359375, -0.35984039306640625, -0.322967529296875, -0.28609466552734375, -0.2492218017578125, -0.21234893798828125, -0.17547607421875, -0.13860321044921875, -0.1017303466796875, -0.06485748291015625, -0.027984619140625, 0.00888824462890625, 0.0457611083984375, 0.08263397216796875, 0.1195068359375, 0.15637969970703125, 0.1932525634765625, 0.23012542724609375, 0.266998291015625, 0.30387115478515625, 0.3407440185546875, 0.37761688232421875, 0.41448974609375, 0.45136260986328125, 0.4882354736328125, 0.5251083374023438, 0.561981201171875, 0.5988540649414062, 0.6357269287109375, 0.6725997924804688, 0.70947265625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 15.0, 22.0, 35.0, 44.0, 73.0, 79.0, 92.0, 110.0, 114.0, 95.0, 104.0, 73.0, 52.0, 33.0, 33.0, 14.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.735433578491211, -10.41178035736084, -10.088127136230469, -9.764473915100098, -9.440820693969727, -9.117166519165039, -8.793513298034668, -8.469860076904297, -8.146206855773926, -7.822553634643555, -7.498900413513184, -7.175246715545654, -6.851593494415283, -6.527940273284912, -6.204286575317383, -5.880633354187012, -5.556980133056641, -5.2333269119262695, -4.909673690795898, -4.586019992828369, -4.262366771697998, -3.938713550567627, -3.6150600910186768, -3.2914066314697266, -2.9677534103393555, -2.6441001892089844, -2.320446729660034, -1.9967933893203735, -1.673140048980713, -1.3494867086410522, -1.0258333683013916, -0.7021799087524414, -0.3785257339477539, -0.05487239360809326, 0.2687809467315674, 0.592434287071228, 0.9160876274108887, 1.2397409677505493, 1.56339430809021, 1.8870477676391602, 2.2107009887695312, 2.5343542098999023, 2.8580076694488525, 3.1816611289978027, 3.505314350128174, 3.828967571258545, 4.152621269226074, 4.476274490356445, 4.799927711486816, 5.1235809326171875, 5.447234153747559, 5.770887851715088, 6.094541072845459, 6.41819429397583, 6.741847991943359, 7.0655012130737305, 7.389154434204102, 7.712807655334473, 8.036460876464844, 8.360114097595215, 8.683767318725586, 9.007421493530273, 9.331074714660645, 9.654727935791016, 9.978381156921387]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 7.0, 8.0, 19.0, 19.0, 19.0, 24.0, 26.0, 23.0, 30.0, 39.0, 29.0, 36.0, 41.0, 53.0, 39.0, 39.0, 40.0, 46.0, 52.0, 41.0, 41.0, 43.0, 28.0, 42.0, 31.0, 37.0, 20.0, 19.0, 19.0, 11.0, 13.0, 12.0, 11.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.183972358703613, -8.88526725769043, -8.586563110351562, -8.287858009338379, -7.989152908325195, -7.69044828414917, -7.3917436599731445, -7.093038558959961, -6.7943339347839355, -6.49562931060791, -6.196924209594727, -5.898219585418701, -5.599514961242676, -5.300809860229492, -5.002105236053467, -4.703400611877441, -4.404695510864258, -4.105990886688232, -3.807285785675049, -3.5085811614990234, -3.209876298904419, -2.9111714363098145, -2.612466812133789, -2.3137619495391846, -2.01505708694458, -1.7163522243499756, -1.4176474809646606, -1.1189427375793457, -0.8202378749847412, -0.5215330123901367, -0.22282826900482178, 0.07587647438049316, 0.37458133697509766, 0.6732861399650574, 0.9719909429550171, 1.270695686340332, 1.5694005489349365, 1.868105411529541, 2.1668100357055664, 2.465514898300171, 2.7642197608947754, 3.06292462348938, 3.3616294860839844, 3.6603341102600098, 3.9590389728546143, 4.257743835449219, 4.556448459625244, 4.8551530838012695, 5.153858184814453, 5.4525628089904785, 5.751267910003662, 6.0499725341796875, 6.348677635192871, 6.6473822593688965, 6.946086883544922, 7.2447919845581055, 7.543496608734131, 7.842201232910156, 8.14090633392334, 8.439611434936523, 8.73831558227539, 9.037020683288574, 9.335725784301758, 9.634429931640625, 9.933135032653809]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 9.0, 5.0, 11.0, 21.0, 16.0, 29.0, 33.0, 38.0, 91.0, 107.0, 170.0, 266.0, 498.0, 1570.0, 12236.0, 248084.0, 2983694.0, 907572.0, 35005.0, 3103.0, 725.0, 342.0, 213.0, 138.0, 92.0, 43.0, 44.0, 38.0, 20.0, 12.0, 11.0, 10.0, 6.0, 4.0, 11.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.6539306640625, -8.362548828125, -8.0711669921875, -7.77978515625, -7.4884033203125, -7.197021484375, -6.9056396484375, -6.6142578125, -6.3228759765625, -6.031494140625, -5.7401123046875, -5.44873046875, -5.1573486328125, -4.865966796875, -4.5745849609375, -4.283203125, -3.9918212890625, -3.700439453125, -3.4090576171875, -3.11767578125, -2.8262939453125, -2.534912109375, -2.2435302734375, -1.9521484375, -1.6607666015625, -1.369384765625, -1.0780029296875, -0.78662109375, -0.4952392578125, -0.203857421875, 0.0875244140625, 0.37890625, 0.6702880859375, 0.961669921875, 1.2530517578125, 1.54443359375, 1.8358154296875, 2.127197265625, 2.4185791015625, 2.7099609375, 3.0013427734375, 3.292724609375, 3.5841064453125, 3.87548828125, 4.1668701171875, 4.458251953125, 4.7496337890625, 5.041015625, 5.3323974609375, 5.623779296875, 5.9151611328125, 6.20654296875, 6.4979248046875, 6.789306640625, 7.0806884765625, 7.3720703125, 7.6634521484375, 7.954833984375, 8.2462158203125, 8.53759765625, 8.8289794921875, 9.120361328125, 9.4117431640625, 9.703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 11.0, 7.0, 13.0, 13.0, 21.0, 21.0, 22.0, 22.0, 35.0, 25.0, 34.0, 50.0, 37.0, 42.0, 43.0, 41.0, 47.0, 41.0, 45.0, 42.0, 49.0, 39.0, 34.0, 34.0, 41.0, 18.0, 27.0, 26.0, 18.0, 16.0, 17.0, 11.0, 7.0, 3.0, 7.0, 9.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.083984375, -2.972320556640625, -2.86065673828125, -2.748992919921875, -2.6373291015625, -2.525665283203125, -2.41400146484375, -2.302337646484375, -2.190673828125, -2.079010009765625, -1.96734619140625, -1.855682373046875, -1.7440185546875, -1.632354736328125, -1.52069091796875, -1.409027099609375, -1.29736328125, -1.185699462890625, -1.07403564453125, -0.962371826171875, -0.8507080078125, -0.739044189453125, -0.62738037109375, -0.515716552734375, -0.404052734375, -0.292388916015625, -0.18072509765625, -0.069061279296875, 0.0426025390625, 0.154266357421875, 0.26593017578125, 0.377593994140625, 0.4892578125, 0.600921630859375, 0.71258544921875, 0.824249267578125, 0.9359130859375, 1.047576904296875, 1.15924072265625, 1.270904541015625, 1.382568359375, 1.494232177734375, 1.60589599609375, 1.717559814453125, 1.8292236328125, 1.940887451171875, 2.05255126953125, 2.164215087890625, 2.27587890625, 2.387542724609375, 2.49920654296875, 2.610870361328125, 2.7225341796875, 2.834197998046875, 2.94586181640625, 3.057525634765625, 3.169189453125, 3.280853271484375, 3.39251708984375, 3.504180908203125, 3.6158447265625, 3.727508544921875, 3.83917236328125, 3.950836181640625, 4.0625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 21.0, 14.0, 21.0, 26.0, 61.0, 84.0, 113.0, 186.0, 268.0, 424.0, 805.0, 1611.0, 4853.0, 34645.0, 888766.0, 3108825.0, 137163.0, 11226.0, 2553.0, 1059.0, 543.0, 339.0, 207.0, 111.0, 82.0, 80.0, 42.0, 43.0, 27.0, 16.0, 11.0, 11.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.7734375, -6.5335693359375, -6.293701171875, -6.0538330078125, -5.81396484375, -5.5740966796875, -5.334228515625, -5.0943603515625, -4.8544921875, -4.6146240234375, -4.374755859375, -4.1348876953125, -3.89501953125, -3.6551513671875, -3.415283203125, -3.1754150390625, -2.935546875, -2.6956787109375, -2.455810546875, -2.2159423828125, -1.97607421875, -1.7362060546875, -1.496337890625, -1.2564697265625, -1.0166015625, -0.7767333984375, -0.536865234375, -0.2969970703125, -0.05712890625, 0.1827392578125, 0.422607421875, 0.6624755859375, 0.90234375, 1.1422119140625, 1.382080078125, 1.6219482421875, 1.86181640625, 2.1016845703125, 2.341552734375, 2.5814208984375, 2.8212890625, 3.0611572265625, 3.301025390625, 3.5408935546875, 3.78076171875, 4.0206298828125, 4.260498046875, 4.5003662109375, 4.740234375, 4.9801025390625, 5.219970703125, 5.4598388671875, 5.69970703125, 5.9395751953125, 6.179443359375, 6.4193115234375, 6.6591796875, 6.8990478515625, 7.138916015625, 7.3787841796875, 7.61865234375, 7.8585205078125, 8.098388671875, 8.3382568359375, 8.578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 14.0, 13.0, 22.0, 24.0, 21.0, 36.0, 66.0, 79.0, 123.0, 154.0, 226.0, 275.0, 379.0, 444.0, 440.0, 417.0, 306.0, 275.0, 200.0, 147.0, 103.0, 85.0, 49.0, 45.0, 25.0, 27.0, 19.0, 14.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.822265625, -1.7746124267578125, -1.726959228515625, -1.6793060302734375, -1.63165283203125, -1.5839996337890625, -1.536346435546875, -1.4886932373046875, -1.4410400390625, -1.3933868408203125, -1.345733642578125, -1.2980804443359375, -1.25042724609375, -1.2027740478515625, -1.155120849609375, -1.1074676513671875, -1.059814453125, -1.0121612548828125, -0.964508056640625, -0.9168548583984375, -0.86920166015625, -0.8215484619140625, -0.773895263671875, -0.7262420654296875, -0.6785888671875, -0.6309356689453125, -0.583282470703125, -0.5356292724609375, -0.48797607421875, -0.4403228759765625, -0.392669677734375, -0.3450164794921875, -0.29736328125, -0.2497100830078125, -0.202056884765625, -0.1544036865234375, -0.10675048828125, -0.0590972900390625, -0.011444091796875, 0.0362091064453125, 0.0838623046875, 0.1315155029296875, 0.179168701171875, 0.2268218994140625, 0.27447509765625, 0.3221282958984375, 0.369781494140625, 0.4174346923828125, 0.465087890625, 0.5127410888671875, 0.560394287109375, 0.6080474853515625, 0.65570068359375, 0.7033538818359375, 0.751007080078125, 0.7986602783203125, 0.8463134765625, 0.8939666748046875, 0.941619873046875, 0.9892730712890625, 1.03692626953125, 1.0845794677734375, 1.132232666015625, 1.1798858642578125, 1.2275390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 29.0, 52.0, 75.0, 101.0, 139.0, 142.0, 118.0, 122.0, 87.0, 56.0, 30.0, 19.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.18076229095459, -14.85482406616211, -14.528885841369629, -14.202947616577148, -13.877009391784668, -13.551071166992188, -13.225132942199707, -12.899194717407227, -12.573257446289062, -12.247319221496582, -11.921380996704102, -11.595442771911621, -11.26950454711914, -10.94356632232666, -10.61762809753418, -10.291690826416016, -9.965751647949219, -9.639813423156738, -9.313875198364258, -8.987936973571777, -8.661998748779297, -8.336060523986816, -8.010122299194336, -7.684184551239014, -7.358246326446533, -7.032308101654053, -6.706369876861572, -6.380431652069092, -6.0544939041137695, -5.728555679321289, -5.402617454528809, -5.076679229736328, -4.7507405281066895, -4.424802303314209, -4.0988640785217285, -3.772926092147827, -3.4469878673553467, -3.121049642562866, -2.795111656188965, -2.4691734313964844, -2.143235206604004, -1.8172969818115234, -1.4913588762283325, -1.1654207706451416, -0.8394825458526611, -0.5135443210601807, -0.18760621547698975, 0.13833189010620117, 0.46427011489868164, 0.7902082800865173, 1.116146445274353, 1.442084550857544, 1.7680227756500244, 2.093961000442505, 2.4198989868164062, 2.7458372116088867, 3.071775436401367, 3.3977136611938477, 3.723651885986328, 4.049590110778809, 4.375528335571289, 4.7014665603637695, 5.027404308319092, 5.353342533111572, 5.679280757904053]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 14.0, 10.0, 15.0, 15.0, 20.0, 26.0, 18.0, 28.0, 32.0, 39.0, 37.0, 25.0, 35.0, 47.0, 42.0, 37.0, 42.0, 47.0, 43.0, 40.0, 36.0, 39.0, 36.0, 38.0, 30.0, 29.0, 29.0, 30.0, 15.0, 14.0, 18.0, 14.0, 12.0, 11.0, 6.0, 3.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.415496587753296, -3.293851613998413, -3.1722066402435303, -3.0505619049072266, -2.9289169311523438, -2.807271957397461, -2.685626983642578, -2.5639820098876953, -2.4423370361328125, -2.3206920623779297, -2.199047088623047, -2.077402114868164, -1.9557573795318604, -1.8341124057769775, -1.7124674320220947, -1.590822458267212, -1.4691777229309082, -1.3475327491760254, -1.2258878946304321, -1.1042429208755493, -0.9825980067253113, -0.8609530925750732, -0.7393081188201904, -0.6176632046699524, -0.49601829051971436, -0.3743733763694763, -0.2527284324169159, -0.13108348846435547, -0.009438574314117432, 0.1122063398361206, 0.23385131359100342, 0.35549622774124146, 0.4771413803100586, 0.5987862944602966, 0.7204312086105347, 0.8420761823654175, 0.9637210965156555, 1.0853660106658936, 1.2070109844207764, 1.3286559581756592, 1.4503008127212524, 1.5719457864761353, 1.6935906410217285, 1.8152356147766113, 1.9368805885314941, 2.058525562286377, 2.1801705360412598, 2.3018152713775635, 2.4234602451324463, 2.545105218887329, 2.666750192642212, 2.7883949279785156, 2.9100399017333984, 3.0316848754882812, 3.153329849243164, 3.274974822998047, 3.3966197967529297, 3.5182647705078125, 3.6399097442626953, 3.761554718017578, 3.883199453353882, 4.004844665527344, 4.126489639282227, 4.248134136199951, 4.369779109954834]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 12.0, 16.0, 22.0, 36.0, 47.0, 100.0, 146.0, 255.0, 477.0, 994.0, 2314.0, 6057.0, 17894.0, 57628.0, 174003.0, 348675.0, 278862.0, 108480.0, 34658.0, 11013.0, 3775.0, 1489.0, 665.0, 355.0, 210.0, 111.0, 88.0, 48.0, 38.0, 15.0, 18.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.558868408203125, -0.54010009765625, -0.521331787109375, -0.5025634765625, -0.483795166015625, -0.46502685546875, -0.446258544921875, -0.427490234375, -0.408721923828125, -0.38995361328125, -0.371185302734375, -0.3524169921875, -0.333648681640625, -0.31488037109375, -0.296112060546875, -0.27734375, -0.258575439453125, -0.23980712890625, -0.221038818359375, -0.2022705078125, -0.183502197265625, -0.16473388671875, -0.145965576171875, -0.127197265625, -0.108428955078125, -0.08966064453125, -0.070892333984375, -0.0521240234375, -0.033355712890625, -0.01458740234375, 0.004180908203125, 0.02294921875, 0.041717529296875, 0.06048583984375, 0.079254150390625, 0.0980224609375, 0.116790771484375, 0.13555908203125, 0.154327392578125, 0.173095703125, 0.191864013671875, 0.21063232421875, 0.229400634765625, 0.2481689453125, 0.266937255859375, 0.28570556640625, 0.304473876953125, 0.3232421875, 0.342010498046875, 0.36077880859375, 0.379547119140625, 0.3983154296875, 0.417083740234375, 0.43585205078125, 0.454620361328125, 0.473388671875, 0.492156982421875, 0.51092529296875, 0.529693603515625, 0.5484619140625, 0.567230224609375, 0.58599853515625, 0.604766845703125, 0.62353515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 9.0, 12.0, 16.0, 18.0, 36.0, 38.0, 26.0, 47.0, 60.0, 53.0, 46.0, 51.0, 55.0, 60.0, 57.0, 61.0, 55.0, 58.0, 43.0, 48.0, 31.0, 34.0, 17.0, 17.0, 13.0, 17.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.6470947265625, -2.528564453125, -2.4100341796875, -2.29150390625, -2.1729736328125, -2.054443359375, -1.9359130859375, -1.8173828125, -1.6988525390625, -1.580322265625, -1.4617919921875, -1.34326171875, -1.2247314453125, -1.106201171875, -0.9876708984375, -0.869140625, -0.7506103515625, -0.632080078125, -0.5135498046875, -0.39501953125, -0.2764892578125, -0.157958984375, -0.0394287109375, 0.0791015625, 0.1976318359375, 0.316162109375, 0.4346923828125, 0.55322265625, 0.6717529296875, 0.790283203125, 0.9088134765625, 1.02734375, 1.1458740234375, 1.264404296875, 1.3829345703125, 1.50146484375, 1.6199951171875, 1.738525390625, 1.8570556640625, 1.9755859375, 2.0941162109375, 2.212646484375, 2.3311767578125, 2.44970703125, 2.5682373046875, 2.686767578125, 2.8052978515625, 2.923828125, 3.0423583984375, 3.160888671875, 3.2794189453125, 3.39794921875, 3.5164794921875, 3.635009765625, 3.7535400390625, 3.8720703125, 3.9906005859375, 4.109130859375, 4.2276611328125, 4.34619140625, 4.4647216796875, 4.583251953125, 4.7017822265625, 4.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 22.0, 35.0, 60.0, 136.0, 221.0, 529.0, 1121.0, 2805.0, 6754.0, 16337.0, 39558.0, 93155.0, 196871.0, 287455.0, 217219.0, 107800.0, 46204.0, 18931.0, 7681.0, 3194.0, 1293.0, 583.0, 300.0, 145.0, 71.0, 22.0, 15.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.457763671875, -0.44525146484375, -0.4327392578125, -0.42022705078125, -0.40771484375, -0.39520263671875, -0.3826904296875, -0.37017822265625, -0.357666015625, -0.34515380859375, -0.3326416015625, -0.32012939453125, -0.3076171875, -0.29510498046875, -0.2825927734375, -0.27008056640625, -0.257568359375, -0.24505615234375, -0.2325439453125, -0.22003173828125, -0.20751953125, -0.19500732421875, -0.1824951171875, -0.16998291015625, -0.157470703125, -0.14495849609375, -0.1324462890625, -0.11993408203125, -0.107421875, -0.09490966796875, -0.0823974609375, -0.06988525390625, -0.057373046875, -0.04486083984375, -0.0323486328125, -0.01983642578125, -0.00732421875, 0.00518798828125, 0.0177001953125, 0.03021240234375, 0.042724609375, 0.05523681640625, 0.0677490234375, 0.08026123046875, 0.0927734375, 0.10528564453125, 0.1177978515625, 0.13031005859375, 0.142822265625, 0.15533447265625, 0.1678466796875, 0.18035888671875, 0.19287109375, 0.20538330078125, 0.2178955078125, 0.23040771484375, 0.242919921875, 0.25543212890625, 0.2679443359375, 0.28045654296875, 0.29296875, 0.30548095703125, 0.3179931640625, 0.33050537109375, 0.343017578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 3.0, 8.0, 12.0, 14.0, 16.0, 17.0, 18.0, 24.0, 24.0, 26.0, 33.0, 37.0, 46.0, 41.0, 60.0, 59.0, 60.0, 54.0, 56.0, 46.0, 48.0, 52.0, 35.0, 41.0, 24.0, 25.0, 24.0, 17.0, 10.0, 6.0, 18.0, 7.0, 7.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.121826171875, -6.92333984375, -6.724853515625, -6.5263671875, -6.327880859375, -6.12939453125, -5.930908203125, -5.732421875, -5.533935546875, -5.33544921875, -5.136962890625, -4.9384765625, -4.739990234375, -4.54150390625, -4.343017578125, -4.14453125, -3.946044921875, -3.74755859375, -3.549072265625, -3.3505859375, -3.152099609375, -2.95361328125, -2.755126953125, -2.556640625, -2.358154296875, -2.15966796875, -1.961181640625, -1.7626953125, -1.564208984375, -1.36572265625, -1.167236328125, -0.96875, -0.770263671875, -0.57177734375, -0.373291015625, -0.1748046875, 0.023681640625, 0.22216796875, 0.420654296875, 0.619140625, 0.817626953125, 1.01611328125, 1.214599609375, 1.4130859375, 1.611572265625, 1.81005859375, 2.008544921875, 2.20703125, 2.405517578125, 2.60400390625, 2.802490234375, 3.0009765625, 3.199462890625, 3.39794921875, 3.596435546875, 3.794921875, 3.993408203125, 4.19189453125, 4.390380859375, 4.5888671875, 4.787353515625, 4.98583984375, 5.184326171875, 5.3828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 11.0, 8.0, 14.0, 26.0, 45.0, 64.0, 92.0, 137.0, 211.0, 388.0, 723.0, 1496.0, 3764.0, 11310.0, 48583.0, 305514.0, 548075.0, 98573.0, 19480.0, 5823.0, 2095.0, 917.0, 473.0, 277.0, 165.0, 99.0, 60.0, 46.0, 28.0, 22.0, 9.0, 4.0, 8.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.10186767578125, -0.09888935089111328, -0.09591102600097656, -0.09293270111083984, -0.08995437622070312, -0.0869760513305664, -0.08399772644042969, -0.08101940155029297, -0.07804107666015625, -0.07506275177001953, -0.07208442687988281, -0.0691061019897461, -0.06612777709960938, -0.06314945220947266, -0.06017112731933594, -0.05719280242919922, -0.0542144775390625, -0.05123615264892578, -0.04825782775878906, -0.045279502868652344, -0.042301177978515625, -0.039322853088378906, -0.03634452819824219, -0.03336620330810547, -0.03038787841796875, -0.02740955352783203, -0.024431228637695312, -0.021452903747558594, -0.018474578857421875, -0.015496253967285156, -0.012517929077148438, -0.009539604187011719, -0.006561279296875, -0.0035829544067382812, -0.0006046295166015625, 0.0023736953735351562, 0.005352020263671875, 0.008330345153808594, 0.011308670043945312, 0.014286994934082031, 0.01726531982421875, 0.02024364471435547, 0.023221969604492188, 0.026200294494628906, 0.029178619384765625, 0.032156944274902344, 0.03513526916503906, 0.03811359405517578, 0.0410919189453125, 0.04407024383544922, 0.04704856872558594, 0.050026893615722656, 0.053005218505859375, 0.055983543395996094, 0.05896186828613281, 0.06194019317626953, 0.06491851806640625, 0.06789684295654297, 0.07087516784667969, 0.0738534927368164, 0.07683181762695312, 0.07981014251708984, 0.08278846740722656, 0.08576679229736328, 0.0887451171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 17.0, 18.0, 30.0, 40.0, 46.0, 77.0, 112.0, 116.0, 138.0, 110.0, 91.0, 62.0, 39.0, 34.0, 20.0, 10.0, 14.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.432699203491211e-05, -7.178634405136108e-05, -6.924569606781006e-05, -6.670504808425903e-05, -6.416440010070801e-05, -6.162375211715698e-05, -5.908310413360596e-05, -5.654245615005493e-05, -5.4001808166503906e-05, -5.146116018295288e-05, -4.8920512199401855e-05, -4.637986421585083e-05, -4.3839216232299805e-05, -4.129856824874878e-05, -3.8757920265197754e-05, -3.621727228164673e-05, -3.36766242980957e-05, -3.113597631454468e-05, -2.8595328330993652e-05, -2.6054680347442627e-05, -2.35140323638916e-05, -2.0973384380340576e-05, -1.843273639678955e-05, -1.5892088413238525e-05, -1.33514404296875e-05, -1.0810792446136475e-05, -8.27014446258545e-06, -5.729496479034424e-06, -3.1888484954833984e-06, -6.48200511932373e-07, 1.8924474716186523e-06, 4.433095455169678e-06, 6.973743438720703e-06, 9.514391422271729e-06, 1.2055039405822754e-05, 1.459568738937378e-05, 1.7136335372924805e-05, 1.967698335647583e-05, 2.2217631340026855e-05, 2.475827932357788e-05, 2.7298927307128906e-05, 2.983957529067993e-05, 3.238022327423096e-05, 3.492087125778198e-05, 3.746151924133301e-05, 4.000216722488403e-05, 4.254281520843506e-05, 4.5083463191986084e-05, 4.762411117553711e-05, 5.0164759159088135e-05, 5.270540714263916e-05, 5.5246055126190186e-05, 5.778670310974121e-05, 6.0327351093292236e-05, 6.286799907684326e-05, 6.540864706039429e-05, 6.794929504394531e-05, 7.048994302749634e-05, 7.303059101104736e-05, 7.557123899459839e-05, 7.811188697814941e-05, 8.065253496170044e-05, 8.319318294525146e-05, 8.573383092880249e-05, 8.827447891235352e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 4.0, 2.0, 8.0, 7.0, 3.0, 14.0, 7.0, 14.0, 25.0, 24.0, 58.0, 124.0, 218.0, 415.0, 1105.0, 3000.0, 11061.0, 65413.0, 623256.0, 302879.0, 30645.0, 6711.0, 1970.0, 788.0, 338.0, 187.0, 87.0, 51.0, 27.0, 21.0, 10.0, 13.0, 7.0, 4.0, 7.0, 7.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11977005004882812, -0.11588287353515625, -0.11199569702148438, -0.1081085205078125, -0.10422134399414062, -0.10033416748046875, -0.09644699096679688, -0.092559814453125, -0.08867263793945312, -0.08478546142578125, -0.08089828491210938, -0.0770111083984375, -0.07312393188476562, -0.06923675537109375, -0.06534957885742188, -0.06146240234375, -0.057575225830078125, -0.05368804931640625, -0.049800872802734375, -0.0459136962890625, -0.042026519775390625, -0.03813934326171875, -0.034252166748046875, -0.030364990234375, -0.026477813720703125, -0.02259063720703125, -0.018703460693359375, -0.0148162841796875, -0.010929107666015625, -0.00704193115234375, -0.003154754638671875, 0.000732421875, 0.004619598388671875, 0.00850677490234375, 0.012393951416015625, 0.0162811279296875, 0.020168304443359375, 0.02405548095703125, 0.027942657470703125, 0.031829833984375, 0.035717010498046875, 0.03960418701171875, 0.043491363525390625, 0.0473785400390625, 0.051265716552734375, 0.05515289306640625, 0.059040069580078125, 0.06292724609375, 0.06681442260742188, 0.07070159912109375, 0.07458877563476562, 0.0784759521484375, 0.08236312866210938, 0.08625030517578125, 0.09013748168945312, 0.094024658203125, 0.09791183471679688, 0.10179901123046875, 0.10568618774414062, 0.1095733642578125, 0.11346054077148438, 0.11734771728515625, 0.12123489379882812, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 14.0, 16.0, 11.0, 25.0, 38.0, 46.0, 59.0, 80.0, 103.0, 100.0, 111.0, 87.0, 77.0, 44.0, 43.0, 43.0, 27.0, 14.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254974365234375, -0.02469491958618164, -0.02389240264892578, -0.023089885711669922, -0.022287368774414062, -0.021484851837158203, -0.020682334899902344, -0.019879817962646484, -0.019077301025390625, -0.018274784088134766, -0.017472267150878906, -0.016669750213623047, -0.015867233276367188, -0.015064716339111328, -0.014262199401855469, -0.01345968246459961, -0.01265716552734375, -0.01185464859008789, -0.011052131652832031, -0.010249614715576172, -0.009447097778320312, -0.008644580841064453, -0.007842063903808594, -0.007039546966552734, -0.006237030029296875, -0.005434513092041016, -0.004631996154785156, -0.003829479217529297, -0.0030269622802734375, -0.002224445343017578, -0.0014219284057617188, -0.0006194114685058594, 0.00018310546875, 0.0009856224060058594, 0.0017881393432617188, 0.002590656280517578, 0.0033931732177734375, 0.004195690155029297, 0.004998207092285156, 0.005800724029541016, 0.006603240966796875, 0.007405757904052734, 0.008208274841308594, 0.009010791778564453, 0.009813308715820312, 0.010615825653076172, 0.011418342590332031, 0.01222085952758789, 0.01302337646484375, 0.01382589340209961, 0.014628410339355469, 0.015430927276611328, 0.016233444213867188, 0.017035961151123047, 0.017838478088378906, 0.018640995025634766, 0.019443511962890625, 0.020246028900146484, 0.021048545837402344, 0.021851062774658203, 0.022653579711914062, 0.023456096649169922, 0.02425861358642578, 0.02506113052368164, 0.0258636474609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 15.0, 91.0, 304.0, 380.0, 181.0, 31.0, 7.0, 5.0, 0.0, 3.0], "bins": [-31.23577880859375, -30.69000816345215, -30.144237518310547, -29.598466873168945, -29.052696228027344, -28.506925582885742, -27.96115493774414, -27.415386199951172, -26.869613647460938, -26.323843002319336, -25.778072357177734, -25.232301712036133, -24.68653106689453, -24.14076042175293, -23.594989776611328, -23.04922103881836, -22.503450393676758, -21.957679748535156, -21.411909103393555, -20.866138458251953, -20.32036781311035, -19.77459716796875, -19.22882652282715, -18.683055877685547, -18.137287139892578, -17.591516494750977, -17.045745849609375, -16.499975204467773, -15.954204559326172, -15.40843391418457, -14.862664222717285, -14.316893577575684, -13.77112102508545, -13.225350379943848, -12.679579734802246, -12.133809089660645, -11.58803939819336, -11.042268753051758, -10.496498107910156, -9.950727462768555, -9.404956817626953, -8.859186172485352, -8.31341552734375, -7.767645359039307, -7.221874713897705, -6.6761040687561035, -6.13033390045166, -5.584563255310059, -5.038792610168457, -4.4930219650268555, -3.947251558303833, -3.4014811515808105, -2.855710506439209, -2.3099398612976074, -1.764169454574585, -1.2183990478515625, -0.6726281642913818, -0.12685763835906982, 0.4189128875732422, 0.9646834135055542, 1.5104539394378662, 2.0562245845794678, 2.6019949913024902, 3.1477653980255127, 3.6935360431671143]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 12.0, 14.0, 15.0, 17.0, 23.0, 22.0, 30.0, 31.0, 43.0, 41.0, 42.0, 27.0, 49.0, 54.0, 41.0, 48.0, 52.0, 46.0, 36.0, 49.0, 33.0, 47.0, 30.0, 29.0, 31.0, 26.0, 20.0, 15.0, 10.0, 14.0, 12.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4967775344848633, -2.408999443054199, -2.321221113204956, -2.233443021774292, -2.145664930343628, -2.0578866004943848, -1.9701085090637207, -1.8823304176330566, -1.794552206993103, -1.7067739963531494, -1.6189959049224854, -1.5312176942825317, -1.4434394836425781, -1.355661392211914, -1.2678831815719604, -1.1801049709320068, -1.0923268795013428, -1.0045486688613892, -0.9167705774307251, -0.8289923667907715, -0.7412142157554626, -0.6534360647201538, -0.5656578540802002, -0.47787970304489136, -0.3901015520095825, -0.3023234009742737, -0.21454522013664246, -0.12676703929901123, -0.03898888826370239, 0.048789262771606445, 0.13656747341156006, 0.2243456244468689, 0.31212353706359863, 0.39990168809890747, 0.4876798689365387, 0.5754580497741699, 0.6632362008094788, 0.7510143518447876, 0.8387925624847412, 0.92657071352005, 1.0143488645553589, 1.1021270751953125, 1.1899051666259766, 1.2776833772659302, 1.3654615879058838, 1.4532396793365479, 1.5410178899765015, 1.628796100616455, 1.7165741920471191, 1.8043524026870728, 1.8921304941177368, 1.9799087047576904, 2.0676867961883545, 2.1554651260375977, 2.2432432174682617, 2.331021308898926, 2.41879940032959, 2.506577491760254, 2.594355821609497, 2.682133913040161, 2.769912004470825, 2.8576903343200684, 2.9454684257507324, 3.0332465171813965, 3.1210248470306396]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 11.0, 16.0, 15.0, 30.0, 79.0, 178.0, 349.0, 933.0, 3179.0, 11469.0, 47552.0, 197092.0, 489506.0, 224982.0, 54401.0, 13276.0, 3624.0, 1047.0, 426.0, 177.0, 85.0, 39.0, 23.0, 22.0, 9.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94140625, -3.8203125, -3.69921875, -3.578125, -3.45703125, -3.3359375, -3.21484375, -3.09375, -2.97265625, -2.8515625, -2.73046875, -2.609375, -2.48828125, -2.3671875, -2.24609375, -2.125, -2.00390625, -1.8828125, -1.76171875, -1.640625, -1.51953125, -1.3984375, -1.27734375, -1.15625, -1.03515625, -0.9140625, -0.79296875, -0.671875, -0.55078125, -0.4296875, -0.30859375, -0.1875, -0.06640625, 0.0546875, 0.17578125, 0.296875, 0.41796875, 0.5390625, 0.66015625, 0.78125, 0.90234375, 1.0234375, 1.14453125, 1.265625, 1.38671875, 1.5078125, 1.62890625, 1.75, 1.87109375, 1.9921875, 2.11328125, 2.234375, 2.35546875, 2.4765625, 2.59765625, 2.71875, 2.83984375, 2.9609375, 3.08203125, 3.203125, 3.32421875, 3.4453125, 3.56640625, 3.6875, 3.80859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 11.0, 10.0, 12.0, 23.0, 22.0, 24.0, 24.0, 25.0, 36.0, 42.0, 40.0, 39.0, 50.0, 43.0, 44.0, 44.0, 52.0, 47.0, 47.0, 41.0, 45.0, 39.0, 40.0, 34.0, 21.0, 23.0, 27.0, 14.0, 14.0, 13.0, 11.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.17578125, -5.01300048828125, -4.8502197265625, -4.68743896484375, -4.524658203125, -4.36187744140625, -4.1990966796875, -4.03631591796875, -3.87353515625, -3.71075439453125, -3.5479736328125, -3.38519287109375, -3.222412109375, -3.05963134765625, -2.8968505859375, -2.73406982421875, -2.5712890625, -2.40850830078125, -2.2457275390625, -2.08294677734375, -1.920166015625, -1.75738525390625, -1.5946044921875, -1.43182373046875, -1.26904296875, -1.10626220703125, -0.9434814453125, -0.78070068359375, -0.617919921875, -0.45513916015625, -0.2923583984375, -0.12957763671875, 0.033203125, 0.19598388671875, 0.3587646484375, 0.52154541015625, 0.684326171875, 0.84710693359375, 1.0098876953125, 1.17266845703125, 1.33544921875, 1.49822998046875, 1.6610107421875, 1.82379150390625, 1.986572265625, 2.14935302734375, 2.3121337890625, 2.47491455078125, 2.6376953125, 2.80047607421875, 2.9632568359375, 3.12603759765625, 3.288818359375, 3.45159912109375, 3.6143798828125, 3.77716064453125, 3.93994140625, 4.10272216796875, 4.2655029296875, 4.42828369140625, 4.591064453125, 4.75384521484375, 4.9166259765625, 5.07940673828125, 5.2421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 15.0, 6.0, 27.0, 15.0, 20.0, 24.0, 34.0, 36.0, 61.0, 100.0, 153.0, 250.0, 481.0, 2124.0, 122692.0, 901574.0, 18994.0, 979.0, 375.0, 186.0, 110.0, 73.0, 45.0, 28.0, 36.0, 18.0, 14.0, 13.0, 7.0, 11.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.625, -11.253662109375, -10.88232421875, -10.510986328125, -10.1396484375, -9.768310546875, -9.39697265625, -9.025634765625, -8.654296875, -8.282958984375, -7.91162109375, -7.540283203125, -7.1689453125, -6.797607421875, -6.42626953125, -6.054931640625, -5.68359375, -5.312255859375, -4.94091796875, -4.569580078125, -4.1982421875, -3.826904296875, -3.45556640625, -3.084228515625, -2.712890625, -2.341552734375, -1.97021484375, -1.598876953125, -1.2275390625, -0.856201171875, -0.48486328125, -0.113525390625, 0.2578125, 0.629150390625, 1.00048828125, 1.371826171875, 1.7431640625, 2.114501953125, 2.48583984375, 2.857177734375, 3.228515625, 3.599853515625, 3.97119140625, 4.342529296875, 4.7138671875, 5.085205078125, 5.45654296875, 5.827880859375, 6.19921875, 6.570556640625, 6.94189453125, 7.313232421875, 7.6845703125, 8.055908203125, 8.42724609375, 8.798583984375, 9.169921875, 9.541259765625, 9.91259765625, 10.283935546875, 10.6552734375, 11.026611328125, 11.39794921875, 11.769287109375, 12.140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 9.0, 16.0, 14.0, 16.0, 11.0, 22.0, 20.0, 21.0, 27.0, 42.0, 33.0, 33.0, 46.0, 34.0, 41.0, 48.0, 49.0, 43.0, 37.0, 36.0, 45.0, 37.0, 42.0, 35.0, 23.0, 34.0, 25.0, 28.0, 32.0, 8.0, 9.0, 13.0, 12.0, 5.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.34765625, -6.1689453125, -5.990234375, -5.8115234375, -5.6328125, -5.4541015625, -5.275390625, -5.0966796875, -4.91796875, -4.7392578125, -4.560546875, -4.3818359375, -4.203125, -4.0244140625, -3.845703125, -3.6669921875, -3.48828125, -3.3095703125, -3.130859375, -2.9521484375, -2.7734375, -2.5947265625, -2.416015625, -2.2373046875, -2.05859375, -1.8798828125, -1.701171875, -1.5224609375, -1.34375, -1.1650390625, -0.986328125, -0.8076171875, -0.62890625, -0.4501953125, -0.271484375, -0.0927734375, 0.0859375, 0.2646484375, 0.443359375, 0.6220703125, 0.80078125, 0.9794921875, 1.158203125, 1.3369140625, 1.515625, 1.6943359375, 1.873046875, 2.0517578125, 2.23046875, 2.4091796875, 2.587890625, 2.7666015625, 2.9453125, 3.1240234375, 3.302734375, 3.4814453125, 3.66015625, 3.8388671875, 4.017578125, 4.1962890625, 4.375, 4.5537109375, 4.732421875, 4.9111328125, 5.08984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 15.0, 37.0, 117.0, 603.0, 25177.0, 1019129.0, 3102.0, 244.0, 52.0, 27.0, 20.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3626708984375, -9.053466796875, -8.7442626953125, -8.43505859375, -8.1258544921875, -7.816650390625, -7.5074462890625, -7.1982421875, -6.8890380859375, -6.579833984375, -6.2706298828125, -5.96142578125, -5.6522216796875, -5.343017578125, -5.0338134765625, -4.724609375, -4.4154052734375, -4.106201171875, -3.7969970703125, -3.48779296875, -3.1785888671875, -2.869384765625, -2.5601806640625, -2.2509765625, -1.9417724609375, -1.632568359375, -1.3233642578125, -1.01416015625, -0.7049560546875, -0.395751953125, -0.0865478515625, 0.22265625, 0.5318603515625, 0.841064453125, 1.1502685546875, 1.45947265625, 1.7686767578125, 2.077880859375, 2.3870849609375, 2.6962890625, 3.0054931640625, 3.314697265625, 3.6239013671875, 3.93310546875, 4.2423095703125, 4.551513671875, 4.8607177734375, 5.169921875, 5.4791259765625, 5.788330078125, 6.0975341796875, 6.40673828125, 6.7159423828125, 7.025146484375, 7.3343505859375, 7.6435546875, 7.9527587890625, 8.261962890625, 8.5711669921875, 8.88037109375, 9.1895751953125, 9.498779296875, 9.8079833984375, 10.1171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 14.0, 30.0, 35.0, 49.0, 72.0, 89.0, 115.0, 97.0, 114.0, 92.0, 69.0, 60.0, 49.0, 29.0, 23.0, 11.0, 12.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002415180206298828, -0.0002328045666217804, -0.00022409111261367798, -0.00021537765860557556, -0.00020666420459747314, -0.00019795075058937073, -0.0001892372965812683, -0.0001805238425731659, -0.00017181038856506348, -0.00016309693455696106, -0.00015438348054885864, -0.00014567002654075623, -0.0001369565725326538, -0.0001282431185245514, -0.00011952966451644897, -0.00011081621050834656, -0.00010210275650024414, -9.338930249214172e-05, -8.46758484840393e-05, -7.596239447593689e-05, -6.724894046783447e-05, -5.8535486459732056e-05, -4.982203245162964e-05, -4.110857844352722e-05, -3.2395124435424805e-05, -2.3681670427322388e-05, -1.496821641921997e-05, -6.254762411117554e-06, 2.4586915969848633e-06, 1.117214560508728e-05, 1.9885599613189697e-05, 2.8599053621292114e-05, 3.731250762939453e-05, 4.602596163749695e-05, 5.4739415645599365e-05, 6.345286965370178e-05, 7.21663236618042e-05, 8.087977766990662e-05, 8.959323167800903e-05, 9.830668568611145e-05, 0.00010702013969421387, 0.00011573359370231628, 0.0001244470477104187, 0.00013316050171852112, 0.00014187395572662354, 0.00015058740973472595, 0.00015930086374282837, 0.00016801431775093079, 0.0001767277717590332, 0.00018544122576713562, 0.00019415467977523804, 0.00020286813378334045, 0.00021158158779144287, 0.0002202950417995453, 0.0002290084958076477, 0.00023772194981575012, 0.00024643540382385254, 0.00025514885783195496, 0.0002638623118400574, 0.0002725757658481598, 0.0002812892198562622, 0.0002900026738643646, 0.00029871612787246704, 0.00030742958188056946, 0.0003161430358886719]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 15.0, 31.0, 101.0, 376.0, 4297.0, 1034390.0, 8596.0, 574.0, 113.0, 32.0, 10.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.90625, -17.52191162109375, -17.1375732421875, -16.75323486328125, -16.368896484375, -15.98455810546875, -15.6002197265625, -15.21588134765625, -14.83154296875, -14.44720458984375, -14.0628662109375, -13.67852783203125, -13.294189453125, -12.90985107421875, -12.5255126953125, -12.14117431640625, -11.7568359375, -11.37249755859375, -10.9881591796875, -10.60382080078125, -10.219482421875, -9.83514404296875, -9.4508056640625, -9.06646728515625, -8.68212890625, -8.29779052734375, -7.9134521484375, -7.52911376953125, -7.144775390625, -6.76043701171875, -6.3760986328125, -5.99176025390625, -5.607421875, -5.22308349609375, -4.8387451171875, -4.45440673828125, -4.070068359375, -3.68572998046875, -3.3013916015625, -2.91705322265625, -2.53271484375, -2.14837646484375, -1.7640380859375, -1.37969970703125, -0.995361328125, -0.61102294921875, -0.2266845703125, 0.15765380859375, 0.5419921875, 0.92633056640625, 1.3106689453125, 1.69500732421875, 2.079345703125, 2.46368408203125, 2.8480224609375, 3.23236083984375, 3.61669921875, 4.00103759765625, 4.3853759765625, 4.76971435546875, 5.154052734375, 5.53839111328125, 5.9227294921875, 6.30706787109375, 6.69140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 12.0, 28.0, 87.0, 151.0, 275.0, 224.0, 131.0, 56.0, 23.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.045257568359375, -0.97918701171875, -0.913116455078125, -0.8470458984375, -0.780975341796875, -0.71490478515625, -0.648834228515625, -0.582763671875, -0.516693115234375, -0.45062255859375, -0.384552001953125, -0.3184814453125, -0.252410888671875, -0.18634033203125, -0.120269775390625, -0.05419921875, 0.011871337890625, 0.07794189453125, 0.144012451171875, 0.2100830078125, 0.276153564453125, 0.34222412109375, 0.408294677734375, 0.474365234375, 0.540435791015625, 0.60650634765625, 0.672576904296875, 0.7386474609375, 0.804718017578125, 0.87078857421875, 0.936859130859375, 1.0029296875, 1.069000244140625, 1.13507080078125, 1.201141357421875, 1.2672119140625, 1.333282470703125, 1.39935302734375, 1.465423583984375, 1.531494140625, 1.597564697265625, 1.66363525390625, 1.729705810546875, 1.7957763671875, 1.861846923828125, 1.92791748046875, 1.993988037109375, 2.06005859375, 2.126129150390625, 2.19219970703125, 2.258270263671875, 2.3243408203125, 2.390411376953125, 2.45648193359375, 2.522552490234375, 2.588623046875, 2.654693603515625, 2.72076416015625, 2.786834716796875, 2.8529052734375, 2.918975830078125, 2.98504638671875, 3.051116943359375, 3.1171875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 13.0, 19.0, 44.0, 74.0, 88.0, 107.0, 104.0, 142.0, 112.0, 82.0, 82.0, 56.0, 26.0, 18.0, 13.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.801612377166748, -5.464967250823975, -5.128322124481201, -4.791677474975586, -4.4550323486328125, -4.118387222290039, -3.7817420959472656, -3.445096969604492, -3.1084518432617188, -2.7718067169189453, -2.435161590576172, -2.0985167026519775, -1.761871576309204, -1.4252264499664307, -1.0885815620422363, -0.7519364356994629, -0.41529130935668945, -0.07864624261856079, 0.25799882411956787, 0.5946438312530518, 0.9312889575958252, 1.2679340839385986, 1.604578971862793, 1.9412240982055664, 2.27786922454834, 2.6145143508911133, 2.9511594772338867, 3.287804365158081, 3.6244494915008545, 3.961094617843628, 4.297739505767822, 4.634384632110596, 4.971029281616211, 5.307674407958984, 5.644319534301758, 5.980964660644531, 6.317609786987305, 6.654254913330078, 6.990899562835693, 7.327544689178467, 7.66418981552124, 8.000834465026855, 8.337479591369629, 8.674124717712402, 9.010769844055176, 9.34741497039795, 9.684060096740723, 10.020705223083496, 10.35735034942627, 10.693995475769043, 11.030640602111816, 11.36728572845459, 11.703930854797363, 12.040575981140137, 12.377220153808594, 12.713865280151367, 13.05051040649414, 13.387155532836914, 13.723800659179688, 14.060445785522461, 14.397090911865234, 14.733736038208008, 15.070381164550781, 15.407026290893555, 15.743671417236328]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 4.0, 18.0, 12.0, 16.0, 19.0, 18.0, 20.0, 36.0, 23.0, 38.0, 38.0, 33.0, 36.0, 23.0, 35.0, 38.0, 45.0, 42.0, 41.0, 32.0, 60.0, 31.0, 31.0, 30.0, 31.0, 30.0, 27.0, 24.0, 26.0, 19.0, 20.0, 14.0, 12.0, 8.0, 12.0, 10.0, 11.0, 3.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.518416404724121, -7.246252059936523, -6.974087715148926, -6.701923370361328, -6.429759502410889, -6.157595157623291, -5.885430812835693, -5.613266468048096, -5.341102600097656, -5.068938255310059, -4.796773910522461, -4.524609565734863, -4.252445697784424, -3.980281352996826, -3.7081170082092285, -3.435952663421631, -3.163788318634033, -2.8916239738464355, -2.619459867477417, -2.3472955226898193, -2.075131416320801, -1.8029670715332031, -1.5308027267456055, -1.2586385011672974, -0.9864742755889893, -0.7143100500106812, -0.44214576482772827, -0.1699814796447754, 0.10218274593353271, 0.3743469715118408, 0.6465113162994385, 0.9186755418777466, 1.1908397674560547, 1.4630039930343628, 1.735168218612671, 2.0073325634002686, 2.279496669769287, 2.5516610145568848, 2.8238253593444824, 3.09598970413208, 3.3681538105010986, 3.6403181552886963, 3.912482261657715, 4.1846466064453125, 4.45681095123291, 4.728975296020508, 5.0011396408081055, 5.273303508758545, 5.545467853546143, 5.81763219833374, 6.089796543121338, 6.361960411071777, 6.634124755859375, 6.906289100646973, 7.17845344543457, 7.450617790222168, 7.722782135009766, 7.994946479797363, 8.267110824584961, 8.539275169372559, 8.811439514160156, 9.083602905273438, 9.355768203735352, 9.627931594848633, 9.90009593963623]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 9.0, 12.0, 13.0, 21.0, 21.0, 24.0, 36.0, 54.0, 63.0, 99.0, 129.0, 278.0, 472.0, 1168.0, 5634.0, 46226.0, 652203.0, 2822598.0, 615032.0, 42513.0, 5167.0, 1194.0, 490.0, 255.0, 167.0, 113.0, 81.0, 51.0, 32.0, 37.0, 19.0, 17.0, 13.0, 8.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.8079833984375, -6.584716796875, -6.3614501953125, -6.13818359375, -5.9149169921875, -5.691650390625, -5.4683837890625, -5.2451171875, -5.0218505859375, -4.798583984375, -4.5753173828125, -4.35205078125, -4.1287841796875, -3.905517578125, -3.6822509765625, -3.458984375, -3.2357177734375, -3.012451171875, -2.7891845703125, -2.56591796875, -2.3426513671875, -2.119384765625, -1.8961181640625, -1.6728515625, -1.4495849609375, -1.226318359375, -1.0030517578125, -0.77978515625, -0.5565185546875, -0.333251953125, -0.1099853515625, 0.11328125, 0.3365478515625, 0.559814453125, 0.7830810546875, 1.00634765625, 1.2296142578125, 1.452880859375, 1.6761474609375, 1.8994140625, 2.1226806640625, 2.345947265625, 2.5692138671875, 2.79248046875, 3.0157470703125, 3.239013671875, 3.4622802734375, 3.685546875, 3.9088134765625, 4.132080078125, 4.3553466796875, 4.57861328125, 4.8018798828125, 5.025146484375, 5.2484130859375, 5.4716796875, 5.6949462890625, 5.918212890625, 6.1414794921875, 6.36474609375, 6.5880126953125, 6.811279296875, 7.0345458984375, 7.2578125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 16.0, 17.0, 23.0, 23.0, 30.0, 38.0, 43.0, 38.0, 37.0, 38.0, 35.0, 45.0, 63.0, 41.0, 43.0, 48.0, 42.0, 41.0, 38.0, 41.0, 37.0, 30.0, 29.0, 20.0, 19.0, 27.0, 13.0, 7.0, 11.0, 3.0, 6.0, 9.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.647308349609375, -2.53875732421875, -2.430206298828125, -2.3216552734375, -2.213104248046875, -2.10455322265625, -1.996002197265625, -1.887451171875, -1.778900146484375, -1.67034912109375, -1.561798095703125, -1.4532470703125, -1.344696044921875, -1.23614501953125, -1.127593994140625, -1.01904296875, -0.910491943359375, -0.80194091796875, -0.693389892578125, -0.5848388671875, -0.476287841796875, -0.36773681640625, -0.259185791015625, -0.150634765625, -0.042083740234375, 0.06646728515625, 0.175018310546875, 0.2835693359375, 0.392120361328125, 0.50067138671875, 0.609222412109375, 0.7177734375, 0.826324462890625, 0.93487548828125, 1.043426513671875, 1.1519775390625, 1.260528564453125, 1.36907958984375, 1.477630615234375, 1.586181640625, 1.694732666015625, 1.80328369140625, 1.911834716796875, 2.0203857421875, 2.128936767578125, 2.23748779296875, 2.346038818359375, 2.45458984375, 2.563140869140625, 2.67169189453125, 2.780242919921875, 2.8887939453125, 2.997344970703125, 3.10589599609375, 3.214447021484375, 3.322998046875, 3.431549072265625, 3.54010009765625, 3.648651123046875, 3.7572021484375, 3.865753173828125, 3.97430419921875, 4.082855224609375, 4.19140625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 14.0, 19.0, 28.0, 62.0, 120.0, 265.0, 582.0, 1476.0, 7744.0, 403594.0, 3730275.0, 44919.0, 3418.0, 951.0, 371.0, 173.0, 92.0, 64.0, 37.0, 20.0, 16.0, 3.0, 7.0, 2.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7265625, -9.341796875, -8.95703125, -8.572265625, -8.1875, -7.802734375, -7.41796875, -7.033203125, -6.6484375, -6.263671875, -5.87890625, -5.494140625, -5.109375, -4.724609375, -4.33984375, -3.955078125, -3.5703125, -3.185546875, -2.80078125, -2.416015625, -2.03125, -1.646484375, -1.26171875, -0.876953125, -0.4921875, -0.107421875, 0.27734375, 0.662109375, 1.046875, 1.431640625, 1.81640625, 2.201171875, 2.5859375, 2.970703125, 3.35546875, 3.740234375, 4.125, 4.509765625, 4.89453125, 5.279296875, 5.6640625, 6.048828125, 6.43359375, 6.818359375, 7.203125, 7.587890625, 7.97265625, 8.357421875, 8.7421875, 9.126953125, 9.51171875, 9.896484375, 10.28125, 10.666015625, 11.05078125, 11.435546875, 11.8203125, 12.205078125, 12.58984375, 12.974609375, 13.359375, 13.744140625, 14.12890625, 14.513671875, 14.8984375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 18.0, 22.0, 37.0, 62.0, 88.0, 166.0, 282.0, 482.0, 610.0, 663.0, 594.0, 414.0, 249.0, 160.0, 75.0, 64.0, 33.0, 18.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.033203125, -2.9599151611328125, -2.886627197265625, -2.8133392333984375, -2.74005126953125, -2.6667633056640625, -2.593475341796875, -2.5201873779296875, -2.4468994140625, -2.3736114501953125, -2.300323486328125, -2.2270355224609375, -2.15374755859375, -2.0804595947265625, -2.007171630859375, -1.9338836669921875, -1.860595703125, -1.7873077392578125, -1.714019775390625, -1.6407318115234375, -1.56744384765625, -1.4941558837890625, -1.420867919921875, -1.3475799560546875, -1.2742919921875, -1.2010040283203125, -1.127716064453125, -1.0544281005859375, -0.98114013671875, -0.9078521728515625, -0.834564208984375, -0.7612762451171875, -0.68798828125, -0.6147003173828125, -0.541412353515625, -0.4681243896484375, -0.39483642578125, -0.3215484619140625, -0.248260498046875, -0.1749725341796875, -0.1016845703125, -0.0283966064453125, 0.044891357421875, 0.1181793212890625, 0.19146728515625, 0.2647552490234375, 0.338043212890625, 0.4113311767578125, 0.484619140625, 0.5579071044921875, 0.631195068359375, 0.7044830322265625, 0.77777099609375, 0.8510589599609375, 0.924346923828125, 0.9976348876953125, 1.0709228515625, 1.1442108154296875, 1.217498779296875, 1.2907867431640625, 1.36407470703125, 1.4373626708984375, 1.510650634765625, 1.5839385986328125, 1.6572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 13.0, 20.0, 32.0, 56.0, 64.0, 95.0, 88.0, 111.0, 108.0, 98.0, 97.0, 67.0, 52.0, 44.0, 17.0, 12.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.965921878814697, -6.728592395782471, -6.491262912750244, -6.253932952880859, -6.016603469848633, -5.779273986816406, -5.54194450378418, -5.304615020751953, -5.067285537719727, -4.8299560546875, -4.592626571655273, -4.355297088623047, -4.117967128753662, -3.8806376457214355, -3.643308162689209, -3.4059786796569824, -3.1686487197875977, -2.931319236755371, -2.6939895153045654, -2.456660032272339, -2.219330310821533, -1.9820008277893066, -1.74467134475708, -1.507341742515564, -1.2700121402740479, -1.0326825380325317, -0.7953529953956604, -0.5580234527587891, -0.32069385051727295, -0.08336424827575684, 0.15396523475646973, 0.39129483699798584, 0.6286249160766602, 0.8659545183181763, 1.1032841205596924, 1.340613603591919, 1.577943205833435, 1.8152728080749512, 2.0526022911071777, 2.2899317741394043, 2.52726149559021, 2.7645909786224365, 3.001920700073242, 3.2392501831054688, 3.4765796661376953, 3.713909387588501, 3.9512388706207275, 4.188568592071533, 4.42589807510376, 4.663227558135986, 4.900557041168213, 5.137887001037598, 5.375216484069824, 5.612545967102051, 5.849875450134277, 6.087204933166504, 6.3245344161987305, 6.561863899230957, 6.799193382263184, 7.03652286529541, 7.273852825164795, 7.5111823081970215, 7.748511791229248, 7.985841274261475, 8.22317123413086]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 4.0, 6.0, 10.0, 14.0, 12.0, 22.0, 21.0, 30.0, 43.0, 28.0, 36.0, 29.0, 40.0, 37.0, 33.0, 41.0, 48.0, 51.0, 57.0, 38.0, 44.0, 38.0, 35.0, 24.0, 33.0, 42.0, 32.0, 20.0, 27.0, 22.0, 16.0, 8.0, 12.0, 12.0, 12.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2223548889160156, -3.102600336074829, -2.9828457832336426, -2.863091230392456, -2.7433366775512695, -2.623582124710083, -2.5038275718688965, -2.38407301902771, -2.2643184661865234, -2.144563913345337, -2.0248093605041504, -1.9050548076629639, -1.7853002548217773, -1.6655457019805908, -1.5457911491394043, -1.4260365962982178, -1.3062820434570312, -1.1865274906158447, -1.0667729377746582, -0.9470183849334717, -0.8272638320922852, -0.7075092792510986, -0.5877547264099121, -0.4680001735687256, -0.34824562072753906, -0.22849106788635254, -0.10873651504516602, 0.011018037796020508, 0.13077259063720703, 0.25052714347839355, 0.3702816963195801, 0.4900362491607666, 0.6097908020019531, 0.7295453548431396, 0.8492999076843262, 0.9690544605255127, 1.0888090133666992, 1.2085635662078857, 1.3283181190490723, 1.4480726718902588, 1.5678272247314453, 1.6875817775726318, 1.8073363304138184, 1.9270908832550049, 2.0468454360961914, 2.166599988937378, 2.2863545417785645, 2.406109094619751, 2.5258636474609375, 2.645618200302124, 2.7653727531433105, 2.885127305984497, 3.0048818588256836, 3.12463641166687, 3.2443909645080566, 3.364145517349243, 3.4839000701904297, 3.603654623031616, 3.7234091758728027, 3.8431637287139893, 3.962918281555176, 4.082673072814941, 4.202427387237549, 4.322181701660156, 4.441936492919922]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 12.0, 8.0, 18.0, 27.0, 35.0, 66.0, 85.0, 120.0, 195.0, 298.0, 604.0, 1482.0, 5029.0, 21605.0, 102386.0, 364286.0, 396420.0, 120688.0, 26024.0, 5888.0, 1723.0, 671.0, 310.0, 198.0, 118.0, 88.0, 62.0, 37.0, 18.0, 23.0, 15.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7213592529296875, -0.695648193359375, -0.6699371337890625, -0.64422607421875, -0.6185150146484375, -0.592803955078125, -0.5670928955078125, -0.5413818359375, -0.5156707763671875, -0.489959716796875, -0.4642486572265625, -0.43853759765625, -0.4128265380859375, -0.387115478515625, -0.3614044189453125, -0.335693359375, -0.3099822998046875, -0.284271240234375, -0.2585601806640625, -0.23284912109375, -0.2071380615234375, -0.181427001953125, -0.1557159423828125, -0.1300048828125, -0.1042938232421875, -0.078582763671875, -0.0528717041015625, -0.02716064453125, -0.0014495849609375, 0.024261474609375, 0.0499725341796875, 0.07568359375, 0.1013946533203125, 0.127105712890625, 0.1528167724609375, 0.17852783203125, 0.2042388916015625, 0.229949951171875, 0.2556610107421875, 0.2813720703125, 0.3070831298828125, 0.332794189453125, 0.3585052490234375, 0.38421630859375, 0.4099273681640625, 0.435638427734375, 0.4613494873046875, 0.487060546875, 0.5127716064453125, 0.538482666015625, 0.5641937255859375, 0.58990478515625, 0.6156158447265625, 0.641326904296875, 0.6670379638671875, 0.6927490234375, 0.7184600830078125, 0.744171142578125, 0.7698822021484375, 0.79559326171875, 0.8213043212890625, 0.847015380859375, 0.8727264404296875, 0.8984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 14.0, 22.0, 21.0, 24.0, 31.0, 29.0, 31.0, 49.0, 45.0, 47.0, 51.0, 50.0, 56.0, 43.0, 51.0, 42.0, 55.0, 39.0, 40.0, 33.0, 41.0, 26.0, 24.0, 19.0, 25.0, 27.0, 11.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.413360595703125, -2.31500244140625, -2.216644287109375, -2.1182861328125, -2.019927978515625, -1.92156982421875, -1.823211669921875, -1.724853515625, -1.626495361328125, -1.52813720703125, -1.429779052734375, -1.3314208984375, -1.233062744140625, -1.13470458984375, -1.036346435546875, -0.93798828125, -0.839630126953125, -0.74127197265625, -0.642913818359375, -0.5445556640625, -0.446197509765625, -0.34783935546875, -0.249481201171875, -0.151123046875, -0.052764892578125, 0.04559326171875, 0.143951416015625, 0.2423095703125, 0.340667724609375, 0.43902587890625, 0.537384033203125, 0.6357421875, 0.734100341796875, 0.83245849609375, 0.930816650390625, 1.0291748046875, 1.127532958984375, 1.22589111328125, 1.324249267578125, 1.422607421875, 1.520965576171875, 1.61932373046875, 1.717681884765625, 1.8160400390625, 1.914398193359375, 2.01275634765625, 2.111114501953125, 2.20947265625, 2.307830810546875, 2.40618896484375, 2.504547119140625, 2.6029052734375, 2.701263427734375, 2.79962158203125, 2.897979736328125, 2.996337890625, 3.094696044921875, 3.19305419921875, 3.291412353515625, 3.3897705078125, 3.488128662109375, 3.58648681640625, 3.684844970703125, 3.783203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 3.0, 2.0, 3.0, 7.0, 9.0, 8.0, 13.0, 17.0, 33.0, 49.0, 75.0, 118.0, 202.0, 381.0, 679.0, 1243.0, 2234.0, 4116.0, 7302.0, 13050.0, 23364.0, 41017.0, 67781.0, 105310.0, 145979.0, 170716.0, 156315.0, 118778.0, 78559.0, 47858.0, 27999.0, 15777.0, 8755.0, 4797.0, 2572.0, 1518.0, 818.0, 454.0, 255.0, 137.0, 102.0, 34.0, 47.0, 21.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.255126953125, -0.247314453125, -0.239501953125, -0.231689453125, -0.223876953125, -0.216064453125, -0.208251953125, -0.200439453125, -0.192626953125, -0.184814453125, -0.177001953125, -0.169189453125, -0.161376953125, -0.153564453125, -0.145751953125, -0.137939453125, -0.130126953125, -0.122314453125, -0.114501953125, -0.106689453125, -0.098876953125, -0.091064453125, -0.083251953125, -0.075439453125, -0.067626953125, -0.059814453125, -0.052001953125, -0.044189453125, -0.036376953125, -0.028564453125, -0.020751953125, -0.012939453125, -0.005126953125, 0.002685546875, 0.010498046875, 0.018310546875, 0.026123046875, 0.033935546875, 0.041748046875, 0.049560546875, 0.057373046875, 0.065185546875, 0.072998046875, 0.080810546875, 0.088623046875, 0.096435546875, 0.104248046875, 0.112060546875, 0.119873046875, 0.127685546875, 0.135498046875, 0.143310546875, 0.151123046875, 0.158935546875, 0.166748046875, 0.174560546875, 0.182373046875, 0.190185546875, 0.197998046875, 0.205810546875, 0.213623046875, 0.221435546875, 0.229248046875, 0.237060546875, 0.244873046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 4.0, 4.0, 6.0, 4.0, 13.0, 14.0, 18.0, 6.0, 15.0, 13.0, 18.0, 23.0, 26.0, 20.0, 45.0, 27.0, 36.0, 35.0, 22.0, 54.0, 33.0, 42.0, 38.0, 37.0, 36.0, 41.0, 41.0, 29.0, 29.0, 35.0, 34.0, 33.0, 24.0, 18.0, 24.0, 9.0, 13.0, 16.0, 10.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.94921875, -4.7945556640625, -4.639892578125, -4.4852294921875, -4.33056640625, -4.1759033203125, -4.021240234375, -3.8665771484375, -3.7119140625, -3.5572509765625, -3.402587890625, -3.2479248046875, -3.09326171875, -2.9385986328125, -2.783935546875, -2.6292724609375, -2.474609375, -2.3199462890625, -2.165283203125, -2.0106201171875, -1.85595703125, -1.7012939453125, -1.546630859375, -1.3919677734375, -1.2373046875, -1.0826416015625, -0.927978515625, -0.7733154296875, -0.61865234375, -0.4639892578125, -0.309326171875, -0.1546630859375, 0.0, 0.1546630859375, 0.309326171875, 0.4639892578125, 0.61865234375, 0.7733154296875, 0.927978515625, 1.0826416015625, 1.2373046875, 1.3919677734375, 1.546630859375, 1.7012939453125, 1.85595703125, 2.0106201171875, 2.165283203125, 2.3199462890625, 2.474609375, 2.6292724609375, 2.783935546875, 2.9385986328125, 3.09326171875, 3.2479248046875, 3.402587890625, 3.5572509765625, 3.7119140625, 3.8665771484375, 4.021240234375, 4.1759033203125, 4.33056640625, 4.4852294921875, 4.639892578125, 4.7945556640625, 4.94921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 9.0, 20.0, 35.0, 44.0, 54.0, 107.0, 180.0, 265.0, 474.0, 760.0, 1307.0, 2504.0, 5203.0, 12575.0, 36906.0, 122801.0, 362076.0, 337527.0, 110207.0, 33415.0, 11618.0, 4875.0, 2352.0, 1286.0, 738.0, 435.0, 271.0, 154.0, 118.0, 68.0, 54.0, 27.0, 24.0, 9.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0765380859375, -0.07434844970703125, -0.0721588134765625, -0.06996917724609375, -0.067779541015625, -0.06558990478515625, -0.0634002685546875, -0.06121063232421875, -0.05902099609375, -0.05683135986328125, -0.0546417236328125, -0.05245208740234375, -0.050262451171875, -0.04807281494140625, -0.0458831787109375, -0.04369354248046875, -0.04150390625, -0.03931427001953125, -0.0371246337890625, -0.03493499755859375, -0.032745361328125, -0.03055572509765625, -0.0283660888671875, -0.02617645263671875, -0.02398681640625, -0.02179718017578125, -0.0196075439453125, -0.01741790771484375, -0.015228271484375, -0.01303863525390625, -0.0108489990234375, -0.00865936279296875, -0.0064697265625, -0.00428009033203125, -0.0020904541015625, 9.918212890625e-05, 0.002288818359375, 0.00447845458984375, 0.0066680908203125, 0.00885772705078125, 0.01104736328125, 0.01323699951171875, 0.0154266357421875, 0.01761627197265625, 0.019805908203125, 0.02199554443359375, 0.0241851806640625, 0.02637481689453125, 0.028564453125, 0.03075408935546875, 0.0329437255859375, 0.03513336181640625, 0.037322998046875, 0.03951263427734375, 0.0417022705078125, 0.04389190673828125, 0.04608154296875, 0.04827117919921875, 0.0504608154296875, 0.05265045166015625, 0.054840087890625, 0.05702972412109375, 0.0592193603515625, 0.06140899658203125, 0.0635986328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 2.0, 6.0, 7.0, 13.0, 16.0, 20.0, 36.0, 46.0, 59.0, 61.0, 84.0, 100.0, 84.0, 81.0, 118.0, 69.0, 55.0, 42.0, 35.0, 21.0, 10.0, 13.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.644559860229492e-05, -5.42299821972847e-05, -5.2014365792274475e-05, -4.979874938726425e-05, -4.758313298225403e-05, -4.5367516577243805e-05, -4.315190017223358e-05, -4.093628376722336e-05, -3.8720667362213135e-05, -3.650505095720291e-05, -3.428943455219269e-05, -3.2073818147182465e-05, -2.985820174217224e-05, -2.7642585337162018e-05, -2.5426968932151794e-05, -2.321135252714157e-05, -2.0995736122131348e-05, -1.8780119717121124e-05, -1.65645033121109e-05, -1.4348886907100677e-05, -1.2133270502090454e-05, -9.91765409708023e-06, -7.702037692070007e-06, -5.486421287059784e-06, -3.2708048820495605e-06, -1.0551884770393372e-06, 1.1604279279708862e-06, 3.3760443329811096e-06, 5.591660737991333e-06, 7.807277143001556e-06, 1.002289354801178e-05, 1.2238509953022003e-05, 1.4454126358032227e-05, 1.666974276304245e-05, 1.8885359168052673e-05, 2.1100975573062897e-05, 2.331659197807312e-05, 2.5532208383083344e-05, 2.7747824788093567e-05, 2.996344119310379e-05, 3.2179057598114014e-05, 3.439467400312424e-05, 3.661029040813446e-05, 3.8825906813144684e-05, 4.104152321815491e-05, 4.325713962316513e-05, 4.5472756028175354e-05, 4.768837243318558e-05, 4.99039888381958e-05, 5.2119605243206024e-05, 5.433522164821625e-05, 5.655083805322647e-05, 5.8766454458236694e-05, 6.098207086324692e-05, 6.319768726825714e-05, 6.541330367326736e-05, 6.762892007827759e-05, 6.984453648328781e-05, 7.206015288829803e-05, 7.427576929330826e-05, 7.649138569831848e-05, 7.87070021033287e-05, 8.092261850833893e-05, 8.313823491334915e-05, 8.535385131835938e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 13.0, 9.0, 13.0, 20.0, 21.0, 20.0, 41.0, 61.0, 92.0, 155.0, 222.0, 435.0, 965.0, 1961.0, 4932.0, 14452.0, 56143.0, 297355.0, 514291.0, 117463.0, 26172.0, 7925.0, 2966.0, 1303.0, 596.0, 331.0, 207.0, 105.0, 85.0, 58.0, 40.0, 22.0, 13.0, 15.0, 7.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09033203125, -0.08743953704833984, -0.08454704284667969, -0.08165454864501953, -0.07876205444335938, -0.07586956024169922, -0.07297706604003906, -0.0700845718383789, -0.06719207763671875, -0.0642995834350586, -0.06140708923339844, -0.05851459503173828, -0.055622100830078125, -0.05272960662841797, -0.04983711242675781, -0.046944618225097656, -0.0440521240234375, -0.041159629821777344, -0.03826713562011719, -0.03537464141845703, -0.032482147216796875, -0.02958965301513672, -0.026697158813476562, -0.023804664611816406, -0.02091217041015625, -0.018019676208496094, -0.015127182006835938, -0.012234687805175781, -0.009342193603515625, -0.006449699401855469, -0.0035572052001953125, -0.0006647109985351562, 0.002227783203125, 0.005120277404785156, 0.008012771606445312, 0.010905265808105469, 0.013797760009765625, 0.01669025421142578, 0.019582748413085938, 0.022475242614746094, 0.02536773681640625, 0.028260231018066406, 0.031152725219726562, 0.03404521942138672, 0.036937713623046875, 0.03983020782470703, 0.04272270202636719, 0.045615196228027344, 0.0485076904296875, 0.051400184631347656, 0.05429267883300781, 0.05718517303466797, 0.060077667236328125, 0.06297016143798828, 0.06586265563964844, 0.0687551498413086, 0.07164764404296875, 0.0745401382446289, 0.07743263244628906, 0.08032512664794922, 0.08321762084960938, 0.08611011505126953, 0.08900260925292969, 0.09189510345458984, 0.09478759765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 0.0, 3.0, 4.0, 0.0, 4.0, 9.0, 14.0, 11.0, 16.0, 19.0, 28.0, 31.0, 38.0, 58.0, 44.0, 66.0, 64.0, 85.0, 69.0, 74.0, 66.0, 49.0, 51.0, 43.0, 29.0, 19.0, 25.0, 14.0, 14.0, 7.0, 7.0, 7.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.024627685546875, -0.023868560791015625, -0.02310943603515625, -0.022350311279296875, -0.0215911865234375, -0.020832061767578125, -0.02007293701171875, -0.019313812255859375, -0.0185546875, -0.017795562744140625, -0.01703643798828125, -0.016277313232421875, -0.0155181884765625, -0.014759063720703125, -0.01399993896484375, -0.013240814208984375, -0.012481689453125, -0.011722564697265625, -0.01096343994140625, -0.010204315185546875, -0.0094451904296875, -0.008686065673828125, -0.00792694091796875, -0.007167816162109375, -0.00640869140625, -0.005649566650390625, -0.00489044189453125, -0.004131317138671875, -0.0033721923828125, -0.002613067626953125, -0.00185394287109375, -0.001094818115234375, -0.000335693359375, 0.000423431396484375, 0.00118255615234375, 0.001941680908203125, 0.0027008056640625, 0.003459930419921875, 0.00421905517578125, 0.004978179931640625, 0.0057373046875, 0.006496429443359375, 0.00725555419921875, 0.008014678955078125, 0.0087738037109375, 0.009532928466796875, 0.01029205322265625, 0.011051177978515625, 0.011810302734375, 0.012569427490234375, 0.01332855224609375, 0.014087677001953125, 0.0148468017578125, 0.015605926513671875, 0.01636505126953125, 0.017124176025390625, 0.01788330078125, 0.018642425537109375, 0.01940155029296875, 0.020160675048828125, 0.0209197998046875, 0.021678924560546875, 0.02243804931640625, 0.023197174072265625, 0.023956298828125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 25.0, 65.0, 154.0, 265.0, 234.0, 165.0, 67.0, 20.0, 10.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.17115592956543, -14.826726913452148, -14.482297897338867, -14.137869834899902, -13.793440818786621, -13.44901180267334, -13.104583740234375, -12.760154724121094, -12.415725708007812, -12.071296691894531, -11.72686767578125, -11.382439613342285, -11.038010597229004, -10.693581581115723, -10.349153518676758, -10.004724502563477, -9.660295486450195, -9.315866470336914, -8.971437454223633, -8.627009391784668, -8.282580375671387, -7.9381513595581055, -7.593722820281982, -7.249294281005859, -6.904865264892578, -6.560436248779297, -6.216007709503174, -5.871579170227051, -5.5271501541137695, -5.182721138000488, -4.838292598724365, -4.493864059448242, -4.149434566497803, -3.8050057888031006, -3.4605770111083984, -3.1161482334136963, -2.771719455718994, -2.427290678024292, -2.08286190032959, -1.7384331226348877, -1.3940043449401855, -1.0495755672454834, -0.7051467895507812, -0.3607180118560791, -0.016289234161376953, 0.3281395435333252, 0.6725683212280273, 1.0169970989227295, 1.3614258766174316, 1.7058546543121338, 2.050283432006836, 2.394712209701538, 2.7391409873962402, 3.0835697650909424, 3.4279985427856445, 3.7724273204803467, 4.116856098175049, 4.461284637451172, 4.805713653564453, 5.150142669677734, 5.494571208953857, 5.8389997482299805, 6.183428764343262, 6.527857780456543, 6.872286319732666]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 7.0, 9.0, 5.0, 14.0, 11.0, 17.0, 23.0, 30.0, 39.0, 40.0, 32.0, 40.0, 37.0, 40.0, 37.0, 49.0, 60.0, 54.0, 47.0, 46.0, 41.0, 34.0, 36.0, 33.0, 41.0, 35.0, 24.0, 19.0, 23.0, 17.0, 12.0, 20.0, 8.0, 7.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.383441686630249, -2.2934117317199707, -2.2033820152282715, -2.113352060317993, -2.023322105407715, -1.9332923889160156, -1.8432624340057373, -1.7532325983047485, -1.6632027626037598, -1.573172926902771, -1.4831430912017822, -1.393113136291504, -1.3030833005905151, -1.2130534648895264, -1.123023509979248, -1.0329936742782593, -0.9429638385772705, -0.8529340028762817, -0.7629041075706482, -0.6728742122650146, -0.5828443765640259, -0.4928145110607147, -0.40278464555740356, -0.31275475025177, -0.22272491455078125, -0.1326950490474701, -0.042665183544158936, 0.04736468195915222, 0.13739454746246338, 0.22742441296577454, 0.3174542784690857, 0.40748417377471924, 0.4975137710571289, 0.5875436067581177, 0.6775735020637512, 0.7676033973693848, 0.8576332330703735, 0.9476630687713623, 1.0376930236816406, 1.1277228593826294, 1.2177526950836182, 1.307782530784607, 1.3978123664855957, 1.487842321395874, 1.5778721570968628, 1.6679019927978516, 1.7579319477081299, 1.8479617834091187, 1.9379916191101074, 2.0280215740203857, 2.118051290512085, 2.2080812454223633, 2.2981109619140625, 2.388140916824341, 2.478170871734619, 2.5682005882263184, 2.6582305431365967, 2.748260498046875, 2.838290214538574, 2.9283201694488525, 3.018350124359131, 3.10837984085083, 3.1984097957611084, 3.2884397506713867, 3.378469467163086]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 15.0, 16.0, 45.0, 57.0, 115.0, 304.0, 653.0, 1746.0, 6120.0, 23515.0, 91917.0, 425766.0, 383943.0, 84410.0, 21451.0, 5602.0, 1632.0, 639.0, 271.0, 145.0, 74.0, 42.0, 20.0, 16.0, 8.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.73114013671875, -2.6068115234375, -2.48248291015625, -2.358154296875, -2.23382568359375, -2.1094970703125, -1.98516845703125, -1.86083984375, -1.73651123046875, -1.6121826171875, -1.48785400390625, -1.363525390625, -1.23919677734375, -1.1148681640625, -0.99053955078125, -0.8662109375, -0.74188232421875, -0.6175537109375, -0.49322509765625, -0.368896484375, -0.24456787109375, -0.1202392578125, 0.00408935546875, 0.12841796875, 0.25274658203125, 0.3770751953125, 0.50140380859375, 0.625732421875, 0.75006103515625, 0.8743896484375, 0.99871826171875, 1.123046875, 1.24737548828125, 1.3717041015625, 1.49603271484375, 1.620361328125, 1.74468994140625, 1.8690185546875, 1.99334716796875, 2.11767578125, 2.24200439453125, 2.3663330078125, 2.49066162109375, 2.614990234375, 2.73931884765625, 2.8636474609375, 2.98797607421875, 3.1123046875, 3.23663330078125, 3.3609619140625, 3.48529052734375, 3.609619140625, 3.73394775390625, 3.8582763671875, 3.98260498046875, 4.10693359375, 4.23126220703125, 4.3555908203125, 4.47991943359375, 4.604248046875, 4.72857666015625, 4.8529052734375, 4.97723388671875, 5.1015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 17.0, 15.0, 13.0, 23.0, 20.0, 33.0, 28.0, 31.0, 39.0, 44.0, 36.0, 35.0, 37.0, 50.0, 35.0, 43.0, 44.0, 41.0, 44.0, 35.0, 33.0, 36.0, 24.0, 42.0, 20.0, 24.0, 18.0, 23.0, 13.0, 21.0, 13.0, 17.0, 2.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.36138916015625, -4.2149658203125, -4.06854248046875, -3.922119140625, -3.77569580078125, -3.6292724609375, -3.48284912109375, -3.33642578125, -3.19000244140625, -3.0435791015625, -2.89715576171875, -2.750732421875, -2.60430908203125, -2.4578857421875, -2.31146240234375, -2.1650390625, -2.01861572265625, -1.8721923828125, -1.72576904296875, -1.579345703125, -1.43292236328125, -1.2864990234375, -1.14007568359375, -0.99365234375, -0.84722900390625, -0.7008056640625, -0.55438232421875, -0.407958984375, -0.26153564453125, -0.1151123046875, 0.03131103515625, 0.177734375, 0.32415771484375, 0.4705810546875, 0.61700439453125, 0.763427734375, 0.90985107421875, 1.0562744140625, 1.20269775390625, 1.34912109375, 1.49554443359375, 1.6419677734375, 1.78839111328125, 1.934814453125, 2.08123779296875, 2.2276611328125, 2.37408447265625, 2.5205078125, 2.66693115234375, 2.8133544921875, 2.95977783203125, 3.106201171875, 3.25262451171875, 3.3990478515625, 3.54547119140625, 3.69189453125, 3.83831787109375, 3.9847412109375, 4.13116455078125, 4.277587890625, 4.42401123046875, 4.5704345703125, 4.71685791015625, 4.86328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 10.0, 5.0, 6.0, 20.0, 20.0, 17.0, 23.0, 34.0, 53.0, 104.0, 141.0, 307.0, 906.0, 17036.0, 941460.0, 85841.0, 1593.0, 447.0, 180.0, 95.0, 65.0, 32.0, 36.0, 16.0, 17.0, 15.0, 13.0, 11.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.734375, -14.33251953125, -13.9306640625, -13.52880859375, -13.126953125, -12.72509765625, -12.3232421875, -11.92138671875, -11.51953125, -11.11767578125, -10.7158203125, -10.31396484375, -9.912109375, -9.51025390625, -9.1083984375, -8.70654296875, -8.3046875, -7.90283203125, -7.5009765625, -7.09912109375, -6.697265625, -6.29541015625, -5.8935546875, -5.49169921875, -5.08984375, -4.68798828125, -4.2861328125, -3.88427734375, -3.482421875, -3.08056640625, -2.6787109375, -2.27685546875, -1.875, -1.47314453125, -1.0712890625, -0.66943359375, -0.267578125, 0.13427734375, 0.5361328125, 0.93798828125, 1.33984375, 1.74169921875, 2.1435546875, 2.54541015625, 2.947265625, 3.34912109375, 3.7509765625, 4.15283203125, 4.5546875, 4.95654296875, 5.3583984375, 5.76025390625, 6.162109375, 6.56396484375, 6.9658203125, 7.36767578125, 7.76953125, 8.17138671875, 8.5732421875, 8.97509765625, 9.376953125, 9.77880859375, 10.1806640625, 10.58251953125, 10.984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 8.0, 7.0, 12.0, 11.0, 11.0, 21.0, 19.0, 19.0, 41.0, 19.0, 23.0, 16.0, 29.0, 41.0, 42.0, 41.0, 51.0, 44.0, 41.0, 51.0, 33.0, 48.0, 47.0, 35.0, 27.0, 47.0, 24.0, 27.0, 22.0, 17.0, 26.0, 17.0, 13.0, 12.0, 9.0, 5.0, 6.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.7421875, -5.56597900390625, -5.3897705078125, -5.21356201171875, -5.037353515625, -4.86114501953125, -4.6849365234375, -4.50872802734375, -4.33251953125, -4.15631103515625, -3.9801025390625, -3.80389404296875, -3.627685546875, -3.45147705078125, -3.2752685546875, -3.09906005859375, -2.9228515625, -2.74664306640625, -2.5704345703125, -2.39422607421875, -2.218017578125, -2.04180908203125, -1.8656005859375, -1.68939208984375, -1.51318359375, -1.33697509765625, -1.1607666015625, -0.98455810546875, -0.808349609375, -0.63214111328125, -0.4559326171875, -0.27972412109375, -0.103515625, 0.07269287109375, 0.2489013671875, 0.42510986328125, 0.601318359375, 0.77752685546875, 0.9537353515625, 1.12994384765625, 1.30615234375, 1.48236083984375, 1.6585693359375, 1.83477783203125, 2.010986328125, 2.18719482421875, 2.3634033203125, 2.53961181640625, 2.7158203125, 2.89202880859375, 3.0682373046875, 3.24444580078125, 3.420654296875, 3.59686279296875, 3.7730712890625, 3.94927978515625, 4.12548828125, 4.30169677734375, 4.4779052734375, 4.65411376953125, 4.830322265625, 5.00653076171875, 5.1827392578125, 5.35894775390625, 5.53515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 4.0, 11.0, 10.0, 17.0, 34.0, 52.0, 104.0, 207.0, 687.0, 3110.0, 52271.0, 965863.0, 22897.0, 2334.0, 539.0, 176.0, 90.0, 51.0, 29.0, 20.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.11846923828125, -3.9830322265625, -3.84759521484375, -3.712158203125, -3.57672119140625, -3.4412841796875, -3.30584716796875, -3.17041015625, -3.03497314453125, -2.8995361328125, -2.76409912109375, -2.628662109375, -2.49322509765625, -2.3577880859375, -2.22235107421875, -2.0869140625, -1.95147705078125, -1.8160400390625, -1.68060302734375, -1.545166015625, -1.40972900390625, -1.2742919921875, -1.13885498046875, -1.00341796875, -0.86798095703125, -0.7325439453125, -0.59710693359375, -0.461669921875, -0.32623291015625, -0.1907958984375, -0.05535888671875, 0.080078125, 0.21551513671875, 0.3509521484375, 0.48638916015625, 0.621826171875, 0.75726318359375, 0.8927001953125, 1.02813720703125, 1.16357421875, 1.29901123046875, 1.4344482421875, 1.56988525390625, 1.705322265625, 1.84075927734375, 1.9761962890625, 2.11163330078125, 2.2470703125, 2.38250732421875, 2.5179443359375, 2.65338134765625, 2.788818359375, 2.92425537109375, 3.0596923828125, 3.19512939453125, 3.33056640625, 3.46600341796875, 3.6014404296875, 3.73687744140625, 3.872314453125, 4.00775146484375, 4.1431884765625, 4.27862548828125, 4.4140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 22.0, 27.0, 44.0, 48.0, 64.0, 98.0, 172.0, 162.0, 104.0, 64.0, 52.0, 38.0, 30.0, 17.0, 14.0, 12.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003829002380371094, -0.00037333741784095764, -0.0003637745976448059, -0.0003542117774486542, -0.00034464895725250244, -0.0003350861370563507, -0.000325523316860199, -0.00031596049666404724, -0.0003063976764678955, -0.0002968348562717438, -0.00028727203607559204, -0.0002777092158794403, -0.0002681463956832886, -0.00025858357548713684, -0.0002490207552909851, -0.00023945793509483337, -0.00022989511489868164, -0.0002203322947025299, -0.00021076947450637817, -0.00020120665431022644, -0.0001916438341140747, -0.00018208101391792297, -0.00017251819372177124, -0.0001629553735256195, -0.00015339255332946777, -0.00014382973313331604, -0.0001342669129371643, -0.00012470409274101257, -0.00011514127254486084, -0.0001055784523487091, -9.601563215255737e-05, -8.645281195640564e-05, -7.68899917602539e-05, -6.732717156410217e-05, -5.776435136795044e-05, -4.8201531171798706e-05, -3.863871097564697e-05, -2.907589077949524e-05, -1.9513070583343506e-05, -9.950250387191772e-06, -3.8743019104003906e-07, 9.175390005111694e-06, 1.8738210201263428e-05, 2.830103039741516e-05, 3.7863850593566895e-05, 4.742667078971863e-05, 5.698949098587036e-05, 6.65523111820221e-05, 7.611513137817383e-05, 8.567795157432556e-05, 9.52407717704773e-05, 0.00010480359196662903, 0.00011436641216278076, 0.0001239292323589325, 0.00013349205255508423, 0.00014305487275123596, 0.0001526176929473877, 0.00016218051314353943, 0.00017174333333969116, 0.0001813061535358429, 0.00019086897373199463, 0.00020043179392814636, 0.0002099946141242981, 0.00021955743432044983, 0.00022912025451660156]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 9.0, 22.0, 20.0, 23.0, 38.0, 76.0, 135.0, 268.0, 547.0, 1665.0, 7593.0, 445688.0, 581148.0, 8264.0, 1792.0, 592.0, 275.0, 133.0, 100.0, 51.0, 29.0, 14.0, 19.0, 12.0, 6.0, 9.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.7509765625, -4.611328125, -4.4716796875, -4.33203125, -4.1923828125, -4.052734375, -3.9130859375, -3.7734375, -3.6337890625, -3.494140625, -3.3544921875, -3.21484375, -3.0751953125, -2.935546875, -2.7958984375, -2.65625, -2.5166015625, -2.376953125, -2.2373046875, -2.09765625, -1.9580078125, -1.818359375, -1.6787109375, -1.5390625, -1.3994140625, -1.259765625, -1.1201171875, -0.98046875, -0.8408203125, -0.701171875, -0.5615234375, -0.421875, -0.2822265625, -0.142578125, -0.0029296875, 0.13671875, 0.2763671875, 0.416015625, 0.5556640625, 0.6953125, 0.8349609375, 0.974609375, 1.1142578125, 1.25390625, 1.3935546875, 1.533203125, 1.6728515625, 1.8125, 1.9521484375, 2.091796875, 2.2314453125, 2.37109375, 2.5107421875, 2.650390625, 2.7900390625, 2.9296875, 3.0693359375, 3.208984375, 3.3486328125, 3.48828125, 3.6279296875, 3.767578125, 3.9072265625, 4.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 14.0, 15.0, 14.0, 31.0, 23.0, 39.0, 54.0, 69.0, 82.0, 182.0, 149.0, 74.0, 79.0, 41.0, 34.0, 25.0, 21.0, 20.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88232421875, -0.8546600341796875, -0.826995849609375, -0.7993316650390625, -0.77166748046875, -0.7440032958984375, -0.716339111328125, -0.6886749267578125, -0.6610107421875, -0.6333465576171875, -0.605682373046875, -0.5780181884765625, -0.55035400390625, -0.5226898193359375, -0.495025634765625, -0.4673614501953125, -0.439697265625, -0.4120330810546875, -0.384368896484375, -0.3567047119140625, -0.32904052734375, -0.3013763427734375, -0.273712158203125, -0.2460479736328125, -0.2183837890625, -0.1907196044921875, -0.163055419921875, -0.1353912353515625, -0.10772705078125, -0.0800628662109375, -0.052398681640625, -0.0247344970703125, 0.0029296875, 0.0305938720703125, 0.058258056640625, 0.0859222412109375, 0.11358642578125, 0.1412506103515625, 0.168914794921875, 0.1965789794921875, 0.2242431640625, 0.2519073486328125, 0.279571533203125, 0.3072357177734375, 0.33489990234375, 0.3625640869140625, 0.390228271484375, 0.4178924560546875, 0.445556640625, 0.4732208251953125, 0.500885009765625, 0.5285491943359375, 0.55621337890625, 0.5838775634765625, 0.611541748046875, 0.6392059326171875, 0.6668701171875, 0.6945343017578125, 0.722198486328125, 0.7498626708984375, 0.77752685546875, 0.8051910400390625, 0.832855224609375, 0.8605194091796875, 0.88818359375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 12.0, 20.0, 27.0, 46.0, 66.0, 66.0, 98.0, 121.0, 121.0, 102.0, 81.0, 80.0, 66.0, 34.0, 23.0, 17.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.639266014099121, -8.355813980102539, -8.072362899780273, -7.788910865783691, -7.505458831787109, -7.2220072746276855, -6.938555717468262, -6.65510368347168, -6.371652126312256, -6.088200569152832, -5.80474853515625, -5.521296977996826, -5.237845420837402, -4.95439338684082, -4.6709418296813965, -4.387490272521973, -4.104038238525391, -3.8205864429473877, -3.5371346473693848, -3.253683090209961, -2.970231294631958, -2.686779499053955, -2.4033279418945312, -2.1198761463165283, -1.8364243507385254, -1.5529725551605225, -1.269520878791809, -0.9860691428184509, -0.7026174068450928, -0.41916561126708984, -0.13571393489837646, 0.14773774147033691, 0.43119049072265625, 0.7146422266960144, 0.9980939626693726, 1.281545639038086, 1.5649974346160889, 1.8484492301940918, 2.1319007873535156, 2.4153525829315186, 2.6988043785095215, 2.9822561740875244, 3.2657079696655273, 3.549159526824951, 3.832611322402954, 4.116063117980957, 4.399514675140381, 4.682966232299805, 4.966418266296387, 5.2498698234558105, 5.533321857452393, 5.816773414611816, 6.100225448608398, 6.383677005767822, 6.667128562927246, 6.950580596923828, 7.234032154083252, 7.517483711242676, 7.800935745239258, 8.08438777923584, 8.367838859558105, 8.651290893554688, 8.93474292755127, 9.218194007873535, 9.501646041870117]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 4.0, 10.0, 1.0, 8.0, 11.0, 9.0, 5.0, 14.0, 14.0, 19.0, 15.0, 24.0, 26.0, 23.0, 27.0, 22.0, 29.0, 28.0, 37.0, 37.0, 20.0, 23.0, 45.0, 39.0, 27.0, 43.0, 22.0, 38.0, 29.0, 29.0, 25.0, 28.0, 25.0, 27.0, 31.0, 24.0, 20.0, 10.0, 14.0, 16.0, 17.0, 12.0, 10.0, 10.0, 9.0, 7.0, 6.0, 5.0, 1.0, 0.0, 8.0, 3.0, 5.0, 2.0, 1.0], "bins": [-7.011007308959961, -6.798781871795654, -6.586556911468506, -6.374331474304199, -6.162106037139893, -5.949880599975586, -5.7376556396484375, -5.525430202484131, -5.313204765319824, -5.100979328155518, -4.888754367828369, -4.6765289306640625, -4.464303493499756, -4.252078056335449, -4.039853096008301, -3.827627658843994, -3.6154024600982666, -3.403177261352539, -3.1909518241882324, -2.978726625442505, -2.7665011882781982, -2.5542759895324707, -2.342050552368164, -2.1298253536224365, -1.9176000356674194, -1.7053747177124023, -1.4931493997573853, -1.2809240818023682, -1.0686988830566406, -0.8564735651016235, -0.6442482471466064, -0.43202292919158936, -0.21979761123657227, -0.00757230818271637, 0.20465299487113953, 0.41687828302383423, 0.6291036009788513, 0.8413288593292236, 1.0535541772842407, 1.2657794952392578, 1.478004813194275, 1.690230131149292, 1.902455449104309, 2.114680767059326, 2.3269059658050537, 2.5391311645507812, 2.751356601715088, 2.9635820388793945, 3.175807237625122, 3.3880324363708496, 3.6002578735351562, 3.812483072280884, 4.024708271026611, 4.236933708190918, 4.449159145355225, 4.661384582519531, 4.87360954284668, 5.085834980010986, 5.298059940338135, 5.510285377502441, 5.722510814666748, 5.934736251831055, 6.146961212158203, 6.35918664932251, 6.571412086486816]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 17.0, 18.0, 33.0, 42.0, 47.0, 74.0, 125.0, 173.0, 323.0, 629.0, 1636.0, 5951.0, 31966.0, 261035.0, 1890414.0, 1748611.0, 217538.0, 27089.0, 5367.0, 1541.0, 604.0, 344.0, 209.0, 125.0, 101.0, 67.0, 41.0, 31.0, 25.0, 20.0, 16.0, 14.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.43841552734375, -4.2674560546875, -4.09649658203125, -3.925537109375, -3.75457763671875, -3.5836181640625, -3.41265869140625, -3.24169921875, -3.07073974609375, -2.8997802734375, -2.72882080078125, -2.557861328125, -2.38690185546875, -2.2159423828125, -2.04498291015625, -1.8740234375, -1.70306396484375, -1.5321044921875, -1.36114501953125, -1.190185546875, -1.01922607421875, -0.8482666015625, -0.67730712890625, -0.50634765625, -0.33538818359375, -0.1644287109375, 0.00653076171875, 0.177490234375, 0.34844970703125, 0.5194091796875, 0.69036865234375, 0.861328125, 1.03228759765625, 1.2032470703125, 1.37420654296875, 1.545166015625, 1.71612548828125, 1.8870849609375, 2.05804443359375, 2.22900390625, 2.39996337890625, 2.5709228515625, 2.74188232421875, 2.912841796875, 3.08380126953125, 3.2547607421875, 3.42572021484375, 3.5966796875, 3.76763916015625, 3.9385986328125, 4.10955810546875, 4.280517578125, 4.45147705078125, 4.6224365234375, 4.79339599609375, 4.96435546875, 5.13531494140625, 5.3062744140625, 5.47723388671875, 5.648193359375, 5.81915283203125, 5.9901123046875, 6.16107177734375, 6.33203125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 10.0, 9.0, 15.0, 23.0, 27.0, 20.0, 40.0, 49.0, 41.0, 40.0, 50.0, 43.0, 51.0, 52.0, 51.0, 42.0, 52.0, 47.0, 38.0, 37.0, 52.0, 34.0, 31.0, 28.0, 22.0, 14.0, 16.0, 14.0, 14.0, 7.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.085235595703125, -2.96929931640625, -2.853363037109375, -2.7374267578125, -2.621490478515625, -2.50555419921875, -2.389617919921875, -2.273681640625, -2.157745361328125, -2.04180908203125, -1.925872802734375, -1.8099365234375, -1.694000244140625, -1.57806396484375, -1.462127685546875, -1.34619140625, -1.230255126953125, -1.11431884765625, -0.998382568359375, -0.8824462890625, -0.766510009765625, -0.65057373046875, -0.534637451171875, -0.418701171875, -0.302764892578125, -0.18682861328125, -0.070892333984375, 0.0450439453125, 0.160980224609375, 0.27691650390625, 0.392852783203125, 0.5087890625, 0.624725341796875, 0.74066162109375, 0.856597900390625, 0.9725341796875, 1.088470458984375, 1.20440673828125, 1.320343017578125, 1.436279296875, 1.552215576171875, 1.66815185546875, 1.784088134765625, 1.9000244140625, 2.015960693359375, 2.13189697265625, 2.247833251953125, 2.36376953125, 2.479705810546875, 2.59564208984375, 2.711578369140625, 2.8275146484375, 2.943450927734375, 3.05938720703125, 3.175323486328125, 3.291259765625, 3.407196044921875, 3.52313232421875, 3.639068603515625, 3.7550048828125, 3.870941162109375, 3.98687744140625, 4.102813720703125, 4.21875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 3.0, 4.0, 5.0, 8.0, 9.0, 12.0, 37.0, 33.0, 47.0, 71.0, 110.0, 177.0, 359.0, 692.0, 1522.0, 4642.0, 29448.0, 1051741.0, 3022076.0, 71943.0, 7517.0, 1971.0, 824.0, 410.0, 220.0, 133.0, 84.0, 45.0, 35.0, 20.0, 19.0, 14.0, 14.0, 8.0, 5.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6484375, -6.394287109375, -6.14013671875, -5.885986328125, -5.6318359375, -5.377685546875, -5.12353515625, -4.869384765625, -4.615234375, -4.361083984375, -4.10693359375, -3.852783203125, -3.5986328125, -3.344482421875, -3.09033203125, -2.836181640625, -2.58203125, -2.327880859375, -2.07373046875, -1.819580078125, -1.5654296875, -1.311279296875, -1.05712890625, -0.802978515625, -0.548828125, -0.294677734375, -0.04052734375, 0.213623046875, 0.4677734375, 0.721923828125, 0.97607421875, 1.230224609375, 1.484375, 1.738525390625, 1.99267578125, 2.246826171875, 2.5009765625, 2.755126953125, 3.00927734375, 3.263427734375, 3.517578125, 3.771728515625, 4.02587890625, 4.280029296875, 4.5341796875, 4.788330078125, 5.04248046875, 5.296630859375, 5.55078125, 5.804931640625, 6.05908203125, 6.313232421875, 6.5673828125, 6.821533203125, 7.07568359375, 7.329833984375, 7.583984375, 7.838134765625, 8.09228515625, 8.346435546875, 8.6005859375, 8.854736328125, 9.10888671875, 9.363037109375, 9.6171875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 13.0, 12.0, 22.0, 35.0, 42.0, 67.0, 114.0, 145.0, 210.0, 320.0, 429.0, 496.0, 518.0, 458.0, 357.0, 253.0, 180.0, 103.0, 91.0, 66.0, 33.0, 24.0, 21.0, 10.0, 9.0, 10.0, 9.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.732421875, -1.681854248046875, -1.63128662109375, -1.580718994140625, -1.5301513671875, -1.479583740234375, -1.42901611328125, -1.378448486328125, -1.327880859375, -1.277313232421875, -1.22674560546875, -1.176177978515625, -1.1256103515625, -1.075042724609375, -1.02447509765625, -0.973907470703125, -0.92333984375, -0.872772216796875, -0.82220458984375, -0.771636962890625, -0.7210693359375, -0.670501708984375, -0.61993408203125, -0.569366455078125, -0.518798828125, -0.468231201171875, -0.41766357421875, -0.367095947265625, -0.3165283203125, -0.265960693359375, -0.21539306640625, -0.164825439453125, -0.1142578125, -0.063690185546875, -0.01312255859375, 0.037445068359375, 0.0880126953125, 0.138580322265625, 0.18914794921875, 0.239715576171875, 0.290283203125, 0.340850830078125, 0.39141845703125, 0.441986083984375, 0.4925537109375, 0.543121337890625, 0.59368896484375, 0.644256591796875, 0.69482421875, 0.745391845703125, 0.79595947265625, 0.846527099609375, 0.8970947265625, 0.947662353515625, 0.99822998046875, 1.048797607421875, 1.099365234375, 1.149932861328125, 1.20050048828125, 1.251068115234375, 1.3016357421875, 1.352203369140625, 1.40277099609375, 1.453338623046875, 1.50390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 13.0, 19.0, 20.0, 47.0, 48.0, 49.0, 66.0, 81.0, 79.0, 77.0, 68.0, 70.0, 66.0, 64.0, 48.0, 46.0, 30.0, 22.0, 15.0, 27.0, 16.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763986825942993, -3.6003661155700684, -3.4367451667785645, -3.2731244564056396, -3.109503746032715, -2.94588303565979, -2.7822623252868652, -2.6186413764953613, -2.4550206661224365, -2.2913999557495117, -2.127779006958008, -1.964158296585083, -1.8005375862121582, -1.6369168758392334, -1.473296046257019, -1.3096752166748047, -1.1460545063018799, -0.9824337363243103, -0.8188129663467407, -0.6551921963691711, -0.49157142639160156, -0.327950656414032, -0.1643298864364624, -0.0007090568542480469, 0.16291165351867676, 0.32653242349624634, 0.4901531934738159, 0.6537739634513855, 0.8173947334289551, 0.9810155034065247, 1.1446362733840942, 1.3082571029663086, 1.4718775749206543, 1.635498285293579, 1.7991191148757935, 1.9627399444580078, 2.1263606548309326, 2.2899813652038574, 2.4536023139953613, 2.617223024368286, 2.780843734741211, 2.9444644451141357, 3.1080851554870605, 3.2717061042785645, 3.4353268146514893, 3.598947525024414, 3.762568473815918, 3.9261891841888428, 4.089809894561768, 4.2534308433532715, 4.417051315307617, 4.580672264099121, 4.744293212890625, 4.907913684844971, 5.071534633636475, 5.23515510559082, 5.398776054382324, 5.562397003173828, 5.726017475128174, 5.889638423919678, 6.053258895874023, 6.216879844665527, 6.380500793457031, 6.544121742248535, 6.707742214202881]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 7.0, 8.0, 20.0, 13.0, 15.0, 19.0, 16.0, 29.0, 30.0, 38.0, 51.0, 24.0, 30.0, 34.0, 40.0, 54.0, 32.0, 52.0, 45.0, 48.0, 32.0, 38.0, 28.0, 39.0, 43.0, 35.0, 31.0, 23.0, 24.0, 18.0, 14.0, 13.0, 8.0, 8.0, 12.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.936814308166504, -3.8266875743865967, -3.7165610790252686, -3.6064343452453613, -3.496307849884033, -3.386181116104126, -3.2760543823242188, -3.1659278869628906, -3.0558013916015625, -2.9456746578216553, -2.835548162460327, -2.72542142868042, -2.615294933319092, -2.5051681995391846, -2.3950414657592773, -2.284914970397949, -2.174788236618042, -2.0646615028381348, -1.9545350074768066, -1.8444082736968994, -1.7342817783355713, -1.624155044555664, -1.5140284299850464, -1.4039018154144287, -1.293775200843811, -1.1836485862731934, -1.0735219717025757, -0.9633952975273132, -0.8532686829566956, -0.7431420683860779, -0.6330153942108154, -0.5228887796401978, -0.412761926651001, -0.3026353120803833, -0.19250866770744324, -0.08238202333450317, 0.027744591236114502, 0.13787120580673218, 0.24799787998199463, 0.3581244945526123, 0.46825110912323, 0.5783777236938477, 0.6885043382644653, 0.7986310124397278, 0.9087576270103455, 1.0188841819763184, 1.1290109157562256, 1.2391375303268433, 1.349264144897461, 1.4593907594680786, 1.5695173740386963, 1.6796441078186035, 1.7897706031799316, 1.8998973369598389, 2.010024070739746, 2.120150566101074, 2.2302770614624023, 2.3404037952423096, 2.4505302906036377, 2.560657024383545, 2.670783519744873, 2.7809102535247803, 2.8910369873046875, 3.0011634826660156, 3.111290216445923]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 11.0, 8.0, 13.0, 23.0, 17.0, 39.0, 57.0, 80.0, 126.0, 234.0, 373.0, 777.0, 1470.0, 3448.0, 9295.0, 32361.0, 137456.0, 437246.0, 316440.0, 78302.0, 19580.0, 6242.0, 2465.0, 1125.0, 556.0, 318.0, 165.0, 114.0, 71.0, 44.0, 27.0, 26.0, 16.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6021575927734375, -0.578826904296875, -0.5554962158203125, -0.53216552734375, -0.5088348388671875, -0.485504150390625, -0.4621734619140625, -0.4388427734375, -0.4155120849609375, -0.392181396484375, -0.3688507080078125, -0.34552001953125, -0.3221893310546875, -0.298858642578125, -0.2755279541015625, -0.252197265625, -0.2288665771484375, -0.205535888671875, -0.1822052001953125, -0.15887451171875, -0.1355438232421875, -0.112213134765625, -0.0888824462890625, -0.0655517578125, -0.0422210693359375, -0.018890380859375, 0.0044403076171875, 0.02777099609375, 0.0511016845703125, 0.074432373046875, 0.0977630615234375, 0.12109375, 0.1444244384765625, 0.167755126953125, 0.1910858154296875, 0.21441650390625, 0.2377471923828125, 0.261077880859375, 0.2844085693359375, 0.3077392578125, 0.3310699462890625, 0.354400634765625, 0.3777313232421875, 0.40106201171875, 0.4243927001953125, 0.447723388671875, 0.4710540771484375, 0.494384765625, 0.5177154541015625, 0.541046142578125, 0.5643768310546875, 0.58770751953125, 0.6110382080078125, 0.634368896484375, 0.6576995849609375, 0.6810302734375, 0.7043609619140625, 0.727691650390625, 0.7510223388671875, 0.77435302734375, 0.7976837158203125, 0.821014404296875, 0.8443450927734375, 0.86767578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 11.0, 15.0, 10.0, 14.0, 17.0, 25.0, 28.0, 33.0, 41.0, 44.0, 42.0, 55.0, 54.0, 50.0, 44.0, 52.0, 50.0, 65.0, 46.0, 30.0, 49.0, 38.0, 38.0, 24.0, 28.0, 17.0, 16.0, 13.0, 10.0, 13.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.21453857421875, -2.1263427734375, -2.03814697265625, -1.949951171875, -1.86175537109375, -1.7735595703125, -1.68536376953125, -1.59716796875, -1.50897216796875, -1.4207763671875, -1.33258056640625, -1.244384765625, -1.15618896484375, -1.0679931640625, -0.97979736328125, -0.8916015625, -0.80340576171875, -0.7152099609375, -0.62701416015625, -0.538818359375, -0.45062255859375, -0.3624267578125, -0.27423095703125, -0.18603515625, -0.09783935546875, -0.0096435546875, 0.07855224609375, 0.166748046875, 0.25494384765625, 0.3431396484375, 0.43133544921875, 0.51953125, 0.60772705078125, 0.6959228515625, 0.78411865234375, 0.872314453125, 0.96051025390625, 1.0487060546875, 1.13690185546875, 1.22509765625, 1.31329345703125, 1.4014892578125, 1.48968505859375, 1.577880859375, 1.66607666015625, 1.7542724609375, 1.84246826171875, 1.9306640625, 2.01885986328125, 2.1070556640625, 2.19525146484375, 2.283447265625, 2.37164306640625, 2.4598388671875, 2.54803466796875, 2.63623046875, 2.72442626953125, 2.8126220703125, 2.90081787109375, 2.989013671875, 3.07720947265625, 3.1654052734375, 3.25360107421875, 3.341796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 12.0, 3.0, 16.0, 13.0, 16.0, 25.0, 29.0, 53.0, 121.0, 201.0, 408.0, 728.0, 1489.0, 3173.0, 6943.0, 14758.0, 31627.0, 65225.0, 123957.0, 196043.0, 228848.0, 174068.0, 101847.0, 52067.0, 24860.0, 11717.0, 5352.0, 2506.0, 1194.0, 573.0, 307.0, 130.0, 86.0, 50.0, 34.0, 23.0, 13.0, 9.0, 5.0, 8.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.29833984375, -0.2896537780761719, -0.28096771240234375, -0.2722816467285156, -0.2635955810546875, -0.2549095153808594, -0.24622344970703125, -0.23753738403320312, -0.228851318359375, -0.22016525268554688, -0.21147918701171875, -0.20279312133789062, -0.1941070556640625, -0.18542098999023438, -0.17673492431640625, -0.16804885864257812, -0.15936279296875, -0.15067672729492188, -0.14199066162109375, -0.13330459594726562, -0.1246185302734375, -0.11593246459960938, -0.10724639892578125, -0.09856033325195312, -0.089874267578125, -0.08118820190429688, -0.07250213623046875, -0.06381607055664062, -0.0551300048828125, -0.046443939208984375, -0.03775787353515625, -0.029071807861328125, -0.0203857421875, -0.011699676513671875, -0.00301361083984375, 0.005672454833984375, 0.0143585205078125, 0.023044586181640625, 0.03173065185546875, 0.040416717529296875, 0.049102783203125, 0.057788848876953125, 0.06647491455078125, 0.07516098022460938, 0.0838470458984375, 0.09253311157226562, 0.10121917724609375, 0.10990524291992188, 0.11859130859375, 0.12727737426757812, 0.13596343994140625, 0.14464950561523438, 0.1533355712890625, 0.16202163696289062, 0.17070770263671875, 0.17939376831054688, 0.188079833984375, 0.19676589965820312, 0.20545196533203125, 0.21413803100585938, 0.2228240966796875, 0.23151016235351562, 0.24019622802734375, 0.24888229370117188, 0.257568359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 12.0, 9.0, 12.0, 21.0, 21.0, 23.0, 30.0, 34.0, 30.0, 37.0, 44.0, 52.0, 52.0, 50.0, 51.0, 39.0, 44.0, 59.0, 34.0, 38.0, 45.0, 27.0, 26.0, 34.0, 26.0, 19.0, 19.0, 16.0, 9.0, 13.0, 10.0, 6.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.64453125, -5.49005126953125, -5.3355712890625, -5.18109130859375, -5.026611328125, -4.87213134765625, -4.7176513671875, -4.56317138671875, -4.40869140625, -4.25421142578125, -4.0997314453125, -3.94525146484375, -3.790771484375, -3.63629150390625, -3.4818115234375, -3.32733154296875, -3.1728515625, -3.01837158203125, -2.8638916015625, -2.70941162109375, -2.554931640625, -2.40045166015625, -2.2459716796875, -2.09149169921875, -1.93701171875, -1.78253173828125, -1.6280517578125, -1.47357177734375, -1.319091796875, -1.16461181640625, -1.0101318359375, -0.85565185546875, -0.701171875, -0.54669189453125, -0.3922119140625, -0.23773193359375, -0.083251953125, 0.07122802734375, 0.2257080078125, 0.38018798828125, 0.53466796875, 0.68914794921875, 0.8436279296875, 0.99810791015625, 1.152587890625, 1.30706787109375, 1.4615478515625, 1.61602783203125, 1.7705078125, 1.92498779296875, 2.0794677734375, 2.23394775390625, 2.388427734375, 2.54290771484375, 2.6973876953125, 2.85186767578125, 3.00634765625, 3.16082763671875, 3.3153076171875, 3.46978759765625, 3.624267578125, 3.77874755859375, 3.9332275390625, 4.08770751953125, 4.2421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 13.0, 7.0, 23.0, 30.0, 28.0, 41.0, 63.0, 90.0, 115.0, 185.0, 293.0, 520.0, 898.0, 1712.0, 3191.0, 6612.0, 14136.0, 35629.0, 102507.0, 291394.0, 362139.0, 144583.0, 48392.0, 18683.0, 8503.0, 4047.0, 2018.0, 1117.0, 564.0, 359.0, 227.0, 126.0, 95.0, 54.0, 39.0, 27.0, 23.0, 27.0, 13.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.051910400390625, -0.050066471099853516, -0.04822254180908203, -0.04637861251831055, -0.04453468322753906, -0.04269075393676758, -0.040846824645996094, -0.03900289535522461, -0.037158966064453125, -0.03531503677368164, -0.033471107482910156, -0.03162717819213867, -0.029783248901367188, -0.027939319610595703, -0.02609539031982422, -0.024251461029052734, -0.02240753173828125, -0.020563602447509766, -0.01871967315673828, -0.016875743865966797, -0.015031814575195312, -0.013187885284423828, -0.011343955993652344, -0.00950002670288086, -0.007656097412109375, -0.005812168121337891, -0.003968238830566406, -0.002124309539794922, -0.0002803802490234375, 0.0015635490417480469, 0.0034074783325195312, 0.005251407623291016, 0.0070953369140625, 0.008939266204833984, 0.010783195495605469, 0.012627124786376953, 0.014471054077148438, 0.016314983367919922, 0.018158912658691406, 0.02000284194946289, 0.021846771240234375, 0.02369070053100586, 0.025534629821777344, 0.027378559112548828, 0.029222488403320312, 0.031066417694091797, 0.03291034698486328, 0.034754276275634766, 0.03659820556640625, 0.038442134857177734, 0.04028606414794922, 0.0421299934387207, 0.04397392272949219, 0.04581785202026367, 0.047661781311035156, 0.04950571060180664, 0.051349639892578125, 0.05319356918334961, 0.055037498474121094, 0.05688142776489258, 0.05872535705566406, 0.06056928634643555, 0.06241321563720703, 0.06425714492797852, 0.06610107421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 1.0, 7.0, 6.0, 21.0, 11.0, 18.0, 30.0, 28.0, 36.0, 45.0, 55.0, 42.0, 69.0, 80.0, 80.0, 96.0, 61.0, 57.0, 53.0, 38.0, 37.0, 29.0, 23.0, 12.0, 12.0, 13.0, 10.0, 9.0, 4.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.7816505432128906e-05, -5.6306831538677216e-05, -5.4797157645225525e-05, -5.3287483751773834e-05, -5.1777809858322144e-05, -5.026813596487045e-05, -4.875846207141876e-05, -4.724878817796707e-05, -4.573911428451538e-05, -4.422944039106369e-05, -4.2719766497612e-05, -4.121009260416031e-05, -3.970041871070862e-05, -3.819074481725693e-05, -3.668107092380524e-05, -3.5171397030353546e-05, -3.3661723136901855e-05, -3.2152049243450165e-05, -3.0642375349998474e-05, -2.9132701456546783e-05, -2.7623027563095093e-05, -2.6113353669643402e-05, -2.460367977619171e-05, -2.309400588274002e-05, -2.158433198928833e-05, -2.007465809583664e-05, -1.856498420238495e-05, -1.7055310308933258e-05, -1.5545636415481567e-05, -1.4035962522029877e-05, -1.2526288628578186e-05, -1.1016614735126495e-05, -9.506940841674805e-06, -7.997266948223114e-06, -6.487593054771423e-06, -4.977919161319733e-06, -3.468245267868042e-06, -1.9585713744163513e-06, -4.4889748096466064e-07, 1.06077641248703e-06, 2.5704503059387207e-06, 4.080124199390411e-06, 5.589798092842102e-06, 7.099471986293793e-06, 8.609145879745483e-06, 1.0118819773197174e-05, 1.1628493666648865e-05, 1.3138167560100555e-05, 1.4647841453552246e-05, 1.6157515347003937e-05, 1.7667189240455627e-05, 1.9176863133907318e-05, 2.068653702735901e-05, 2.21962109208107e-05, 2.370588481426239e-05, 2.521555870771408e-05, 2.672523260116577e-05, 2.8234906494617462e-05, 2.9744580388069153e-05, 3.1254254281520844e-05, 3.2763928174972534e-05, 3.4273602068424225e-05, 3.5783275961875916e-05, 3.7292949855327606e-05, 3.88026237487793e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 6.0, 13.0, 19.0, 20.0, 25.0, 42.0, 50.0, 63.0, 116.0, 174.0, 282.0, 418.0, 828.0, 1419.0, 2638.0, 5436.0, 11676.0, 29282.0, 96211.0, 383767.0, 371569.0, 93115.0, 28580.0, 11399.0, 5280.0, 2702.0, 1386.0, 768.0, 457.0, 246.0, 169.0, 122.0, 70.0, 49.0, 41.0, 22.0, 23.0, 18.0, 8.0, 9.0, 1.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0716552734375, -0.06941509246826172, -0.06717491149902344, -0.06493473052978516, -0.06269454956054688, -0.060454368591308594, -0.05821418762207031, -0.05597400665283203, -0.05373382568359375, -0.05149364471435547, -0.04925346374511719, -0.047013282775878906, -0.044773101806640625, -0.042532920837402344, -0.04029273986816406, -0.03805255889892578, -0.0358123779296875, -0.03357219696044922, -0.03133201599121094, -0.029091835021972656, -0.026851654052734375, -0.024611473083496094, -0.022371292114257812, -0.02013111114501953, -0.01789093017578125, -0.01565074920654297, -0.013410568237304688, -0.011170387268066406, -0.008930206298828125, -0.006690025329589844, -0.0044498443603515625, -0.0022096633911132812, 3.0517578125e-05, 0.0022706985473632812, 0.0045108795166015625, 0.006751060485839844, 0.008991241455078125, 0.011231422424316406, 0.013471603393554688, 0.01571178436279297, 0.01795196533203125, 0.02019214630126953, 0.022432327270507812, 0.024672508239746094, 0.026912689208984375, 0.029152870178222656, 0.03139305114746094, 0.03363323211669922, 0.0358734130859375, 0.03811359405517578, 0.04035377502441406, 0.042593955993652344, 0.044834136962890625, 0.047074317932128906, 0.04931449890136719, 0.05155467987060547, 0.05379486083984375, 0.05603504180908203, 0.05827522277832031, 0.060515403747558594, 0.06275558471679688, 0.06499576568603516, 0.06723594665527344, 0.06947612762451172, 0.07171630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 13.0, 9.0, 9.0, 12.0, 22.0, 16.0, 20.0, 21.0, 25.0, 34.0, 54.0, 64.0, 60.0, 83.0, 65.0, 71.0, 74.0, 58.0, 50.0, 50.0, 31.0, 25.0, 21.0, 15.0, 23.0, 8.0, 7.0, 6.0, 6.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0189208984375, -0.01833939552307129, -0.017757892608642578, -0.017176389694213867, -0.016594886779785156, -0.016013383865356445, -0.015431880950927734, -0.014850378036499023, -0.014268875122070312, -0.013687372207641602, -0.01310586929321289, -0.01252436637878418, -0.011942863464355469, -0.011361360549926758, -0.010779857635498047, -0.010198354721069336, -0.009616851806640625, -0.009035348892211914, -0.008453845977783203, -0.007872343063354492, -0.007290840148925781, -0.00670933723449707, -0.006127834320068359, -0.0055463314056396484, -0.0049648284912109375, -0.0043833255767822266, -0.0038018226623535156, -0.0032203197479248047, -0.0026388168334960938, -0.002057313919067383, -0.0014758110046386719, -0.0008943080902099609, -0.00031280517578125, 0.00026869773864746094, 0.0008502006530761719, 0.0014317035675048828, 0.0020132064819335938, 0.0025947093963623047, 0.0031762123107910156, 0.0037577152252197266, 0.0043392181396484375, 0.0049207210540771484, 0.005502223968505859, 0.00608372688293457, 0.006665229797363281, 0.007246732711791992, 0.007828235626220703, 0.008409738540649414, 0.008991241455078125, 0.009572744369506836, 0.010154247283935547, 0.010735750198364258, 0.011317253112792969, 0.01189875602722168, 0.01248025894165039, 0.013061761856079102, 0.013643264770507812, 0.014224767684936523, 0.014806270599365234, 0.015387773513793945, 0.015969276428222656, 0.016550779342651367, 0.017132282257080078, 0.01771378517150879, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 17.0, 25.0, 39.0, 71.0, 123.0, 135.0, 154.0, 123.0, 117.0, 75.0, 39.0, 37.0, 21.0, 13.0, 7.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.134188652038574, -5.962375640869141, -5.790562629699707, -5.618749618530273, -5.446937084197998, -5.2751240730285645, -5.103311061859131, -4.931498050689697, -4.759685516357422, -4.587872505187988, -4.416059494018555, -4.244246482849121, -4.072433948516846, -3.900620937347412, -3.7288079261779785, -3.556994915008545, -3.3851819038391113, -3.2133688926696777, -3.0415561199188232, -2.8697431087493896, -2.697930335998535, -2.5261173248291016, -2.354304313659668, -2.1824913024902344, -2.01067852973938, -1.8388656377792358, -1.6670527458190918, -1.4952397346496582, -1.3234268426895142, -1.1516139507293701, -0.9798009395599365, -0.8079880475997925, -0.6361756324768066, -0.4643627107143402, -0.2925497889518738, -0.12073683738708496, 0.05107605457305908, 0.22288894653320312, 0.3947019577026367, 0.5665148496627808, 0.7383277416229248, 0.9101406335830688, 1.081953525543213, 1.2537665367126465, 1.4255794286727905, 1.5973923206329346, 1.7692053318023682, 1.9410182237625122, 2.1128311157226562, 2.28464412689209, 2.4564568996429443, 2.628269910812378, 2.8000826835632324, 2.971895694732666, 3.1437087059020996, 3.315521717071533, 3.4873344898223877, 3.6591475009918213, 3.830960273742676, 4.002773284912109, 4.174586296081543, 4.346399307250977, 4.51821231842041, 4.6900248527526855, 4.861837863922119]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 10.0, 4.0, 20.0, 18.0, 16.0, 7.0, 31.0, 24.0, 32.0, 45.0, 39.0, 28.0, 32.0, 40.0, 43.0, 47.0, 38.0, 51.0, 47.0, 40.0, 35.0, 40.0, 27.0, 49.0, 38.0, 31.0, 32.0, 20.0, 20.0, 13.0, 14.0, 14.0, 9.0, 12.0, 9.0, 2.0, 5.0, 2.0, 1.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2405951023101807, -2.1690683364868164, -2.097541570663452, -2.026014804840088, -1.9544881582260132, -1.882961392402649, -1.8114347457885742, -1.73990797996521, -1.6683812141418457, -1.5968544483184814, -1.5253276824951172, -1.4538010358810425, -1.3822742700576782, -1.310747504234314, -1.2392208576202393, -1.167694091796875, -1.0961673259735107, -1.0246405601501465, -0.953113853931427, -0.8815871477127075, -0.8100603818893433, -0.738533616065979, -0.6670069098472595, -0.59548020362854, -0.5239534378051758, -0.4524267017841339, -0.38089996576309204, -0.30937322974205017, -0.2378464937210083, -0.16631975769996643, -0.09479302167892456, -0.023266315460205078, 0.04826021194458008, 0.11978694796562195, 0.19131368398666382, 0.2628404200077057, 0.33436715602874756, 0.40589389204978943, 0.4774206280708313, 0.5489473342895508, 0.620474100112915, 0.6920008659362793, 0.7635275721549988, 0.8350542783737183, 0.9065810441970825, 0.9781078100204468, 1.0496344566345215, 1.1211612224578857, 1.19268798828125, 1.2642147541046143, 1.3357415199279785, 1.4072681665420532, 1.4787949323654175, 1.5503216981887817, 1.6218483448028564, 1.6933751106262207, 1.764901876449585, 1.8364286422729492, 1.9079554080963135, 1.9794820547103882, 2.051008701324463, 2.122535467147827, 2.1940622329711914, 2.2655889987945557, 2.33711576461792]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 11.0, 19.0, 30.0, 55.0, 86.0, 142.0, 293.0, 655.0, 1467.0, 4806.0, 15316.0, 52970.0, 261250.0, 589301.0, 86080.0, 24662.0, 7382.0, 2286.0, 893.0, 398.0, 198.0, 79.0, 57.0, 37.0, 22.0, 10.0, 13.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5625, -3.444488525390625, -3.32647705078125, -3.208465576171875, -3.0904541015625, -2.972442626953125, -2.85443115234375, -2.736419677734375, -2.618408203125, -2.500396728515625, -2.38238525390625, -2.264373779296875, -2.1463623046875, -2.028350830078125, -1.91033935546875, -1.792327880859375, -1.67431640625, -1.556304931640625, -1.43829345703125, -1.320281982421875, -1.2022705078125, -1.084259033203125, -0.96624755859375, -0.848236083984375, -0.730224609375, -0.612213134765625, -0.49420166015625, -0.376190185546875, -0.2581787109375, -0.140167236328125, -0.02215576171875, 0.095855712890625, 0.2138671875, 0.331878662109375, 0.44989013671875, 0.567901611328125, 0.6859130859375, 0.803924560546875, 0.92193603515625, 1.039947509765625, 1.157958984375, 1.275970458984375, 1.39398193359375, 1.511993408203125, 1.6300048828125, 1.748016357421875, 1.86602783203125, 1.984039306640625, 2.10205078125, 2.220062255859375, 2.33807373046875, 2.456085205078125, 2.5740966796875, 2.692108154296875, 2.81011962890625, 2.928131103515625, 3.046142578125, 3.164154052734375, 3.28216552734375, 3.400177001953125, 3.5181884765625, 3.636199951171875, 3.75421142578125, 3.872222900390625, 3.990234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 6.0, 4.0, 15.0, 15.0, 12.0, 14.0, 27.0, 29.0, 23.0, 32.0, 36.0, 45.0, 47.0, 44.0, 43.0, 50.0, 38.0, 61.0, 37.0, 46.0, 50.0, 42.0, 45.0, 33.0, 31.0, 26.0, 26.0, 23.0, 23.0, 12.0, 14.0, 8.0, 12.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.18731689453125, -4.0386962890625, -3.89007568359375, -3.741455078125, -3.59283447265625, -3.4442138671875, -3.29559326171875, -3.14697265625, -2.99835205078125, -2.8497314453125, -2.70111083984375, -2.552490234375, -2.40386962890625, -2.2552490234375, -2.10662841796875, -1.9580078125, -1.80938720703125, -1.6607666015625, -1.51214599609375, -1.363525390625, -1.21490478515625, -1.0662841796875, -0.91766357421875, -0.76904296875, -0.62042236328125, -0.4718017578125, -0.32318115234375, -0.174560546875, -0.02593994140625, 0.1226806640625, 0.27130126953125, 0.419921875, 0.56854248046875, 0.7171630859375, 0.86578369140625, 1.014404296875, 1.16302490234375, 1.3116455078125, 1.46026611328125, 1.60888671875, 1.75750732421875, 1.9061279296875, 2.05474853515625, 2.203369140625, 2.35198974609375, 2.5006103515625, 2.64923095703125, 2.7978515625, 2.94647216796875, 3.0950927734375, 3.24371337890625, 3.392333984375, 3.54095458984375, 3.6895751953125, 3.83819580078125, 3.98681640625, 4.13543701171875, 4.2840576171875, 4.43267822265625, 4.581298828125, 4.72991943359375, 4.8785400390625, 5.02716064453125, 5.17578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 8.0, 5.0, 7.0, 9.0, 10.0, 18.0, 17.0, 25.0, 30.0, 43.0, 41.0, 52.0, 104.0, 125.0, 207.0, 422.0, 1022.0, 7765.0, 185998.0, 827118.0, 22251.0, 1854.0, 560.0, 280.0, 151.0, 111.0, 65.0, 58.0, 42.0, 24.0, 16.0, 19.0, 20.0, 9.0, 17.0, 9.0, 8.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.8359375, -8.5614013671875, -8.286865234375, -8.0123291015625, -7.73779296875, -7.4632568359375, -7.188720703125, -6.9141845703125, -6.6396484375, -6.3651123046875, -6.090576171875, -5.8160400390625, -5.54150390625, -5.2669677734375, -4.992431640625, -4.7178955078125, -4.443359375, -4.1688232421875, -3.894287109375, -3.6197509765625, -3.34521484375, -3.0706787109375, -2.796142578125, -2.5216064453125, -2.2470703125, -1.9725341796875, -1.697998046875, -1.4234619140625, -1.14892578125, -0.8743896484375, -0.599853515625, -0.3253173828125, -0.05078125, 0.2237548828125, 0.498291015625, 0.7728271484375, 1.04736328125, 1.3218994140625, 1.596435546875, 1.8709716796875, 2.1455078125, 2.4200439453125, 2.694580078125, 2.9691162109375, 3.24365234375, 3.5181884765625, 3.792724609375, 4.0672607421875, 4.341796875, 4.6163330078125, 4.890869140625, 5.1654052734375, 5.43994140625, 5.7144775390625, 5.989013671875, 6.2635498046875, 6.5380859375, 6.8126220703125, 7.087158203125, 7.3616943359375, 7.63623046875, 7.9107666015625, 8.185302734375, 8.4598388671875, 8.734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 18.0, 10.0, 13.0, 22.0, 20.0, 28.0, 39.0, 36.0, 36.0, 26.0, 47.0, 51.0, 48.0, 54.0, 55.0, 54.0, 52.0, 58.0, 49.0, 39.0, 32.0, 31.0, 20.0, 37.0, 11.0, 15.0, 10.0, 12.0, 20.0, 6.0, 14.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.43597412109375, -5.2508544921875, -5.06573486328125, -4.880615234375, -4.69549560546875, -4.5103759765625, -4.32525634765625, -4.14013671875, -3.95501708984375, -3.7698974609375, -3.58477783203125, -3.399658203125, -3.21453857421875, -3.0294189453125, -2.84429931640625, -2.6591796875, -2.47406005859375, -2.2889404296875, -2.10382080078125, -1.918701171875, -1.73358154296875, -1.5484619140625, -1.36334228515625, -1.17822265625, -0.99310302734375, -0.8079833984375, -0.62286376953125, -0.437744140625, -0.25262451171875, -0.0675048828125, 0.11761474609375, 0.302734375, 0.48785400390625, 0.6729736328125, 0.85809326171875, 1.043212890625, 1.22833251953125, 1.4134521484375, 1.59857177734375, 1.78369140625, 1.96881103515625, 2.1539306640625, 2.33905029296875, 2.524169921875, 2.70928955078125, 2.8944091796875, 3.07952880859375, 3.2646484375, 3.44976806640625, 3.6348876953125, 3.82000732421875, 4.005126953125, 4.19024658203125, 4.3753662109375, 4.56048583984375, 4.74560546875, 4.93072509765625, 5.1158447265625, 5.30096435546875, 5.486083984375, 5.67120361328125, 5.8563232421875, 6.04144287109375, 6.2265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 11.0, 27.0, 57.0, 183.0, 936.0, 10724.0, 1012677.0, 22071.0, 1412.0, 296.0, 75.0, 41.0, 18.0, 4.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.74346923828125, -7.5572509765625, -7.37103271484375, -7.184814453125, -6.99859619140625, -6.8123779296875, -6.62615966796875, -6.43994140625, -6.25372314453125, -6.0675048828125, -5.88128662109375, -5.695068359375, -5.50885009765625, -5.3226318359375, -5.13641357421875, -4.9501953125, -4.76397705078125, -4.5777587890625, -4.39154052734375, -4.205322265625, -4.01910400390625, -3.8328857421875, -3.64666748046875, -3.46044921875, -3.27423095703125, -3.0880126953125, -2.90179443359375, -2.715576171875, -2.52935791015625, -2.3431396484375, -2.15692138671875, -1.970703125, -1.78448486328125, -1.5982666015625, -1.41204833984375, -1.225830078125, -1.03961181640625, -0.8533935546875, -0.66717529296875, -0.48095703125, -0.29473876953125, -0.1085205078125, 0.07769775390625, 0.263916015625, 0.45013427734375, 0.6363525390625, 0.82257080078125, 1.0087890625, 1.19500732421875, 1.3812255859375, 1.56744384765625, 1.753662109375, 1.93988037109375, 2.1260986328125, 2.31231689453125, 2.49853515625, 2.68475341796875, 2.8709716796875, 3.05718994140625, 3.243408203125, 3.42962646484375, 3.6158447265625, 3.80206298828125, 3.98828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 19.0, 19.0, 22.0, 32.0, 42.0, 46.0, 78.0, 114.0, 183.0, 108.0, 61.0, 47.0, 43.0, 30.0, 20.0, 24.0, 19.0, 9.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.00019502639770507812, -0.00018935278058052063, -0.00018367916345596313, -0.00017800554633140564, -0.00017233192920684814, -0.00016665831208229065, -0.00016098469495773315, -0.00015531107783317566, -0.00014963746070861816, -0.00014396384358406067, -0.00013829022645950317, -0.00013261660933494568, -0.00012694299221038818, -0.00012126937508583069, -0.0001155957579612732, -0.0001099221408367157, -0.0001042485237121582, -9.857490658760071e-05, -9.290128946304321e-05, -8.722767233848572e-05, -8.155405521392822e-05, -7.588043808937073e-05, -7.020682096481323e-05, -6.453320384025574e-05, -5.885958671569824e-05, -5.318596959114075e-05, -4.751235246658325e-05, -4.183873534202576e-05, -3.616511821746826e-05, -3.0491501092910767e-05, -2.481788396835327e-05, -1.9144266843795776e-05, -1.3470649719238281e-05, -7.797032594680786e-06, -2.123415470123291e-06, 3.550201654434204e-06, 9.2238187789917e-06, 1.4897435903549194e-05, 2.057105302810669e-05, 2.6244670152664185e-05, 3.191828727722168e-05, 3.7591904401779175e-05, 4.326552152633667e-05, 4.8939138650894165e-05, 5.461275577545166e-05, 6.0286372900009155e-05, 6.595999002456665e-05, 7.163360714912415e-05, 7.730722427368164e-05, 8.298084139823914e-05, 8.865445852279663e-05, 9.432807564735413e-05, 0.00010000169277191162, 0.00010567530989646912, 0.00011134892702102661, 0.0001170225441455841, 0.0001226961612701416, 0.0001283697783946991, 0.0001340433955192566, 0.0001397170126438141, 0.00014539062976837158, 0.00015106424689292908, 0.00015673786401748657, 0.00016241148114204407, 0.00016808509826660156]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 11.0, 19.0, 29.0, 65.0, 122.0, 361.0, 1006.0, 5204.0, 659553.0, 376016.0, 4673.0, 951.0, 306.0, 129.0, 54.0, 27.0, 13.0, 4.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.45831298828125, -4.2642822265625, -4.07025146484375, -3.876220703125, -3.68218994140625, -3.4881591796875, -3.29412841796875, -3.10009765625, -2.90606689453125, -2.7120361328125, -2.51800537109375, -2.323974609375, -2.12994384765625, -1.9359130859375, -1.74188232421875, -1.5478515625, -1.35382080078125, -1.1597900390625, -0.96575927734375, -0.771728515625, -0.57769775390625, -0.3836669921875, -0.18963623046875, 0.00439453125, 0.19842529296875, 0.3924560546875, 0.58648681640625, 0.780517578125, 0.97454833984375, 1.1685791015625, 1.36260986328125, 1.556640625, 1.75067138671875, 1.9447021484375, 2.13873291015625, 2.332763671875, 2.52679443359375, 2.7208251953125, 2.91485595703125, 3.10888671875, 3.30291748046875, 3.4969482421875, 3.69097900390625, 3.885009765625, 4.07904052734375, 4.2730712890625, 4.46710205078125, 4.6611328125, 4.85516357421875, 5.0491943359375, 5.24322509765625, 5.437255859375, 5.63128662109375, 5.8253173828125, 6.01934814453125, 6.21337890625, 6.40740966796875, 6.6014404296875, 6.79547119140625, 6.989501953125, 7.18353271484375, 7.3775634765625, 7.57159423828125, 7.765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 15.0, 17.0, 24.0, 45.0, 85.0, 162.0, 321.0, 147.0, 66.0, 45.0, 22.0, 15.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9306640625, -1.890777587890625, -1.85089111328125, -1.811004638671875, -1.7711181640625, -1.731231689453125, -1.69134521484375, -1.651458740234375, -1.611572265625, -1.571685791015625, -1.53179931640625, -1.491912841796875, -1.4520263671875, -1.412139892578125, -1.37225341796875, -1.332366943359375, -1.29248046875, -1.252593994140625, -1.21270751953125, -1.172821044921875, -1.1329345703125, -1.093048095703125, -1.05316162109375, -1.013275146484375, -0.973388671875, -0.933502197265625, -0.89361572265625, -0.853729248046875, -0.8138427734375, -0.773956298828125, -0.73406982421875, -0.694183349609375, -0.654296875, -0.614410400390625, -0.57452392578125, -0.534637451171875, -0.4947509765625, -0.454864501953125, -0.41497802734375, -0.375091552734375, -0.335205078125, -0.295318603515625, -0.25543212890625, -0.215545654296875, -0.1756591796875, -0.135772705078125, -0.09588623046875, -0.055999755859375, -0.01611328125, 0.023773193359375, 0.06365966796875, 0.103546142578125, 0.1434326171875, 0.183319091796875, 0.22320556640625, 0.263092041015625, 0.302978515625, 0.342864990234375, 0.38275146484375, 0.422637939453125, 0.4625244140625, 0.502410888671875, 0.54229736328125, 0.582183837890625, 0.6220703125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 24.0, 49.0, 64.0, 102.0, 135.0, 131.0, 135.0, 110.0, 81.0, 57.0, 40.0, 22.0, 20.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.997753381729126, -3.6640477180480957, -3.3303420543670654, -2.996636390686035, -2.662930727005005, -2.3292250633239746, -1.9955193996429443, -1.661813735961914, -1.3281080722808838, -0.9944024085998535, -0.6606967449188232, -0.32699108123779297, 0.006714582443237305, 0.3404202461242676, 0.6741259098052979, 1.0078315734863281, 1.3415372371673584, 1.6752429008483887, 2.008948564529419, 2.342654228210449, 2.6763598918914795, 3.0100655555725098, 3.34377121925354, 3.6774768829345703, 4.01118278503418, 4.344888687133789, 4.67859411239624, 5.012299537658691, 5.346005439758301, 5.67971134185791, 6.013416767120361, 6.3471221923828125, 6.680828094482422, 7.014533996582031, 7.348239421844482, 7.681944847106934, 8.015650749206543, 8.349356651306152, 8.683061599731445, 9.016767501831055, 9.350473403930664, 9.684179306030273, 10.017885208129883, 10.351590156555176, 10.685296058654785, 11.019001960754395, 11.352706909179688, 11.686412811279297, 12.020118713378906, 12.353824615478516, 12.687530517578125, 13.021235466003418, 13.354941368103027, 13.688647270202637, 14.02235221862793, 14.356058120727539, 14.689764022827148, 15.023469924926758, 15.357175827026367, 15.69088077545166, 16.024585723876953, 16.358291625976562, 16.691997528076172, 17.02570343017578, 17.35940933227539]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 3.0, 6.0, 11.0, 6.0, 10.0, 10.0, 13.0, 14.0, 21.0, 20.0, 27.0, 33.0, 38.0, 33.0, 25.0, 28.0, 53.0, 43.0, 31.0, 57.0, 37.0, 40.0, 50.0, 35.0, 30.0, 38.0, 44.0, 31.0, 25.0, 27.0, 28.0, 22.0, 23.0, 19.0, 13.0, 11.0, 10.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.875509262084961, -8.623944282531738, -8.3723783493042, -8.120813369750977, -7.8692474365234375, -7.617681980133057, -7.366116523742676, -7.114551544189453, -6.862985610961914, -6.611420154571533, -6.359854698181152, -6.1082892417907715, -5.856723785400391, -5.60515832901001, -5.353592872619629, -5.102027893066406, -4.850462436676025, -4.5988969802856445, -4.347331523895264, -4.095766067504883, -3.844200611114502, -3.592635154724121, -3.3410699367523193, -3.0895044803619385, -2.8379390239715576, -2.5863735675811768, -2.334808111190796, -2.083242893218994, -1.8316773176193237, -1.5801118612289429, -1.3285465240478516, -1.0769810676574707, -0.8254156112670898, -0.573850154876709, -0.3222847580909729, -0.07071936130523682, 0.18084609508514404, 0.4324115514755249, 0.6839768886566162, 0.9355423450469971, 1.187107801437378, 1.4386732578277588, 1.6902387142181396, 1.941804051399231, 2.1933693885803223, 2.444934844970703, 2.696500301361084, 2.948065757751465, 3.1996312141418457, 3.4511966705322266, 3.7027621269226074, 3.9543275833129883, 4.205893039703369, 4.45745849609375, 4.709023475646973, 4.960589408874512, 5.212154388427734, 5.463719844818115, 5.715285301208496, 5.966850757598877, 6.218416213989258, 6.469981670379639, 6.7215471267700195, 6.973112106323242, 7.224678039550781]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 9.0, 6.0, 12.0, 18.0, 16.0, 28.0, 21.0, 30.0, 35.0, 60.0, 67.0, 135.0, 218.0, 467.0, 1319.0, 7177.0, 92384.0, 2412709.0, 1621007.0, 51961.0, 4671.0, 990.0, 345.0, 157.0, 96.0, 67.0, 55.0, 40.0, 29.0, 27.0, 19.0, 21.0, 12.0, 10.0, 7.0, 10.0, 4.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87109375, -7.60797119140625, -7.3448486328125, -7.08172607421875, -6.818603515625, -6.55548095703125, -6.2923583984375, -6.02923583984375, -5.76611328125, -5.50299072265625, -5.2398681640625, -4.97674560546875, -4.713623046875, -4.45050048828125, -4.1873779296875, -3.92425537109375, -3.6611328125, -3.39801025390625, -3.1348876953125, -2.87176513671875, -2.608642578125, -2.34552001953125, -2.0823974609375, -1.81927490234375, -1.55615234375, -1.29302978515625, -1.0299072265625, -0.76678466796875, -0.503662109375, -0.24053955078125, 0.0225830078125, 0.28570556640625, 0.548828125, 0.81195068359375, 1.0750732421875, 1.33819580078125, 1.601318359375, 1.86444091796875, 2.1275634765625, 2.39068603515625, 2.65380859375, 2.91693115234375, 3.1800537109375, 3.44317626953125, 3.706298828125, 3.96942138671875, 4.2325439453125, 4.49566650390625, 4.7587890625, 5.02191162109375, 5.2850341796875, 5.54815673828125, 5.811279296875, 6.07440185546875, 6.3375244140625, 6.60064697265625, 6.86376953125, 7.12689208984375, 7.3900146484375, 7.65313720703125, 7.916259765625, 8.17938232421875, 8.4425048828125, 8.70562744140625, 8.96875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 8.0, 4.0, 3.0, 4.0, 11.0, 10.0, 5.0, 20.0, 20.0, 16.0, 29.0, 26.0, 21.0, 33.0, 44.0, 42.0, 47.0, 48.0, 51.0, 40.0, 51.0, 48.0, 47.0, 38.0, 45.0, 38.0, 37.0, 31.0, 33.0, 22.0, 22.0, 23.0, 19.0, 21.0, 7.0, 12.0, 4.0, 7.0, 8.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.529296875, -2.434967041015625, -2.34063720703125, -2.246307373046875, -2.1519775390625, -2.057647705078125, -1.96331787109375, -1.868988037109375, -1.774658203125, -1.680328369140625, -1.58599853515625, -1.491668701171875, -1.3973388671875, -1.303009033203125, -1.20867919921875, -1.114349365234375, -1.02001953125, -0.925689697265625, -0.83135986328125, -0.737030029296875, -0.6427001953125, -0.548370361328125, -0.45404052734375, -0.359710693359375, -0.265380859375, -0.171051025390625, -0.07672119140625, 0.017608642578125, 0.1119384765625, 0.206268310546875, 0.30059814453125, 0.394927978515625, 0.4892578125, 0.583587646484375, 0.67791748046875, 0.772247314453125, 0.8665771484375, 0.960906982421875, 1.05523681640625, 1.149566650390625, 1.243896484375, 1.338226318359375, 1.43255615234375, 1.526885986328125, 1.6212158203125, 1.715545654296875, 1.80987548828125, 1.904205322265625, 1.99853515625, 2.092864990234375, 2.18719482421875, 2.281524658203125, 2.3758544921875, 2.470184326171875, 2.56451416015625, 2.658843994140625, 2.753173828125, 2.847503662109375, 2.94183349609375, 3.036163330078125, 3.1304931640625, 3.224822998046875, 3.31915283203125, 3.413482666015625, 3.5078125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 7.0, 11.0, 12.0, 23.0, 40.0, 58.0, 107.0, 176.0, 257.0, 480.0, 977.0, 2406.0, 11410.0, 190827.0, 3719948.0, 249572.0, 12932.0, 2740.0, 1075.0, 541.0, 237.0, 156.0, 95.0, 51.0, 40.0, 31.0, 18.0, 7.0, 5.0, 6.0, 0.0, 4.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-7.859375, -7.59326171875, -7.3271484375, -7.06103515625, -6.794921875, -6.52880859375, -6.2626953125, -5.99658203125, -5.73046875, -5.46435546875, -5.1982421875, -4.93212890625, -4.666015625, -4.39990234375, -4.1337890625, -3.86767578125, -3.6015625, -3.33544921875, -3.0693359375, -2.80322265625, -2.537109375, -2.27099609375, -2.0048828125, -1.73876953125, -1.47265625, -1.20654296875, -0.9404296875, -0.67431640625, -0.408203125, -0.14208984375, 0.1240234375, 0.39013671875, 0.65625, 0.92236328125, 1.1884765625, 1.45458984375, 1.720703125, 1.98681640625, 2.2529296875, 2.51904296875, 2.78515625, 3.05126953125, 3.3173828125, 3.58349609375, 3.849609375, 4.11572265625, 4.3818359375, 4.64794921875, 4.9140625, 5.18017578125, 5.4462890625, 5.71240234375, 5.978515625, 6.24462890625, 6.5107421875, 6.77685546875, 7.04296875, 7.30908203125, 7.5751953125, 7.84130859375, 8.107421875, 8.37353515625, 8.6396484375, 8.90576171875, 9.171875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 15.0, 20.0, 39.0, 30.0, 53.0, 74.0, 88.0, 128.0, 214.0, 255.0, 330.0, 452.0, 458.0, 461.0, 405.0, 260.0, 188.0, 157.0, 106.0, 53.0, 58.0, 54.0, 43.0, 21.0, 19.0, 13.0, 9.0, 8.0, 6.0, 7.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.5458984375, -1.502685546875, -1.45947265625, -1.416259765625, -1.373046875, -1.329833984375, -1.28662109375, -1.243408203125, -1.2001953125, -1.156982421875, -1.11376953125, -1.070556640625, -1.02734375, -0.984130859375, -0.94091796875, -0.897705078125, -0.8544921875, -0.811279296875, -0.76806640625, -0.724853515625, -0.681640625, -0.638427734375, -0.59521484375, -0.552001953125, -0.5087890625, -0.465576171875, -0.42236328125, -0.379150390625, -0.3359375, -0.292724609375, -0.24951171875, -0.206298828125, -0.1630859375, -0.119873046875, -0.07666015625, -0.033447265625, 0.009765625, 0.052978515625, 0.09619140625, 0.139404296875, 0.1826171875, 0.225830078125, 0.26904296875, 0.312255859375, 0.35546875, 0.398681640625, 0.44189453125, 0.485107421875, 0.5283203125, 0.571533203125, 0.61474609375, 0.657958984375, 0.701171875, 0.744384765625, 0.78759765625, 0.830810546875, 0.8740234375, 0.917236328125, 0.96044921875, 1.003662109375, 1.046875, 1.090087890625, 1.13330078125, 1.176513671875, 1.2197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 15.0, 7.0, 15.0, 26.0, 50.0, 54.0, 55.0, 75.0, 78.0, 94.0, 97.0, 97.0, 66.0, 77.0, 63.0, 42.0, 32.0, 18.0, 11.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7051496505737305, -4.526846885681152, -4.348544597625732, -4.170241832733154, -3.9919395446777344, -3.8136370182037354, -3.6353344917297363, -3.457031726837158, -3.2787294387817383, -3.1004269123077393, -2.9221243858337402, -2.743821859359741, -2.565519332885742, -2.387216806411743, -2.208914279937744, -2.030611515045166, -1.852308988571167, -1.674006462097168, -1.495703935623169, -1.31740140914917, -1.139098882675171, -0.9607962965965271, -0.7824937105178833, -0.6041911840438843, -0.42588865756988525, -0.24758611619472504, -0.06928357481956482, 0.10901898145675659, 0.2873215079307556, 0.46562403440475464, 0.6439266204833984, 0.8222291469573975, 1.0005316734313965, 1.1788341999053955, 1.3571367263793945, 1.5354392528533936, 1.7137417793273926, 1.8920443058013916, 2.0703468322753906, 2.2486495971679688, 2.4269518852233887, 2.6052544116973877, 2.7835569381713867, 2.9618594646453857, 3.1401619911193848, 3.318464517593384, 3.496767044067383, 3.675069808959961, 3.85337233543396, 4.031674861907959, 4.209977626800537, 4.388279914855957, 4.566582679748535, 4.744884967803955, 4.923187732696533, 5.101490020751953, 5.279792785644531, 5.458095550537109, 5.636397838592529, 5.814700603485107, 5.993002891540527, 6.1713056564331055, 6.349607944488525, 6.5279107093811035, 6.706212997436523]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 11.0, 16.0, 9.0, 25.0, 19.0, 26.0, 24.0, 25.0, 26.0, 32.0, 33.0, 27.0, 37.0, 37.0, 40.0, 39.0, 41.0, 40.0, 44.0, 37.0, 34.0, 43.0, 45.0, 36.0, 27.0, 21.0, 30.0, 23.0, 24.0, 12.0, 21.0, 12.0, 12.0, 11.0, 8.0, 2.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0967464447021484, -2.997384548187256, -2.8980228900909424, -2.79866099357605, -2.6992990970611572, -2.5999374389648438, -2.500575542449951, -2.4012136459350586, -2.301851749420166, -2.2024898529052734, -2.10312819480896, -2.0037662982940674, -1.9044044017791748, -1.8050426244735718, -1.7056808471679688, -1.6063189506530762, -1.5069572925567627, -1.4075955152511597, -1.308233618736267, -1.208871841430664, -1.1095099449157715, -1.0101481676101685, -0.9107863903045654, -0.8114245533943176, -0.7120627164840698, -0.612700879573822, -0.5133390426635742, -0.4139772653579712, -0.3146154284477234, -0.21525359153747559, -0.11589181423187256, -0.016529977321624756, 0.08283185958862305, 0.18219368159770966, 0.28155550360679626, 0.3809173107147217, 0.4802791476249695, 0.5796409845352173, 0.6790027618408203, 0.7783645987510681, 0.8777264356613159, 0.9770882725715637, 1.0764501094818115, 1.1758118867874146, 1.2751736640930176, 1.3745355606079102, 1.4738973379135132, 1.5732591152191162, 1.6726210117340088, 1.7719827890396118, 1.8713446855545044, 1.9707064628601074, 2.070068359375, 2.1694302558898926, 2.268791913986206, 2.3681538105010986, 2.467515468597412, 2.5668773651123047, 2.666239023208618, 2.7656009197235107, 2.8649628162384033, 2.964324474334717, 3.0636863708496094, 3.163048267364502, 3.2624101638793945]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 4.0, 14.0, 15.0, 35.0, 46.0, 87.0, 158.0, 289.0, 616.0, 1423.0, 4742.0, 36626.0, 618216.0, 361482.0, 19343.0, 3281.0, 1116.0, 499.0, 252.0, 123.0, 77.0, 43.0, 20.0, 25.0, 8.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6953125, -1.6385650634765625, -1.581817626953125, -1.5250701904296875, -1.46832275390625, -1.4115753173828125, -1.354827880859375, -1.2980804443359375, -1.2413330078125, -1.1845855712890625, -1.127838134765625, -1.0710906982421875, -1.01434326171875, -0.9575958251953125, -0.900848388671875, -0.8441009521484375, -0.787353515625, -0.7306060791015625, -0.673858642578125, -0.6171112060546875, -0.56036376953125, -0.5036163330078125, -0.446868896484375, -0.3901214599609375, -0.3333740234375, -0.2766265869140625, -0.219879150390625, -0.1631317138671875, -0.10638427734375, -0.0496368408203125, 0.007110595703125, 0.0638580322265625, 0.12060546875, 0.1773529052734375, 0.234100341796875, 0.2908477783203125, 0.34759521484375, 0.4043426513671875, 0.461090087890625, 0.5178375244140625, 0.5745849609375, 0.6313323974609375, 0.688079833984375, 0.7448272705078125, 0.80157470703125, 0.8583221435546875, 0.915069580078125, 0.9718170166015625, 1.028564453125, 1.0853118896484375, 1.142059326171875, 1.1988067626953125, 1.25555419921875, 1.3123016357421875, 1.369049072265625, 1.4257965087890625, 1.4825439453125, 1.5392913818359375, 1.596038818359375, 1.6527862548828125, 1.70953369140625, 1.7662811279296875, 1.823028564453125, 1.8797760009765625, 1.9365234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 15.0, 21.0, 19.0, 41.0, 36.0, 51.0, 63.0, 73.0, 65.0, 78.0, 71.0, 81.0, 63.0, 61.0, 53.0, 50.0, 40.0, 36.0, 20.0, 20.0, 9.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.84765625, -5.71630859375, -5.5849609375, -5.45361328125, -5.322265625, -5.19091796875, -5.0595703125, -4.92822265625, -4.796875, -4.66552734375, -4.5341796875, -4.40283203125, -4.271484375, -4.14013671875, -4.0087890625, -3.87744140625, -3.74609375, -3.61474609375, -3.4833984375, -3.35205078125, -3.220703125, -3.08935546875, -2.9580078125, -2.82666015625, -2.6953125, -2.56396484375, -2.4326171875, -2.30126953125, -2.169921875, -2.03857421875, -1.9072265625, -1.77587890625, -1.64453125, -1.51318359375, -1.3818359375, -1.25048828125, -1.119140625, -0.98779296875, -0.8564453125, -0.72509765625, -0.59375, -0.46240234375, -0.3310546875, -0.19970703125, -0.068359375, 0.06298828125, 0.1943359375, 0.32568359375, 0.45703125, 0.58837890625, 0.7197265625, 0.85107421875, 0.982421875, 1.11376953125, 1.2451171875, 1.37646484375, 1.5078125, 1.63916015625, 1.7705078125, 1.90185546875, 2.033203125, 2.16455078125, 2.2958984375, 2.42724609375, 2.55859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 39.0, 49.0, 106.0, 200.0, 362.0, 709.0, 1392.0, 2918.0, 5901.0, 12410.0, 26480.0, 55651.0, 112522.0, 197452.0, 244623.0, 186249.0, 103633.0, 51277.0, 24084.0, 11512.0, 5481.0, 2728.0, 1291.0, 680.0, 346.0, 162.0, 98.0, 58.0, 29.0, 15.0, 16.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.353759765625, -0.3434867858886719, -0.33321380615234375, -0.3229408264160156, -0.3126678466796875, -0.3023948669433594, -0.29212188720703125, -0.2818489074707031, -0.271575927734375, -0.2613029479980469, -0.25102996826171875, -0.24075698852539062, -0.2304840087890625, -0.22021102905273438, -0.20993804931640625, -0.19966506958007812, -0.18939208984375, -0.17911911010742188, -0.16884613037109375, -0.15857315063476562, -0.1483001708984375, -0.13802719116210938, -0.12775421142578125, -0.11748123168945312, -0.107208251953125, -0.09693527221679688, -0.08666229248046875, -0.07638931274414062, -0.0661163330078125, -0.055843353271484375, -0.04557037353515625, -0.035297393798828125, -0.0250244140625, -0.014751434326171875, -0.00447845458984375, 0.005794525146484375, 0.0160675048828125, 0.026340484619140625, 0.03661346435546875, 0.046886444091796875, 0.057159423828125, 0.06743240356445312, 0.07770538330078125, 0.08797836303710938, 0.0982513427734375, 0.10852432250976562, 0.11879730224609375, 0.12907028198242188, 0.13934326171875, 0.14961624145507812, 0.15988922119140625, 0.17016220092773438, 0.1804351806640625, 0.19070816040039062, 0.20098114013671875, 0.21125411987304688, 0.221527099609375, 0.23180007934570312, 0.24207305908203125, 0.2523460388183594, 0.2626190185546875, 0.2728919982910156, 0.28316497802734375, 0.2934379577636719, 0.3037109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 5.0, 8.0, 14.0, 7.0, 16.0, 9.0, 18.0, 27.0, 29.0, 31.0, 43.0, 55.0, 51.0, 41.0, 57.0, 53.0, 67.0, 64.0, 46.0, 61.0, 45.0, 39.0, 32.0, 27.0, 24.0, 24.0, 26.0, 12.0, 13.0, 16.0, 7.0, 5.0, 6.0, 3.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.27703857421875, -5.0736083984375, -4.87017822265625, -4.666748046875, -4.46331787109375, -4.2598876953125, -4.05645751953125, -3.85302734375, -3.64959716796875, -3.4461669921875, -3.24273681640625, -3.039306640625, -2.83587646484375, -2.6324462890625, -2.42901611328125, -2.2255859375, -2.02215576171875, -1.8187255859375, -1.61529541015625, -1.411865234375, -1.20843505859375, -1.0050048828125, -0.80157470703125, -0.59814453125, -0.39471435546875, -0.1912841796875, 0.01214599609375, 0.215576171875, 0.41900634765625, 0.6224365234375, 0.82586669921875, 1.029296875, 1.23272705078125, 1.4361572265625, 1.63958740234375, 1.843017578125, 2.04644775390625, 2.2498779296875, 2.45330810546875, 2.65673828125, 2.86016845703125, 3.0635986328125, 3.26702880859375, 3.470458984375, 3.67388916015625, 3.8773193359375, 4.08074951171875, 4.2841796875, 4.48760986328125, 4.6910400390625, 4.89447021484375, 5.097900390625, 5.30133056640625, 5.5047607421875, 5.70819091796875, 5.91162109375, 6.11505126953125, 6.3184814453125, 6.52191162109375, 6.725341796875, 6.92877197265625, 7.1322021484375, 7.33563232421875, 7.5390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 11.0, 15.0, 24.0, 54.0, 58.0, 80.0, 142.0, 231.0, 408.0, 774.0, 1507.0, 3885.0, 11961.0, 47680.0, 255663.0, 543082.0, 141291.0, 28604.0, 7739.0, 2671.0, 1196.0, 554.0, 316.0, 198.0, 127.0, 74.0, 53.0, 46.0, 20.0, 27.0, 19.0, 15.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.100830078125, -0.09789276123046875, -0.0949554443359375, -0.09201812744140625, -0.089080810546875, -0.08614349365234375, -0.0832061767578125, -0.08026885986328125, -0.07733154296875, -0.07439422607421875, -0.0714569091796875, -0.06851959228515625, -0.065582275390625, -0.06264495849609375, -0.0597076416015625, -0.05677032470703125, -0.0538330078125, -0.05089569091796875, -0.0479583740234375, -0.04502105712890625, -0.042083740234375, -0.03914642333984375, -0.0362091064453125, -0.03327178955078125, -0.03033447265625, -0.02739715576171875, -0.0244598388671875, -0.02152252197265625, -0.018585205078125, -0.01564788818359375, -0.0127105712890625, -0.00977325439453125, -0.0068359375, -0.00389862060546875, -0.0009613037109375, 0.00197601318359375, 0.004913330078125, 0.00785064697265625, 0.0107879638671875, 0.01372528076171875, 0.01666259765625, 0.01959991455078125, 0.0225372314453125, 0.02547454833984375, 0.028411865234375, 0.03134918212890625, 0.0342864990234375, 0.03722381591796875, 0.0401611328125, 0.04309844970703125, 0.0460357666015625, 0.04897308349609375, 0.051910400390625, 0.05484771728515625, 0.0577850341796875, 0.06072235107421875, 0.06365966796875, 0.06659698486328125, 0.0695343017578125, 0.07247161865234375, 0.075408935546875, 0.07834625244140625, 0.0812835693359375, 0.08422088623046875, 0.087158203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 15.0, 25.0, 46.0, 46.0, 68.0, 76.0, 85.0, 101.0, 103.0, 97.0, 66.0, 58.0, 61.0, 35.0, 35.0, 18.0, 13.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577108383178711e-05, -8.361786603927612e-05, -8.146464824676514e-05, -7.931143045425415e-05, -7.715821266174316e-05, -7.500499486923218e-05, -7.285177707672119e-05, -7.06985592842102e-05, -6.854534149169922e-05, -6.639212369918823e-05, -6.423890590667725e-05, -6.208568811416626e-05, -5.9932470321655273e-05, -5.777925252914429e-05, -5.56260347366333e-05, -5.3472816944122314e-05, -5.131959915161133e-05, -4.916638135910034e-05, -4.7013163566589355e-05, -4.485994577407837e-05, -4.270672798156738e-05, -4.0553510189056396e-05, -3.840029239654541e-05, -3.6247074604034424e-05, -3.409385681152344e-05, -3.194063901901245e-05, -2.9787421226501465e-05, -2.763420343399048e-05, -2.5480985641479492e-05, -2.3327767848968506e-05, -2.117455005645752e-05, -1.9021332263946533e-05, -1.6868114471435547e-05, -1.471489667892456e-05, -1.2561678886413574e-05, -1.0408461093902588e-05, -8.255243301391602e-06, -6.102025508880615e-06, -3.948807716369629e-06, -1.7955899238586426e-06, 3.5762786865234375e-07, 2.51084566116333e-06, 4.664063453674316e-06, 6.817281246185303e-06, 8.970499038696289e-06, 1.1123716831207275e-05, 1.3276934623718262e-05, 1.5430152416229248e-05, 1.7583370208740234e-05, 1.973658800125122e-05, 2.1889805793762207e-05, 2.4043023586273193e-05, 2.619624137878418e-05, 2.8349459171295166e-05, 3.0502676963806152e-05, 3.265589475631714e-05, 3.4809112548828125e-05, 3.696233034133911e-05, 3.91155481338501e-05, 4.1268765926361084e-05, 4.342198371887207e-05, 4.557520151138306e-05, 4.772841930389404e-05, 4.988163709640503e-05, 5.2034854888916016e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 6.0, 18.0, 24.0, 29.0, 33.0, 48.0, 63.0, 90.0, 143.0, 205.0, 415.0, 772.0, 1549.0, 3726.0, 10181.0, 35577.0, 193051.0, 619493.0, 139974.0, 28240.0, 8605.0, 3258.0, 1359.0, 681.0, 358.0, 205.0, 127.0, 87.0, 59.0, 45.0, 19.0, 23.0, 6.0, 14.0, 12.0, 15.0, 5.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1195068359375, -0.1162252426147461, -0.11294364929199219, -0.10966205596923828, -0.10638046264648438, -0.10309886932373047, -0.09981727600097656, -0.09653568267822266, -0.09325408935546875, -0.08997249603271484, -0.08669090270996094, -0.08340930938720703, -0.08012771606445312, -0.07684612274169922, -0.07356452941894531, -0.0702829360961914, -0.0670013427734375, -0.0637197494506836, -0.06043815612792969, -0.05715656280517578, -0.053874969482421875, -0.05059337615966797, -0.04731178283691406, -0.044030189514160156, -0.04074859619140625, -0.037467002868652344, -0.03418540954589844, -0.03090381622314453, -0.027622222900390625, -0.02434062957763672, -0.021059036254882812, -0.017777442932128906, -0.014495849609375, -0.011214256286621094, -0.007932662963867188, -0.004651069641113281, -0.001369476318359375, 0.0019121170043945312, 0.0051937103271484375, 0.008475303649902344, 0.01175689697265625, 0.015038490295410156, 0.018320083618164062, 0.02160167694091797, 0.024883270263671875, 0.02816486358642578, 0.03144645690917969, 0.034728050231933594, 0.0380096435546875, 0.041291236877441406, 0.04457283020019531, 0.04785442352294922, 0.051136016845703125, 0.05441761016845703, 0.05769920349121094, 0.060980796813964844, 0.06426239013671875, 0.06754398345947266, 0.07082557678222656, 0.07410717010498047, 0.07738876342773438, 0.08067035675048828, 0.08395195007324219, 0.0872335433959961, 0.09051513671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 7.0, 7.0, 9.0, 7.0, 15.0, 14.0, 13.0, 26.0, 27.0, 33.0, 56.0, 60.0, 72.0, 85.0, 109.0, 87.0, 72.0, 40.0, 55.0, 33.0, 29.0, 26.0, 16.0, 17.0, 7.0, 8.0, 6.0, 7.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.026611328125, -0.025833845138549805, -0.02505636215209961, -0.024278879165649414, -0.02350139617919922, -0.022723913192749023, -0.021946430206298828, -0.021168947219848633, -0.020391464233398438, -0.019613981246948242, -0.018836498260498047, -0.01805901527404785, -0.017281532287597656, -0.01650404930114746, -0.015726566314697266, -0.01494908332824707, -0.014171600341796875, -0.01339411735534668, -0.012616634368896484, -0.011839151382446289, -0.011061668395996094, -0.010284185409545898, -0.009506702423095703, -0.008729219436645508, -0.007951736450195312, -0.007174253463745117, -0.006396770477294922, -0.0056192874908447266, -0.004841804504394531, -0.004064321517944336, -0.0032868385314941406, -0.0025093555450439453, -0.00173187255859375, -0.0009543895721435547, -0.00017690658569335938, 0.0006005764007568359, 0.0013780593872070312, 0.0021555423736572266, 0.002933025360107422, 0.003710508346557617, 0.0044879913330078125, 0.005265474319458008, 0.006042957305908203, 0.0068204402923583984, 0.007597923278808594, 0.008375406265258789, 0.009152889251708984, 0.00993037223815918, 0.010707855224609375, 0.01148533821105957, 0.012262821197509766, 0.013040304183959961, 0.013817787170410156, 0.014595270156860352, 0.015372753143310547, 0.016150236129760742, 0.016927719116210938, 0.017705202102661133, 0.018482685089111328, 0.019260168075561523, 0.02003765106201172, 0.020815134048461914, 0.02159261703491211, 0.022370100021362305, 0.0231475830078125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 16.0, 43.0, 82.0, 95.0, 146.0, 147.0, 153.0, 135.0, 80.0, 50.0, 24.0, 13.0, 10.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818401575088501, -3.6155362129211426, -3.4126710891723633, -3.209805727005005, -3.0069403648376465, -2.804075002670288, -2.6012096405029297, -2.3983445167541504, -2.195479154586792, -1.9926137924194336, -1.7897485494613647, -1.586883306503296, -1.3840179443359375, -1.181152582168579, -0.9782873392105103, -0.7754220962524414, -0.572556734085083, -0.3696914315223694, -0.16682612895965576, 0.03603917360305786, 0.23890447616577148, 0.4417698383331299, 0.6446350812911987, 0.8475003242492676, 1.050365686416626, 1.2532310485839844, 1.4560962915420532, 1.658961534500122, 1.8618268966674805, 2.064692258834839, 2.2675576210021973, 2.4704227447509766, 2.673288345336914, 2.8761537075042725, 3.079019069671631, 3.28188419342041, 3.4847495555877686, 3.687614917755127, 3.8904800415039062, 4.093345642089844, 4.296210765838623, 4.499075889587402, 4.70194149017334, 4.904806613922119, 5.107671737670898, 5.310537338256836, 5.513402462005615, 5.7162675857543945, 5.919133186340332, 6.121998310089111, 6.324863910675049, 6.527729034423828, 6.730594635009766, 6.933459758758545, 7.136324882507324, 7.339190483093262, 7.542055606842041, 7.74492073059082, 7.947786331176758, 8.150651931762695, 8.353516578674316, 8.556382179260254, 8.759247779846191, 8.962112426757812, 9.16497802734375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 11.0, 25.0, 30.0, 29.0, 40.0, 44.0, 47.0, 47.0, 53.0, 71.0, 59.0, 66.0, 66.0, 57.0, 67.0, 58.0, 35.0, 44.0, 33.0, 24.0, 20.0, 20.0, 8.0, 12.0, 4.0, 6.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.6918487548828125, -4.581019401550293, -4.470190525054932, -4.359361171722412, -4.248531818389893, -4.137702941894531, -4.026873588562012, -3.9160444736480713, -3.805215358734131, -3.6943862438201904, -3.583556890487671, -3.4727277755737305, -3.36189866065979, -3.2510695457458496, -3.14024019241333, -3.0294110774993896, -2.91858172416687, -2.8077526092529297, -2.69692325592041, -2.5860941410064697, -2.4752650260925293, -2.3644356727600098, -2.2536065578460693, -2.142777442932129, -2.0319480895996094, -1.9211188554763794, -1.810289740562439, -1.699460506439209, -1.5886313915252686, -1.4778021574020386, -1.3669729232788086, -1.2561438083648682, -1.1453146934509277, -1.0344854593276978, -0.9236563444137573, -0.8128271102905273, -0.7019979357719421, -0.5911687612533569, -0.48033952713012695, -0.36951035261154175, -0.25868117809295654, -0.14785198867321014, -0.037022799253463745, 0.07380640506744385, 0.18463557958602905, 0.29546475410461426, 0.40629398822784424, 0.5171231627464294, 0.6279523372650146, 0.7387815117835999, 0.8496106863021851, 0.960439920425415, 1.0712690353393555, 1.1820982694625854, 1.2929275035858154, 1.4037566184997559, 1.5145858526229858, 1.6254150867462158, 1.7362442016601562, 1.8470734357833862, 1.9579026699066162, 2.0687317848205566, 2.179561138153076, 2.2903902530670166, 2.401219367980957]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 4.0, 6.0, 6.0, 10.0, 10.0, 15.0, 22.0, 19.0, 57.0, 61.0, 95.0, 139.0, 218.0, 430.0, 811.0, 2073.0, 5814.0, 20848.0, 83657.0, 511142.0, 335240.0, 63293.0, 16319.0, 4849.0, 1750.0, 693.0, 387.0, 182.0, 124.0, 83.0, 51.0, 58.0, 29.0, 18.0, 10.0, 8.0, 13.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.921875, -4.78851318359375, -4.6551513671875, -4.52178955078125, -4.388427734375, -4.25506591796875, -4.1217041015625, -3.98834228515625, -3.85498046875, -3.72161865234375, -3.5882568359375, -3.45489501953125, -3.321533203125, -3.18817138671875, -3.0548095703125, -2.92144775390625, -2.7880859375, -2.65472412109375, -2.5213623046875, -2.38800048828125, -2.254638671875, -2.12127685546875, -1.9879150390625, -1.85455322265625, -1.72119140625, -1.58782958984375, -1.4544677734375, -1.32110595703125, -1.187744140625, -1.05438232421875, -0.9210205078125, -0.78765869140625, -0.654296875, -0.52093505859375, -0.3875732421875, -0.25421142578125, -0.120849609375, 0.01251220703125, 0.1458740234375, 0.27923583984375, 0.41259765625, 0.54595947265625, 0.6793212890625, 0.81268310546875, 0.946044921875, 1.07940673828125, 1.2127685546875, 1.34613037109375, 1.4794921875, 1.61285400390625, 1.7462158203125, 1.87957763671875, 2.012939453125, 2.14630126953125, 2.2796630859375, 2.41302490234375, 2.54638671875, 2.67974853515625, 2.8131103515625, 2.94647216796875, 3.079833984375, 3.21319580078125, 3.3465576171875, 3.47991943359375, 3.61328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 8.0, 19.0, 17.0, 20.0, 27.0, 23.0, 32.0, 34.0, 50.0, 46.0, 41.0, 56.0, 49.0, 51.0, 50.0, 59.0, 58.0, 50.0, 40.0, 38.0, 37.0, 37.0, 26.0, 27.0, 21.0, 15.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.76171875, -5.60162353515625, -5.4415283203125, -5.28143310546875, -5.121337890625, -4.96124267578125, -4.8011474609375, -4.64105224609375, -4.48095703125, -4.32086181640625, -4.1607666015625, -4.00067138671875, -3.840576171875, -3.68048095703125, -3.5203857421875, -3.36029052734375, -3.2001953125, -3.04010009765625, -2.8800048828125, -2.71990966796875, -2.559814453125, -2.39971923828125, -2.2396240234375, -2.07952880859375, -1.91943359375, -1.75933837890625, -1.5992431640625, -1.43914794921875, -1.279052734375, -1.11895751953125, -0.9588623046875, -0.79876708984375, -0.638671875, -0.47857666015625, -0.3184814453125, -0.15838623046875, 0.001708984375, 0.16180419921875, 0.3218994140625, 0.48199462890625, 0.64208984375, 0.80218505859375, 0.9622802734375, 1.12237548828125, 1.282470703125, 1.44256591796875, 1.6026611328125, 1.76275634765625, 1.9228515625, 2.08294677734375, 2.2430419921875, 2.40313720703125, 2.563232421875, 2.72332763671875, 2.8834228515625, 3.04351806640625, 3.20361328125, 3.36370849609375, 3.5238037109375, 3.68389892578125, 3.843994140625, 4.00408935546875, 4.1641845703125, 4.32427978515625, 4.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 10.0, 5.0, 14.0, 12.0, 18.0, 25.0, 27.0, 40.0, 56.0, 72.0, 83.0, 111.0, 207.0, 301.0, 755.0, 3520.0, 37107.0, 783240.0, 208058.0, 12109.0, 1545.0, 430.0, 211.0, 142.0, 102.0, 60.0, 65.0, 45.0, 37.0, 28.0, 22.0, 21.0, 9.0, 15.0, 7.0, 7.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.890625, -9.62176513671875, -9.3529052734375, -9.08404541015625, -8.815185546875, -8.54632568359375, -8.2774658203125, -8.00860595703125, -7.73974609375, -7.47088623046875, -7.2020263671875, -6.93316650390625, -6.664306640625, -6.39544677734375, -6.1265869140625, -5.85772705078125, -5.5888671875, -5.32000732421875, -5.0511474609375, -4.78228759765625, -4.513427734375, -4.24456787109375, -3.9757080078125, -3.70684814453125, -3.43798828125, -3.16912841796875, -2.9002685546875, -2.63140869140625, -2.362548828125, -2.09368896484375, -1.8248291015625, -1.55596923828125, -1.287109375, -1.01824951171875, -0.7493896484375, -0.48052978515625, -0.211669921875, 0.05718994140625, 0.3260498046875, 0.59490966796875, 0.86376953125, 1.13262939453125, 1.4014892578125, 1.67034912109375, 1.939208984375, 2.20806884765625, 2.4769287109375, 2.74578857421875, 3.0146484375, 3.28350830078125, 3.5523681640625, 3.82122802734375, 4.090087890625, 4.35894775390625, 4.6278076171875, 4.89666748046875, 5.16552734375, 5.43438720703125, 5.7032470703125, 5.97210693359375, 6.240966796875, 6.50982666015625, 6.7786865234375, 7.04754638671875, 7.31640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 1.0, 4.0, 8.0, 6.0, 12.0, 23.0, 22.0, 13.0, 22.0, 36.0, 21.0, 25.0, 31.0, 33.0, 35.0, 43.0, 54.0, 41.0, 52.0, 51.0, 41.0, 48.0, 36.0, 47.0, 42.0, 24.0, 47.0, 33.0, 16.0, 25.0, 19.0, 12.0, 9.0, 12.0, 8.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0], "bins": [-5.7109375, -5.555908203125, -5.40087890625, -5.245849609375, -5.0908203125, -4.935791015625, -4.78076171875, -4.625732421875, -4.470703125, -4.315673828125, -4.16064453125, -4.005615234375, -3.8505859375, -3.695556640625, -3.54052734375, -3.385498046875, -3.23046875, -3.075439453125, -2.92041015625, -2.765380859375, -2.6103515625, -2.455322265625, -2.30029296875, -2.145263671875, -1.990234375, -1.835205078125, -1.68017578125, -1.525146484375, -1.3701171875, -1.215087890625, -1.06005859375, -0.905029296875, -0.75, -0.594970703125, -0.43994140625, -0.284912109375, -0.1298828125, 0.025146484375, 0.18017578125, 0.335205078125, 0.490234375, 0.645263671875, 0.80029296875, 0.955322265625, 1.1103515625, 1.265380859375, 1.42041015625, 1.575439453125, 1.73046875, 1.885498046875, 2.04052734375, 2.195556640625, 2.3505859375, 2.505615234375, 2.66064453125, 2.815673828125, 2.970703125, 3.125732421875, 3.28076171875, 3.435791015625, 3.5908203125, 3.745849609375, 3.90087890625, 4.055908203125, 4.2109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 12.0, 8.0, 12.0, 20.0, 41.0, 45.0, 78.0, 155.0, 353.0, 1078.0, 6333.0, 119976.0, 862275.0, 53103.0, 3570.0, 816.0, 267.0, 137.0, 91.0, 51.0, 38.0, 22.0, 14.0, 11.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.174041748046875, -2.10003662109375, -2.026031494140625, -1.9520263671875, -1.878021240234375, -1.80401611328125, -1.730010986328125, -1.656005859375, -1.582000732421875, -1.50799560546875, -1.433990478515625, -1.3599853515625, -1.285980224609375, -1.21197509765625, -1.137969970703125, -1.06396484375, -0.989959716796875, -0.91595458984375, -0.841949462890625, -0.7679443359375, -0.693939208984375, -0.61993408203125, -0.545928955078125, -0.471923828125, -0.397918701171875, -0.32391357421875, -0.249908447265625, -0.1759033203125, -0.101898193359375, -0.02789306640625, 0.046112060546875, 0.1201171875, 0.194122314453125, 0.26812744140625, 0.342132568359375, 0.4161376953125, 0.490142822265625, 0.56414794921875, 0.638153076171875, 0.712158203125, 0.786163330078125, 0.86016845703125, 0.934173583984375, 1.0081787109375, 1.082183837890625, 1.15618896484375, 1.230194091796875, 1.30419921875, 1.378204345703125, 1.45220947265625, 1.526214599609375, 1.6002197265625, 1.674224853515625, 1.74822998046875, 1.822235107421875, 1.896240234375, 1.970245361328125, 2.04425048828125, 2.118255615234375, 2.1922607421875, 2.266265869140625, 2.34027099609375, 2.414276123046875, 2.48828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 7.0, 8.0, 23.0, 24.0, 47.0, 28.0, 57.0, 73.0, 105.0, 118.0, 135.0, 86.0, 66.0, 51.0, 32.0, 28.0, 19.0, 24.0, 16.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001824982464313507, -0.00017593055963516235, -0.000169362872838974, -0.00016279518604278564, -0.0001562274992465973, -0.00014965981245040894, -0.00014309212565422058, -0.00013652443885803223, -0.00012995675206184387, -0.00012338906526565552, -0.00011682137846946716, -0.00011025369167327881, -0.00010368600487709045, -9.71183180809021e-05, -9.055063128471375e-05, -8.398294448852539e-05, -7.741525769233704e-05, -7.084757089614868e-05, -6.427988409996033e-05, -5.771219730377197e-05, -5.114451050758362e-05, -4.4576823711395264e-05, -3.800913691520691e-05, -3.1441450119018555e-05, -2.48737633228302e-05, -1.8306076526641846e-05, -1.1738389730453491e-05, -5.170702934265137e-06, 1.3969838619232178e-06, 7.964670658111572e-06, 1.4532357454299927e-05, 2.110004425048828e-05, 2.7667731046676636e-05, 3.423541784286499e-05, 4.0803104639053345e-05, 4.73707914352417e-05, 5.3938478231430054e-05, 6.050616502761841e-05, 6.707385182380676e-05, 7.364153861999512e-05, 8.020922541618347e-05, 8.677691221237183e-05, 9.334459900856018e-05, 9.991228580474854e-05, 0.00010647997260093689, 0.00011304765939712524, 0.0001196153461933136, 0.00012618303298950195, 0.0001327507197856903, 0.00013931840658187866, 0.00014588609337806702, 0.00015245378017425537, 0.00015902146697044373, 0.00016558915376663208, 0.00017215684056282043, 0.0001787245273590088, 0.00018529221415519714, 0.0001918599009513855, 0.00019842758774757385, 0.0002049952745437622, 0.00021156296133995056, 0.00021813064813613892, 0.00022469833493232727, 0.00023126602172851562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 19.0, 40.0, 74.0, 185.0, 471.0, 1204.0, 4989.0, 199320.0, 828090.0, 11412.0, 1695.0, 583.0, 237.0, 100.0, 51.0, 25.0, 17.0, 6.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6484375, -3.5313720703125, -3.414306640625, -3.2972412109375, -3.18017578125, -3.0631103515625, -2.946044921875, -2.8289794921875, -2.7119140625, -2.5948486328125, -2.477783203125, -2.3607177734375, -2.24365234375, -2.1265869140625, -2.009521484375, -1.8924560546875, -1.775390625, -1.6583251953125, -1.541259765625, -1.4241943359375, -1.30712890625, -1.1900634765625, -1.072998046875, -0.9559326171875, -0.8388671875, -0.7218017578125, -0.604736328125, -0.4876708984375, -0.37060546875, -0.2535400390625, -0.136474609375, -0.0194091796875, 0.09765625, 0.2147216796875, 0.331787109375, 0.4488525390625, 0.56591796875, 0.6829833984375, 0.800048828125, 0.9171142578125, 1.0341796875, 1.1512451171875, 1.268310546875, 1.3853759765625, 1.50244140625, 1.6195068359375, 1.736572265625, 1.8536376953125, 1.970703125, 2.0877685546875, 2.204833984375, 2.3218994140625, 2.43896484375, 2.5560302734375, 2.673095703125, 2.7901611328125, 2.9072265625, 3.0242919921875, 3.141357421875, 3.2584228515625, 3.37548828125, 3.4925537109375, 3.609619140625, 3.7266845703125, 3.84375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 20.0, 19.0, 48.0, 68.0, 104.0, 199.0, 229.0, 122.0, 71.0, 31.0, 24.0, 22.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2599945068359375, -1.226043701171875, -1.1920928955078125, -1.15814208984375, -1.1241912841796875, -1.090240478515625, -1.0562896728515625, -1.0223388671875, -0.9883880615234375, -0.954437255859375, -0.9204864501953125, -0.88653564453125, -0.8525848388671875, -0.818634033203125, -0.7846832275390625, -0.750732421875, -0.7167816162109375, -0.682830810546875, -0.6488800048828125, -0.61492919921875, -0.5809783935546875, -0.547027587890625, -0.5130767822265625, -0.4791259765625, -0.4451751708984375, -0.411224365234375, -0.3772735595703125, -0.34332275390625, -0.3093719482421875, -0.275421142578125, -0.2414703369140625, -0.20751953125, -0.1735687255859375, -0.139617919921875, -0.1056671142578125, -0.07171630859375, -0.0377655029296875, -0.003814697265625, 0.0301361083984375, 0.0640869140625, 0.0980377197265625, 0.131988525390625, 0.1659393310546875, 0.19989013671875, 0.2338409423828125, 0.267791748046875, 0.3017425537109375, 0.335693359375, 0.3696441650390625, 0.403594970703125, 0.4375457763671875, 0.47149658203125, 0.5054473876953125, 0.539398193359375, 0.5733489990234375, 0.6072998046875, 0.6412506103515625, 0.675201416015625, 0.7091522216796875, 0.74310302734375, 0.7770538330078125, 0.811004638671875, 0.8449554443359375, 0.87890625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 16.0, 10.0, 17.0, 28.0, 38.0, 36.0, 56.0, 68.0, 52.0, 66.0, 73.0, 75.0, 99.0, 68.0, 52.0, 53.0, 46.0, 38.0, 27.0, 16.0, 19.0, 27.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3045148849487305, -6.111701011657715, -5.918887138366699, -5.726073265075684, -5.533259391784668, -5.340445518493652, -5.147631645202637, -4.954817771911621, -4.7620038986206055, -4.56919002532959, -4.376376152038574, -4.183562278747559, -3.990748405456543, -3.7979345321655273, -3.605120897293091, -3.412307024002075, -3.2194933891296387, -3.026679515838623, -2.8338656425476074, -2.641051769256592, -2.448237895965576, -2.2554240226745605, -2.062610387802124, -1.8697965145111084, -1.6769826412200928, -1.4841687679290771, -1.2913548946380615, -1.0985411405563354, -0.9057272672653198, -0.7129133939743042, -0.5200996398925781, -0.3272857666015625, -0.13447141647338867, 0.058342427015304565, 0.2511562705039978, 0.44397008419036865, 0.6367839574813843, 0.8295978307723999, 1.022411584854126, 1.2152254581451416, 1.4080393314361572, 1.6008532047271729, 1.7936670780181885, 1.9864808320999146, 2.1792945861816406, 2.3721084594726562, 2.564922332763672, 2.7577362060546875, 2.950550079345703, 3.1433639526367188, 3.3361778259277344, 3.52899169921875, 3.7218055725097656, 3.9146194458007812, 4.107433319091797, 4.3002471923828125, 4.493061065673828, 4.685874938964844, 4.878688812255859, 5.071502685546875, 5.264316558837891, 5.457130432128906, 5.649944305419922, 5.8427581787109375, 6.035571575164795]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 12.0, 13.0, 10.0, 20.0, 18.0, 20.0, 23.0, 36.0, 32.0, 37.0, 47.0, 48.0, 52.0, 50.0, 50.0, 46.0, 49.0, 55.0, 40.0, 54.0, 38.0, 46.0, 42.0, 32.0, 24.0, 18.0, 14.0, 15.0, 11.0, 8.0, 12.0, 3.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.694814682006836, -9.386423110961914, -9.078031539916992, -8.769640922546387, -8.461249351501465, -8.152857780456543, -7.844466209411621, -7.536074638366699, -7.2276835441589355, -6.919291973114014, -6.61090087890625, -6.302509307861328, -5.994117736816406, -5.685726642608643, -5.377335071563721, -5.068943977355957, -4.760552406311035, -4.452160835266113, -4.14376974105835, -3.8353781700134277, -3.526986837387085, -3.218595504760742, -2.9102039337158203, -2.6018126010894775, -2.2934212684631348, -1.985029935836792, -1.6766384840011597, -1.3682470321655273, -1.0598556995391846, -0.7514643669128418, -0.4430729150772095, -0.13468146324157715, 0.17371082305908203, 0.4821022152900696, 0.7904936075210571, 1.0988850593566895, 1.4072763919830322, 1.715667724609375, 2.024059295654297, 2.3324506282806396, 2.6408419609069824, 2.949233293533325, 3.257624626159668, 3.56601619720459, 3.8744075298309326, 4.182798862457275, 4.491190433502197, 4.799581527709961, 5.107973098754883, 5.416364669799805, 5.724755764007568, 6.03314733505249, 6.341538429260254, 6.649930000305176, 6.958321571350098, 7.2667131423950195, 7.575104236602783, 7.883495807647705, 8.191886901855469, 8.50027847290039, 8.808670043945312, 9.117061614990234, 9.42545223236084, 9.733843803405762, 10.042235374450684]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 14.0, 15.0, 40.0, 52.0, 108.0, 158.0, 268.0, 463.0, 920.0, 1935.0, 4949.0, 16966.0, 85556.0, 676130.0, 2440891.0, 832948.0, 104197.0, 19205.0, 5313.0, 2054.0, 983.0, 481.0, 254.0, 142.0, 86.0, 60.0, 34.0, 17.0, 14.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.281219482421875, -5.14056396484375, -4.999908447265625, -4.8592529296875, -4.718597412109375, -4.57794189453125, -4.437286376953125, -4.296630859375, -4.155975341796875, -4.01531982421875, -3.874664306640625, -3.7340087890625, -3.593353271484375, -3.45269775390625, -3.312042236328125, -3.17138671875, -3.030731201171875, -2.89007568359375, -2.749420166015625, -2.6087646484375, -2.468109130859375, -2.32745361328125, -2.186798095703125, -2.046142578125, -1.905487060546875, -1.76483154296875, -1.624176025390625, -1.4835205078125, -1.342864990234375, -1.20220947265625, -1.061553955078125, -0.9208984375, -0.780242919921875, -0.63958740234375, -0.498931884765625, -0.3582763671875, -0.217620849609375, -0.07696533203125, 0.063690185546875, 0.204345703125, 0.345001220703125, 0.48565673828125, 0.626312255859375, 0.7669677734375, 0.907623291015625, 1.04827880859375, 1.188934326171875, 1.32958984375, 1.470245361328125, 1.61090087890625, 1.751556396484375, 1.8922119140625, 2.032867431640625, 2.17352294921875, 2.314178466796875, 2.454833984375, 2.595489501953125, 2.73614501953125, 2.876800537109375, 3.0174560546875, 3.158111572265625, 3.29876708984375, 3.439422607421875, 3.580078125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 15.0, 8.0, 11.0, 20.0, 11.0, 20.0, 16.0, 23.0, 23.0, 18.0, 31.0, 29.0, 31.0, 39.0, 37.0, 51.0, 44.0, 31.0, 37.0, 39.0, 37.0, 45.0, 49.0, 41.0, 28.0, 34.0, 31.0, 22.0, 25.0, 21.0, 21.0, 24.0, 14.0, 14.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.373046875, -2.2923583984375, -2.211669921875, -2.1309814453125, -2.05029296875, -1.9696044921875, -1.888916015625, -1.8082275390625, -1.7275390625, -1.6468505859375, -1.566162109375, -1.4854736328125, -1.40478515625, -1.3240966796875, -1.243408203125, -1.1627197265625, -1.08203125, -1.0013427734375, -0.920654296875, -0.8399658203125, -0.75927734375, -0.6785888671875, -0.597900390625, -0.5172119140625, -0.4365234375, -0.3558349609375, -0.275146484375, -0.1944580078125, -0.11376953125, -0.0330810546875, 0.047607421875, 0.1282958984375, 0.208984375, 0.2896728515625, 0.370361328125, 0.4510498046875, 0.53173828125, 0.6124267578125, 0.693115234375, 0.7738037109375, 0.8544921875, 0.9351806640625, 1.015869140625, 1.0965576171875, 1.17724609375, 1.2579345703125, 1.338623046875, 1.4193115234375, 1.5, 1.5806884765625, 1.661376953125, 1.7420654296875, 1.82275390625, 1.9034423828125, 1.984130859375, 2.0648193359375, 2.1455078125, 2.2261962890625, 2.306884765625, 2.3875732421875, 2.46826171875, 2.5489501953125, 2.629638671875, 2.7103271484375, 2.791015625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 17.0, 19.0, 20.0, 43.0, 80.0, 126.0, 248.0, 642.0, 2142.0, 16448.0, 1078343.0, 3060309.0, 31290.0, 3065.0, 771.0, 302.0, 142.0, 102.0, 47.0, 36.0, 25.0, 12.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -11.0390625, -10.6953125, -10.3515625, -10.0078125, -9.6640625, -9.3203125, -8.9765625, -8.6328125, -8.2890625, -7.9453125, -7.6015625, -7.2578125, -6.9140625, -6.5703125, -6.2265625, -5.8828125, -5.5390625, -5.1953125, -4.8515625, -4.5078125, -4.1640625, -3.8203125, -3.4765625, -3.1328125, -2.7890625, -2.4453125, -2.1015625, -1.7578125, -1.4140625, -1.0703125, -0.7265625, -0.3828125, -0.0390625, 0.3046875, 0.6484375, 0.9921875, 1.3359375, 1.6796875, 2.0234375, 2.3671875, 2.7109375, 3.0546875, 3.3984375, 3.7421875, 4.0859375, 4.4296875, 4.7734375, 5.1171875, 5.4609375, 5.8046875, 6.1484375, 6.4921875, 6.8359375, 7.1796875, 7.5234375, 7.8671875, 8.2109375, 8.5546875, 8.8984375, 9.2421875, 9.5859375, 9.9296875, 10.2734375, 10.6171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 10.0, 10.0, 17.0, 19.0, 31.0, 26.0, 53.0, 73.0, 102.0, 150.0, 221.0, 283.0, 382.0, 474.0, 500.0, 403.0, 353.0, 272.0, 181.0, 127.0, 101.0, 64.0, 57.0, 31.0, 26.0, 19.0, 10.0, 8.0, 13.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.3701171875, -1.3249969482421875, -1.279876708984375, -1.2347564697265625, -1.18963623046875, -1.1445159912109375, -1.099395751953125, -1.0542755126953125, -1.0091552734375, -0.9640350341796875, -0.918914794921875, -0.8737945556640625, -0.82867431640625, -0.7835540771484375, -0.738433837890625, -0.6933135986328125, -0.648193359375, -0.6030731201171875, -0.557952880859375, -0.5128326416015625, -0.46771240234375, -0.4225921630859375, -0.377471923828125, -0.3323516845703125, -0.2872314453125, -0.2421112060546875, -0.196990966796875, -0.1518707275390625, -0.10675048828125, -0.0616302490234375, -0.016510009765625, 0.0286102294921875, 0.07373046875, 0.1188507080078125, 0.163970947265625, 0.2090911865234375, 0.25421142578125, 0.2993316650390625, 0.344451904296875, 0.3895721435546875, 0.4346923828125, 0.4798126220703125, 0.524932861328125, 0.5700531005859375, 0.61517333984375, 0.6602935791015625, 0.705413818359375, 0.7505340576171875, 0.795654296875, 0.8407745361328125, 0.885894775390625, 0.9310150146484375, 0.97613525390625, 1.0212554931640625, 1.066375732421875, 1.1114959716796875, 1.1566162109375, 1.2017364501953125, 1.246856689453125, 1.2919769287109375, 1.33709716796875, 1.3822174072265625, 1.427337646484375, 1.4724578857421875, 1.517578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 16.0, 25.0, 23.0, 31.0, 37.0, 46.0, 50.0, 64.0, 71.0, 63.0, 68.0, 76.0, 57.0, 60.0, 58.0, 59.0, 49.0, 26.0, 36.0, 24.0, 8.0, 12.0, 6.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.058391571044922, -2.923959732055664, -2.789527654647827, -2.6550958156585693, -2.5206637382507324, -2.3862318992614746, -2.251800060272217, -2.11736798286438, -1.9829360246658325, -1.8485040664672852, -1.7140721082687378, -1.5796401500701904, -1.4452083110809326, -1.3107762336730957, -1.176344394683838, -1.0419124364852905, -0.9074804782867432, -0.7730485200881958, -0.6386165618896484, -0.5041846632957458, -0.3697527050971985, -0.23532074689865112, -0.10088884830474854, 0.03354310989379883, 0.1679750680923462, 0.30240702629089355, 0.43683895468711853, 0.5712708830833435, 0.7057028412818909, 0.8401347994804382, 0.9745666980743408, 1.1089986562728882, 1.2434306144714355, 1.377862572669983, 1.5122945308685303, 1.646726369857788, 1.781158447265625, 1.9155902862548828, 2.0500221252441406, 2.1844542026519775, 2.3188862800598145, 2.4533181190490723, 2.587750196456909, 2.722182035446167, 2.856614112854004, 2.9910459518432617, 3.1254777908325195, 3.2599098682403564, 3.3943417072296143, 3.528773546218872, 3.663205623626709, 3.797637462615967, 3.9320695400238037, 4.066501617431641, 4.200933456420898, 4.335365295410156, 4.469797134399414, 4.604228973388672, 4.73866081237793, 4.873093128204346, 5.0075249671936035, 5.141956806182861, 5.276388645172119, 5.410820960998535, 5.545252799987793]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 11.0, 6.0, 10.0, 10.0, 12.0, 20.0, 20.0, 21.0, 19.0, 20.0, 23.0, 26.0, 25.0, 35.0, 40.0, 42.0, 55.0, 39.0, 41.0, 33.0, 45.0, 30.0, 43.0, 38.0, 29.0, 40.0, 31.0, 35.0, 35.0, 24.0, 22.0, 30.0, 18.0, 7.0, 9.0, 8.0, 5.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.383267879486084, -3.282144069671631, -3.1810200214385986, -3.0798962116241455, -2.9787721633911133, -2.87764835357666, -2.776524543762207, -2.675400733947754, -2.5742766857147217, -2.4731528759002686, -2.3720288276672363, -2.270905017852783, -2.16978120803833, -2.068657159805298, -1.9675333499908447, -1.866409420967102, -1.7652854919433594, -1.6641615629196167, -1.563037633895874, -1.461913824081421, -1.3607898950576782, -1.2596659660339355, -1.1585421562194824, -1.0574182271957397, -0.9562942981719971, -0.8551703691482544, -0.7540464997291565, -0.6529226303100586, -0.5517987012863159, -0.45067477226257324, -0.34955090284347534, -0.24842703342437744, -0.14730310440063477, -0.04617920517921448, 0.05494469404220581, 0.1560685932636261, 0.2571924924850464, 0.35831642150878906, 0.45944029092788696, 0.5605641603469849, 0.6616880893707275, 0.7628120183944702, 0.8639358878135681, 0.965059757232666, 1.0661836862564087, 1.1673076152801514, 1.2684314250946045, 1.3695553541183472, 1.4706792831420898, 1.5718032121658325, 1.6729271411895752, 1.7740509510040283, 1.875174880027771, 1.9762988090515137, 2.077422618865967, 2.17854642868042, 2.279670476913452, 2.3807942867279053, 2.4819183349609375, 2.5830421447753906, 2.6841659545898438, 2.785290002822876, 2.886413812637329, 2.9875378608703613, 3.0886616706848145]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 9.0, 12.0, 9.0, 15.0, 28.0, 36.0, 41.0, 42.0, 78.0, 111.0, 175.0, 288.0, 478.0, 843.0, 1584.0, 3205.0, 8517.0, 31105.0, 151964.0, 504876.0, 268588.0, 54171.0, 13219.0, 4639.0, 1995.0, 998.0, 569.0, 334.0, 186.0, 140.0, 87.0, 64.0, 41.0, 28.0, 13.0, 14.0, 11.0, 11.0, 6.0, 6.0, 7.0, 0.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.974609375, -0.9487457275390625, -0.922882080078125, -0.8970184326171875, -0.87115478515625, -0.8452911376953125, -0.819427490234375, -0.7935638427734375, -0.7677001953125, -0.7418365478515625, -0.715972900390625, -0.6901092529296875, -0.66424560546875, -0.6383819580078125, -0.612518310546875, -0.5866546630859375, -0.560791015625, -0.5349273681640625, -0.509063720703125, -0.4832000732421875, -0.45733642578125, -0.4314727783203125, -0.405609130859375, -0.3797454833984375, -0.3538818359375, -0.3280181884765625, -0.302154541015625, -0.2762908935546875, -0.25042724609375, -0.2245635986328125, -0.198699951171875, -0.1728363037109375, -0.14697265625, -0.1211090087890625, -0.095245361328125, -0.0693817138671875, -0.04351806640625, -0.0176544189453125, 0.008209228515625, 0.0340728759765625, 0.0599365234375, 0.0858001708984375, 0.111663818359375, 0.1375274658203125, 0.16339111328125, 0.1892547607421875, 0.215118408203125, 0.2409820556640625, 0.266845703125, 0.2927093505859375, 0.318572998046875, 0.3444366455078125, 0.37030029296875, 0.3961639404296875, 0.422027587890625, 0.4478912353515625, 0.4737548828125, 0.4996185302734375, 0.525482177734375, 0.5513458251953125, 0.57720947265625, 0.6030731201171875, 0.628936767578125, 0.6548004150390625, 0.6806640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 8.0, 9.0, 11.0, 19.0, 15.0, 13.0, 27.0, 22.0, 20.0, 26.0, 31.0, 34.0, 40.0, 46.0, 41.0, 49.0, 45.0, 27.0, 50.0, 44.0, 49.0, 39.0, 40.0, 42.0, 40.0, 37.0, 22.0, 25.0, 23.0, 20.0, 14.0, 9.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-2.466796875, -2.3994293212890625, -2.332061767578125, -2.2646942138671875, -2.19732666015625, -2.1299591064453125, -2.062591552734375, -1.9952239990234375, -1.9278564453125, -1.8604888916015625, -1.793121337890625, -1.7257537841796875, -1.65838623046875, -1.5910186767578125, -1.523651123046875, -1.4562835693359375, -1.388916015625, -1.3215484619140625, -1.254180908203125, -1.1868133544921875, -1.11944580078125, -1.0520782470703125, -0.984710693359375, -0.9173431396484375, -0.8499755859375, -0.7826080322265625, -0.715240478515625, -0.6478729248046875, -0.58050537109375, -0.5131378173828125, -0.445770263671875, -0.3784027099609375, -0.31103515625, -0.2436676025390625, -0.176300048828125, -0.1089324951171875, -0.04156494140625, 0.0258026123046875, 0.093170166015625, 0.1605377197265625, 0.2279052734375, 0.2952728271484375, 0.362640380859375, 0.4300079345703125, 0.49737548828125, 0.5647430419921875, 0.632110595703125, 0.6994781494140625, 0.766845703125, 0.8342132568359375, 0.901580810546875, 0.9689483642578125, 1.03631591796875, 1.1036834716796875, 1.171051025390625, 1.2384185791015625, 1.3057861328125, 1.3731536865234375, 1.440521240234375, 1.5078887939453125, 1.57525634765625, 1.6426239013671875, 1.709991455078125, 1.7773590087890625, 1.8447265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 12.0, 16.0, 25.0, 24.0, 45.0, 75.0, 122.0, 230.0, 469.0, 857.0, 1901.0, 4089.0, 8908.0, 19797.0, 43697.0, 93367.0, 183521.0, 265505.0, 212482.0, 113807.0, 53824.0, 24718.0, 11420.0, 5036.0, 2298.0, 1095.0, 554.0, 277.0, 146.0, 93.0, 42.0, 31.0, 25.0, 16.0, 10.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2759056091308594, -0.26689910888671875, -0.2578926086425781, -0.2488861083984375, -0.23987960815429688, -0.23087310791015625, -0.22186660766601562, -0.212860107421875, -0.20385360717773438, -0.19484710693359375, -0.18584060668945312, -0.1768341064453125, -0.16782760620117188, -0.15882110595703125, -0.14981460571289062, -0.14080810546875, -0.13180160522460938, -0.12279510498046875, -0.11378860473632812, -0.1047821044921875, -0.09577560424804688, -0.08676910400390625, -0.07776260375976562, -0.068756103515625, -0.059749603271484375, -0.05074310302734375, -0.041736602783203125, -0.0327301025390625, -0.023723602294921875, -0.01471710205078125, -0.005710601806640625, 0.0032958984375, 0.012302398681640625, 0.02130889892578125, 0.030315399169921875, 0.0393218994140625, 0.048328399658203125, 0.05733489990234375, 0.06634140014648438, 0.075347900390625, 0.08435440063476562, 0.09336090087890625, 0.10236740112304688, 0.1113739013671875, 0.12038040161132812, 0.12938690185546875, 0.13839340209960938, 0.14739990234375, 0.15640640258789062, 0.16541290283203125, 0.17441940307617188, 0.1834259033203125, 0.19243240356445312, 0.20143890380859375, 0.21044540405273438, 0.219451904296875, 0.22845840454101562, 0.23746490478515625, 0.24647140502929688, 0.2554779052734375, 0.2644844055175781, 0.27349090576171875, 0.2824974060058594, 0.29150390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 2.0, 6.0, 6.0, 6.0, 10.0, 12.0, 12.0, 15.0, 18.0, 31.0, 31.0, 20.0, 35.0, 44.0, 34.0, 42.0, 56.0, 51.0, 44.0, 42.0, 50.0, 44.0, 37.0, 48.0, 38.0, 34.0, 39.0, 33.0, 18.0, 25.0, 18.0, 14.0, 20.0, 8.0, 6.0, 10.0, 15.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.16253662109375, -4.0203857421875, -3.87823486328125, -3.736083984375, -3.59393310546875, -3.4517822265625, -3.30963134765625, -3.16748046875, -3.02532958984375, -2.8831787109375, -2.74102783203125, -2.598876953125, -2.45672607421875, -2.3145751953125, -2.17242431640625, -2.0302734375, -1.88812255859375, -1.7459716796875, -1.60382080078125, -1.461669921875, -1.31951904296875, -1.1773681640625, -1.03521728515625, -0.89306640625, -0.75091552734375, -0.6087646484375, -0.46661376953125, -0.324462890625, -0.18231201171875, -0.0401611328125, 0.10198974609375, 0.244140625, 0.38629150390625, 0.5284423828125, 0.67059326171875, 0.812744140625, 0.95489501953125, 1.0970458984375, 1.23919677734375, 1.38134765625, 1.52349853515625, 1.6656494140625, 1.80780029296875, 1.949951171875, 2.09210205078125, 2.2342529296875, 2.37640380859375, 2.5185546875, 2.66070556640625, 2.8028564453125, 2.94500732421875, 3.087158203125, 3.22930908203125, 3.3714599609375, 3.51361083984375, 3.65576171875, 3.79791259765625, 3.9400634765625, 4.08221435546875, 4.224365234375, 4.36651611328125, 4.5086669921875, 4.65081787109375, 4.79296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 10.0, 22.0, 18.0, 37.0, 52.0, 55.0, 86.0, 107.0, 216.0, 386.0, 737.0, 1708.0, 5715.0, 32590.0, 577613.0, 396397.0, 24968.0, 4822.0, 1501.0, 629.0, 322.0, 173.0, 114.0, 86.0, 47.0, 32.0, 29.0, 23.0, 18.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171875, -0.1663188934326172, -0.16076278686523438, -0.15520668029785156, -0.14965057373046875, -0.14409446716308594, -0.13853836059570312, -0.1329822540283203, -0.1274261474609375, -0.12187004089355469, -0.11631393432617188, -0.11075782775878906, -0.10520172119140625, -0.09964561462402344, -0.09408950805664062, -0.08853340148925781, -0.082977294921875, -0.07742118835449219, -0.07186508178710938, -0.06630897521972656, -0.06075286865234375, -0.05519676208496094, -0.049640655517578125, -0.04408454895019531, -0.0385284423828125, -0.03297233581542969, -0.027416229248046875, -0.021860122680664062, -0.01630401611328125, -0.010747909545898438, -0.005191802978515625, 0.0003643035888671875, 0.00592041015625, 0.011476516723632812, 0.017032623291015625, 0.022588729858398438, 0.02814483642578125, 0.03370094299316406, 0.039257049560546875, 0.04481315612792969, 0.0503692626953125, 0.05592536926269531, 0.061481475830078125, 0.06703758239746094, 0.07259368896484375, 0.07814979553222656, 0.08370590209960938, 0.08926200866699219, 0.094818115234375, 0.10037422180175781, 0.10593032836914062, 0.11148643493652344, 0.11704254150390625, 0.12259864807128906, 0.12815475463867188, 0.1337108612060547, 0.1392669677734375, 0.1448230743408203, 0.15037918090820312, 0.15593528747558594, 0.16149139404296875, 0.16704750061035156, 0.17260360717773438, 0.1781597137451172, 0.1837158203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 8.0, 6.0, 12.0, 8.0, 20.0, 30.0, 45.0, 40.0, 67.0, 80.0, 85.0, 96.0, 107.0, 97.0, 83.0, 45.0, 45.0, 27.0, 27.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16908073425293e-05, -5.9752725064754486e-05, -5.7814642786979675e-05, -5.5876560509204865e-05, -5.3938478231430054e-05, -5.200039595365524e-05, -5.006231367588043e-05, -4.812423139810562e-05, -4.618614912033081e-05, -4.4248066842556e-05, -4.230998456478119e-05, -4.037190228700638e-05, -3.843382000923157e-05, -3.6495737731456757e-05, -3.4557655453681946e-05, -3.2619573175907135e-05, -3.0681490898132324e-05, -2.8743408620357513e-05, -2.6805326342582703e-05, -2.4867244064807892e-05, -2.292916178703308e-05, -2.099107950925827e-05, -1.905299723148346e-05, -1.711491495370865e-05, -1.5176832675933838e-05, -1.3238750398159027e-05, -1.1300668120384216e-05, -9.362585842609406e-06, -7.424503564834595e-06, -5.486421287059784e-06, -3.548339009284973e-06, -1.6102567315101624e-06, 3.2782554626464844e-07, 2.2659078240394592e-06, 4.20399010181427e-06, 6.142072379589081e-06, 8.080154657363892e-06, 1.0018236935138702e-05, 1.1956319212913513e-05, 1.3894401490688324e-05, 1.5832483768463135e-05, 1.7770566046237946e-05, 1.9708648324012756e-05, 2.1646730601787567e-05, 2.3584812879562378e-05, 2.552289515733719e-05, 2.7460977435112e-05, 2.939905971288681e-05, 3.133714199066162e-05, 3.327522426843643e-05, 3.521330654621124e-05, 3.7151388823986053e-05, 3.9089471101760864e-05, 4.1027553379535675e-05, 4.2965635657310486e-05, 4.49037179350853e-05, 4.684180021286011e-05, 4.877988249063492e-05, 5.071796476840973e-05, 5.265604704618454e-05, 5.459412932395935e-05, 5.653221160173416e-05, 5.847029387950897e-05, 6.040837615728378e-05, 6.23464584350586e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 13.0, 21.0, 22.0, 41.0, 65.0, 98.0, 202.0, 507.0, 1679.0, 7380.0, 62628.0, 898244.0, 67112.0, 7785.0, 1721.0, 497.0, 211.0, 101.0, 85.0, 37.0, 24.0, 24.0, 9.0, 5.0, 8.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24936294555664062, -0.24091339111328125, -0.23246383666992188, -0.2240142822265625, -0.21556472778320312, -0.20711517333984375, -0.19866561889648438, -0.190216064453125, -0.18176651000976562, -0.17331695556640625, -0.16486740112304688, -0.1564178466796875, -0.14796829223632812, -0.13951873779296875, -0.13106918334960938, -0.12261962890625, -0.11417007446289062, -0.10572052001953125, -0.09727096557617188, -0.0888214111328125, -0.08037185668945312, -0.07192230224609375, -0.06347274780273438, -0.055023193359375, -0.046573638916015625, -0.03812408447265625, -0.029674530029296875, -0.0212249755859375, -0.012775421142578125, -0.00432586669921875, 0.004123687744140625, 0.0125732421875, 0.021022796630859375, 0.02947235107421875, 0.037921905517578125, 0.0463714599609375, 0.054821014404296875, 0.06327056884765625, 0.07172012329101562, 0.080169677734375, 0.08861923217773438, 0.09706878662109375, 0.10551834106445312, 0.1139678955078125, 0.12241744995117188, 0.13086700439453125, 0.13931655883789062, 0.14776611328125, 0.15621566772460938, 0.16466522216796875, 0.17311477661132812, 0.1815643310546875, 0.19001388549804688, 0.19846343994140625, 0.20691299438476562, 0.215362548828125, 0.22381210327148438, 0.23226165771484375, 0.24071121215820312, 0.2491607666015625, 0.2576103210449219, 0.26605987548828125, 0.2745094299316406, 0.282958984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 11.0, 14.0, 12.0, 14.0, 29.0, 52.0, 126.0, 298.0, 203.0, 82.0, 34.0, 24.0, 20.0, 18.0, 10.0, 4.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.071533203125, -0.06973075866699219, -0.06792831420898438, -0.06612586975097656, -0.06432342529296875, -0.06252098083496094, -0.060718536376953125, -0.05891609191894531, -0.0571136474609375, -0.05531120300292969, -0.053508758544921875, -0.05170631408691406, -0.04990386962890625, -0.04810142517089844, -0.046298980712890625, -0.04449653625488281, -0.042694091796875, -0.04089164733886719, -0.039089202880859375, -0.03728675842285156, -0.03548431396484375, -0.03368186950683594, -0.031879425048828125, -0.030076980590820312, -0.0282745361328125, -0.026472091674804688, -0.024669647216796875, -0.022867202758789062, -0.02106475830078125, -0.019262313842773438, -0.017459869384765625, -0.015657424926757812, -0.01385498046875, -0.012052536010742188, -0.010250091552734375, -0.008447647094726562, -0.00664520263671875, -0.0048427581787109375, -0.003040313720703125, -0.0012378692626953125, 0.0005645751953125, 0.0023670196533203125, 0.004169464111328125, 0.0059719085693359375, 0.00777435302734375, 0.009576797485351562, 0.011379241943359375, 0.013181686401367188, 0.014984130859375, 0.016786575317382812, 0.018589019775390625, 0.020391464233398438, 0.02219390869140625, 0.023996353149414062, 0.025798797607421875, 0.027601242065429688, 0.0294036865234375, 0.031206130981445312, 0.033008575439453125, 0.03481101989746094, 0.03661346435546875, 0.03841590881347656, 0.040218353271484375, 0.04202079772949219, 0.0438232421875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 12.0, 22.0, 33.0, 39.0, 57.0, 66.0, 76.0, 97.0, 84.0, 92.0, 76.0, 84.0, 77.0, 53.0, 36.0, 32.0, 18.0, 10.0, 11.0, 6.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4458606243133545, -3.347395658493042, -3.2489306926727295, -3.150465726852417, -3.0520005226135254, -2.953535556793213, -2.8550705909729004, -2.756605625152588, -2.6581406593322754, -2.559675693511963, -2.4612107276916504, -2.362745761871338, -2.2642807960510254, -2.165815591812134, -2.0673506259918213, -1.9688856601715088, -1.8704206943511963, -1.7719557285308838, -1.6734907627105713, -1.5750256776809692, -1.4765607118606567, -1.3780957460403442, -1.2796306610107422, -1.1811656951904297, -1.0827007293701172, -0.9842357635498047, -0.8857707381248474, -0.7873057126998901, -0.6888407468795776, -0.5903757810592651, -0.49191075563430786, -0.3934457302093506, -0.2949807643890381, -0.1965157687664032, -0.09805077314376831, 0.00041422247886657715, 0.09887921810150146, 0.19734421372413635, 0.29580920934677124, 0.3942742347717285, 0.492739200592041, 0.5912041664123535, 0.6896691918373108, 0.7881342172622681, 0.8865991830825806, 0.9850641489028931, 1.0835292339324951, 1.1819941997528076, 1.2804591655731201, 1.3789241313934326, 1.4773890972137451, 1.5758541822433472, 1.6743191480636597, 1.7727841138839722, 1.8712491989135742, 1.9697141647338867, 2.068179130554199, 2.1666440963745117, 2.265109062194824, 2.3635740280151367, 2.462038993835449, 2.560504198074341, 2.6589691638946533, 2.757434129714966, 2.8558990955352783]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 4.0, 11.0, 10.0, 11.0, 15.0, 20.0, 25.0, 21.0, 22.0, 15.0, 23.0, 33.0, 36.0, 33.0, 52.0, 52.0, 47.0, 45.0, 40.0, 41.0, 36.0, 41.0, 38.0, 42.0, 37.0, 33.0, 26.0, 42.0, 14.0, 26.0, 27.0, 8.0, 14.0, 6.0, 8.0, 5.0, 8.0, 0.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.075538158416748, -2.012981653213501, -1.950425148010254, -1.8878685235977173, -1.8253120183944702, -1.7627555131912231, -1.7001988887786865, -1.6376423835754395, -1.5750858783721924, -1.5125293731689453, -1.4499728679656982, -1.3874162435531616, -1.3248597383499146, -1.2623032331466675, -1.1997466087341309, -1.1371901035308838, -1.0746335983276367, -1.0120770931243896, -0.9495205283164978, -0.886963963508606, -0.8244074583053589, -0.7618509531021118, -0.69929438829422, -0.6367378234863281, -0.574181318283081, -0.511624813079834, -0.44906824827194214, -0.3865117132663727, -0.3239551782608032, -0.26139864325523376, -0.1988421082496643, -0.13628557324409485, -0.07372915744781494, -0.011172622442245483, 0.051383912563323975, 0.11394044756889343, 0.1764969825744629, 0.23905351758003235, 0.3016100525856018, 0.36416658759117126, 0.4267231225967407, 0.4892796576023102, 0.5518361926078796, 0.6143927574157715, 0.6769492626190186, 0.7395057678222656, 0.8020623326301575, 0.8646188974380493, 0.9271754026412964, 0.9897319078445435, 1.05228853225708, 1.1148450374603271, 1.1774015426635742, 1.2399580478668213, 1.3025145530700684, 1.365071177482605, 1.427627682685852, 1.4901841878890991, 1.5527408123016357, 1.6152973175048828, 1.6778538227081299, 1.740410327911377, 1.802966833114624, 1.8655234575271606, 1.9280799627304077]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 14.0, 29.0, 35.0, 52.0, 87.0, 172.0, 254.0, 401.0, 835.0, 1591.0, 3217.0, 7048.0, 15984.0, 38859.0, 100265.0, 261850.0, 355543.0, 159474.0, 59233.0, 23927.0, 10249.0, 4706.0, 2214.0, 1120.0, 521.0, 307.0, 205.0, 128.0, 79.0, 46.0, 31.0, 12.0, 18.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.15985107421875, -2.0775146484375, -1.99517822265625, -1.912841796875, -1.83050537109375, -1.7481689453125, -1.66583251953125, -1.58349609375, -1.50115966796875, -1.4188232421875, -1.33648681640625, -1.254150390625, -1.17181396484375, -1.0894775390625, -1.00714111328125, -0.9248046875, -0.84246826171875, -0.7601318359375, -0.67779541015625, -0.595458984375, -0.51312255859375, -0.4307861328125, -0.34844970703125, -0.26611328125, -0.18377685546875, -0.1014404296875, -0.01910400390625, 0.063232421875, 0.14556884765625, 0.2279052734375, 0.31024169921875, 0.392578125, 0.47491455078125, 0.5572509765625, 0.63958740234375, 0.721923828125, 0.80426025390625, 0.8865966796875, 0.96893310546875, 1.05126953125, 1.13360595703125, 1.2159423828125, 1.29827880859375, 1.380615234375, 1.46295166015625, 1.5452880859375, 1.62762451171875, 1.7099609375, 1.79229736328125, 1.8746337890625, 1.95697021484375, 2.039306640625, 2.12164306640625, 2.2039794921875, 2.28631591796875, 2.36865234375, 2.45098876953125, 2.5333251953125, 2.61566162109375, 2.697998046875, 2.78033447265625, 2.8626708984375, 2.94500732421875, 3.02734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 10.0, 13.0, 10.0, 15.0, 13.0, 19.0, 20.0, 28.0, 23.0, 33.0, 31.0, 42.0, 48.0, 39.0, 57.0, 44.0, 41.0, 56.0, 44.0, 53.0, 32.0, 45.0, 35.0, 36.0, 30.0, 25.0, 28.0, 31.0, 8.0, 21.0, 7.0, 11.0, 7.0, 7.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.359375, -4.2303466796875, -4.101318359375, -3.9722900390625, -3.84326171875, -3.7142333984375, -3.585205078125, -3.4561767578125, -3.3271484375, -3.1981201171875, -3.069091796875, -2.9400634765625, -2.81103515625, -2.6820068359375, -2.552978515625, -2.4239501953125, -2.294921875, -2.1658935546875, -2.036865234375, -1.9078369140625, -1.77880859375, -1.6497802734375, -1.520751953125, -1.3917236328125, -1.2626953125, -1.1336669921875, -1.004638671875, -0.8756103515625, -0.74658203125, -0.6175537109375, -0.488525390625, -0.3594970703125, -0.23046875, -0.1014404296875, 0.027587890625, 0.1566162109375, 0.28564453125, 0.4146728515625, 0.543701171875, 0.6727294921875, 0.8017578125, 0.9307861328125, 1.059814453125, 1.1888427734375, 1.31787109375, 1.4468994140625, 1.575927734375, 1.7049560546875, 1.833984375, 1.9630126953125, 2.092041015625, 2.2210693359375, 2.35009765625, 2.4791259765625, 2.608154296875, 2.7371826171875, 2.8662109375, 2.9952392578125, 3.124267578125, 3.2532958984375, 3.38232421875, 3.5113525390625, 3.640380859375, 3.7694091796875, 3.8984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 0.0, 3.0, 8.0, 4.0, 8.0, 12.0, 6.0, 19.0, 23.0, 28.0, 44.0, 64.0, 95.0, 149.0, 233.0, 451.0, 1028.0, 4194.0, 25928.0, 280746.0, 653690.0, 70054.0, 8559.0, 1747.0, 622.0, 313.0, 159.0, 109.0, 73.0, 63.0, 37.0, 34.0, 10.0, 10.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9547119140625, -6.745361328125, -6.5360107421875, -6.32666015625, -6.1173095703125, -5.907958984375, -5.6986083984375, -5.4892578125, -5.2799072265625, -5.070556640625, -4.8612060546875, -4.65185546875, -4.4425048828125, -4.233154296875, -4.0238037109375, -3.814453125, -3.6051025390625, -3.395751953125, -3.1864013671875, -2.97705078125, -2.7677001953125, -2.558349609375, -2.3489990234375, -2.1396484375, -1.9302978515625, -1.720947265625, -1.5115966796875, -1.30224609375, -1.0928955078125, -0.883544921875, -0.6741943359375, -0.46484375, -0.2554931640625, -0.046142578125, 0.1632080078125, 0.37255859375, 0.5819091796875, 0.791259765625, 1.0006103515625, 1.2099609375, 1.4193115234375, 1.628662109375, 1.8380126953125, 2.04736328125, 2.2567138671875, 2.466064453125, 2.6754150390625, 2.884765625, 3.0941162109375, 3.303466796875, 3.5128173828125, 3.72216796875, 3.9315185546875, 4.140869140625, 4.3502197265625, 4.5595703125, 4.7689208984375, 4.978271484375, 5.1876220703125, 5.39697265625, 5.6063232421875, 5.815673828125, 6.0250244140625, 6.234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 5.0, 9.0, 14.0, 18.0, 27.0, 14.0, 34.0, 33.0, 32.0, 46.0, 45.0, 47.0, 51.0, 46.0, 46.0, 67.0, 56.0, 39.0, 49.0, 53.0, 37.0, 30.0, 34.0, 23.0, 28.0, 20.0, 18.0, 16.0, 7.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.73046875, -5.5633544921875, -5.396240234375, -5.2291259765625, -5.06201171875, -4.8948974609375, -4.727783203125, -4.5606689453125, -4.3935546875, -4.2264404296875, -4.059326171875, -3.8922119140625, -3.72509765625, -3.5579833984375, -3.390869140625, -3.2237548828125, -3.056640625, -2.8895263671875, -2.722412109375, -2.5552978515625, -2.38818359375, -2.2210693359375, -2.053955078125, -1.8868408203125, -1.7197265625, -1.5526123046875, -1.385498046875, -1.2183837890625, -1.05126953125, -0.8841552734375, -0.717041015625, -0.5499267578125, -0.3828125, -0.2156982421875, -0.048583984375, 0.1185302734375, 0.28564453125, 0.4527587890625, 0.619873046875, 0.7869873046875, 0.9541015625, 1.1212158203125, 1.288330078125, 1.4554443359375, 1.62255859375, 1.7896728515625, 1.956787109375, 2.1239013671875, 2.291015625, 2.4581298828125, 2.625244140625, 2.7923583984375, 2.95947265625, 3.1265869140625, 3.293701171875, 3.4608154296875, 3.6279296875, 3.7950439453125, 3.962158203125, 4.1292724609375, 4.29638671875, 4.4635009765625, 4.630615234375, 4.7977294921875, 4.96484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 11.0, 13.0, 15.0, 25.0, 41.0, 60.0, 67.0, 121.0, 201.0, 414.0, 865.0, 2432.0, 8762.0, 45218.0, 308825.0, 579359.0, 81922.0, 14249.0, 3576.0, 1196.0, 486.0, 252.0, 146.0, 77.0, 52.0, 50.0, 20.0, 26.0, 8.0, 11.0, 7.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4482421875, -1.401763916015625, -1.35528564453125, -1.308807373046875, -1.2623291015625, -1.215850830078125, -1.16937255859375, -1.122894287109375, -1.076416015625, -1.029937744140625, -0.98345947265625, -0.936981201171875, -0.8905029296875, -0.844024658203125, -0.79754638671875, -0.751068115234375, -0.70458984375, -0.658111572265625, -0.61163330078125, -0.565155029296875, -0.5186767578125, -0.472198486328125, -0.42572021484375, -0.379241943359375, -0.332763671875, -0.286285400390625, -0.23980712890625, -0.193328857421875, -0.1468505859375, -0.100372314453125, -0.05389404296875, -0.007415771484375, 0.0390625, 0.085540771484375, 0.13201904296875, 0.178497314453125, 0.2249755859375, 0.271453857421875, 0.31793212890625, 0.364410400390625, 0.410888671875, 0.457366943359375, 0.50384521484375, 0.550323486328125, 0.5968017578125, 0.643280029296875, 0.68975830078125, 0.736236572265625, 0.78271484375, 0.829193115234375, 0.87567138671875, 0.922149658203125, 0.9686279296875, 1.015106201171875, 1.06158447265625, 1.108062744140625, 1.154541015625, 1.201019287109375, 1.24749755859375, 1.293975830078125, 1.3404541015625, 1.386932373046875, 1.43341064453125, 1.479888916015625, 1.5263671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 13.0, 8.0, 12.0, 15.0, 25.0, 22.0, 24.0, 47.0, 38.0, 79.0, 85.0, 145.0, 120.0, 93.0, 62.0, 52.0, 54.0, 22.0, 19.0, 12.0, 14.0, 14.0, 8.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002155303955078125, -0.00020856782793998718, -0.00020160526037216187, -0.00019464269280433655, -0.00018768012523651123, -0.0001807175576686859, -0.0001737549901008606, -0.00016679242253303528, -0.00015982985496520996, -0.00015286728739738464, -0.00014590471982955933, -0.000138942152261734, -0.0001319795846939087, -0.00012501701712608337, -0.00011805444955825806, -0.00011109188199043274, -0.00010412931442260742, -9.71667468547821e-05, -9.020417928695679e-05, -8.324161171913147e-05, -7.627904415130615e-05, -6.931647658348083e-05, -6.235390901565552e-05, -5.53913414478302e-05, -4.842877388000488e-05, -4.1466206312179565e-05, -3.450363874435425e-05, -2.754107117652893e-05, -2.0578503608703613e-05, -1.3615936040878296e-05, -6.6533684730529785e-06, 3.0919909477233887e-07, 7.271766662597656e-06, 1.4234334230422974e-05, 2.119690179824829e-05, 2.815946936607361e-05, 3.5122036933898926e-05, 4.208460450172424e-05, 4.904717206954956e-05, 5.600973963737488e-05, 6.29723072052002e-05, 6.993487477302551e-05, 7.689744234085083e-05, 8.386000990867615e-05, 9.082257747650146e-05, 9.778514504432678e-05, 0.0001047477126121521, 0.00011171028017997742, 0.00011867284774780273, 0.00012563541531562805, 0.00013259798288345337, 0.0001395605504512787, 0.000146523118019104, 0.00015348568558692932, 0.00016044825315475464, 0.00016741082072257996, 0.00017437338829040527, 0.0001813359558582306, 0.0001882985234260559, 0.00019526109099388123, 0.00020222365856170654, 0.00020918622612953186, 0.00021614879369735718, 0.0002231113612651825, 0.0002300739288330078]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 5.0, 9.0, 12.0, 18.0, 47.0, 130.0, 334.0, 993.0, 3478.0, 29913.0, 824559.0, 178200.0, 8203.0, 1760.0, 562.0, 177.0, 69.0, 32.0, 18.0, 13.0, 3.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8690185546875, -2.757568359375, -2.6461181640625, -2.53466796875, -2.4232177734375, -2.311767578125, -2.2003173828125, -2.0888671875, -1.9774169921875, -1.865966796875, -1.7545166015625, -1.64306640625, -1.5316162109375, -1.420166015625, -1.3087158203125, -1.197265625, -1.0858154296875, -0.974365234375, -0.8629150390625, -0.75146484375, -0.6400146484375, -0.528564453125, -0.4171142578125, -0.3056640625, -0.1942138671875, -0.082763671875, 0.0286865234375, 0.14013671875, 0.2515869140625, 0.363037109375, 0.4744873046875, 0.5859375, 0.6973876953125, 0.808837890625, 0.9202880859375, 1.03173828125, 1.1431884765625, 1.254638671875, 1.3660888671875, 1.4775390625, 1.5889892578125, 1.700439453125, 1.8118896484375, 1.92333984375, 2.0347900390625, 2.146240234375, 2.2576904296875, 2.369140625, 2.4805908203125, 2.592041015625, 2.7034912109375, 2.81494140625, 2.9263916015625, 3.037841796875, 3.1492919921875, 3.2607421875, 3.3721923828125, 3.483642578125, 3.5950927734375, 3.70654296875, 3.8179931640625, 3.929443359375, 4.0408935546875, 4.15234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 23.0, 30.0, 54.0, 61.0, 91.0, 153.0, 180.0, 142.0, 82.0, 52.0, 41.0, 31.0, 21.0, 8.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.388671875, -1.3550262451171875, -1.321380615234375, -1.2877349853515625, -1.25408935546875, -1.2204437255859375, -1.186798095703125, -1.1531524658203125, -1.1195068359375, -1.0858612060546875, -1.052215576171875, -1.0185699462890625, -0.98492431640625, -0.9512786865234375, -0.917633056640625, -0.8839874267578125, -0.850341796875, -0.8166961669921875, -0.783050537109375, -0.7494049072265625, -0.71575927734375, -0.6821136474609375, -0.648468017578125, -0.6148223876953125, -0.5811767578125, -0.5475311279296875, -0.513885498046875, -0.4802398681640625, -0.44659423828125, -0.4129486083984375, -0.379302978515625, -0.3456573486328125, -0.31201171875, -0.2783660888671875, -0.244720458984375, -0.2110748291015625, -0.17742919921875, -0.1437835693359375, -0.110137939453125, -0.0764923095703125, -0.0428466796875, -0.0092010498046875, 0.024444580078125, 0.0580902099609375, 0.09173583984375, 0.1253814697265625, 0.159027099609375, 0.1926727294921875, 0.226318359375, 0.2599639892578125, 0.293609619140625, 0.3272552490234375, 0.36090087890625, 0.3945465087890625, 0.428192138671875, 0.4618377685546875, 0.4954833984375, 0.5291290283203125, 0.562774658203125, 0.5964202880859375, 0.63006591796875, 0.6637115478515625, 0.697357177734375, 0.7310028076171875, 0.7646484375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 17.0, 35.0, 72.0, 120.0, 182.0, 193.0, 150.0, 124.0, 60.0, 25.0, 8.0, 14.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.594183921813965, -9.166465759277344, -8.738748550415039, -8.311030387878418, -7.883312225341797, -7.455594062805176, -7.027876377105713, -6.60015869140625, -6.172440528869629, -5.744722366333008, -5.317004680633545, -4.889286994934082, -4.461568832397461, -4.03385066986084, -3.606132984161377, -3.178415060043335, -2.750697135925293, -2.322979211807251, -1.895261287689209, -1.467543363571167, -1.039825439453125, -0.612107515335083, -0.18438959121704102, 0.24332833290100098, 0.671046257019043, 1.098764181137085, 1.526482105255127, 1.954200029373169, 2.381917953491211, 2.809635877609253, 3.237353801727295, 3.665071725845337, 4.0927886962890625, 4.520506858825684, 4.9482245445251465, 5.375942230224609, 5.8036603927612305, 6.231378555297852, 6.6590962409973145, 7.086813926696777, 7.514532089233398, 7.9422502517700195, 8.36996841430664, 8.797685623168945, 9.225403785705566, 9.653121948242188, 10.080839157104492, 10.508557319641113, 10.936275482177734, 11.363993644714355, 11.791711807250977, 12.219429016113281, 12.647147178649902, 13.074865341186523, 13.502582550048828, 13.93030071258545, 14.35801887512207, 14.785737037658691, 15.213455200195312, 15.641172409057617, 16.068889617919922, 16.49660873413086, 16.924325942993164, 17.3520450592041, 17.779762268066406]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 10.0, 10.0, 16.0, 16.0, 18.0, 27.0, 19.0, 26.0, 20.0, 31.0, 24.0, 34.0, 39.0, 42.0, 45.0, 51.0, 34.0, 57.0, 38.0, 44.0, 44.0, 41.0, 28.0, 34.0, 33.0, 21.0, 32.0, 26.0, 17.0, 21.0, 11.0, 15.0, 7.0, 5.0, 9.0, 5.0, 7.0, 4.0, 1.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.976343631744385, -6.751397609710693, -6.526451587677002, -6.301505088806152, -6.076559066772461, -5.8516130447387695, -5.626667022705078, -5.401721000671387, -5.176774978637695, -4.951828956604004, -4.7268829345703125, -4.501936912536621, -4.2769904136657715, -4.05204439163208, -3.8270983695983887, -3.6021523475646973, -3.3772060871124268, -3.1522600650787354, -2.927313804626465, -2.7023677825927734, -2.477421760559082, -2.2524757385253906, -2.02752947807312, -1.8025834560394287, -1.5776373147964478, -1.3526911735534668, -1.1277451515197754, -0.9027990102767944, -0.6778529286384583, -0.45290684700012207, -0.2279607057571411, -0.003014683723449707, 0.22193145751953125, 0.44687753915786743, 0.6718236207962036, 0.8967697620391846, 1.121715784072876, 1.346661925315857, 1.571608066558838, 1.7965540885925293, 2.0215001106262207, 2.246446132659912, 2.4713923931121826, 2.696338415145874, 2.9212844371795654, 3.146230697631836, 3.3711767196655273, 3.5961227416992188, 3.8210690021514893, 4.04601526260376, 4.270961284637451, 4.495907306671143, 4.720853328704834, 4.945799350738525, 5.170745849609375, 5.395691871643066, 5.620637893676758, 5.845583915710449, 6.070529937744141, 6.295475959777832, 6.520422458648682, 6.745368480682373, 6.9703145027160645, 7.195260524749756, 7.420206546783447]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 13.0, 18.0, 19.0, 18.0, 30.0, 28.0, 61.0, 60.0, 98.0, 105.0, 154.0, 186.0, 284.0, 478.0, 904.0, 2167.0, 7810.0, 62446.0, 1293664.0, 2620416.0, 184603.0, 14551.0, 3201.0, 1157.0, 596.0, 318.0, 211.0, 168.0, 105.0, 96.0, 72.0, 50.0, 39.0, 38.0, 22.0, 19.0, 20.0, 12.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.046875, -5.85296630859375, -5.6590576171875, -5.46514892578125, -5.271240234375, -5.07733154296875, -4.8834228515625, -4.68951416015625, -4.49560546875, -4.30169677734375, -4.1077880859375, -3.91387939453125, -3.719970703125, -3.52606201171875, -3.3321533203125, -3.13824462890625, -2.9443359375, -2.75042724609375, -2.5565185546875, -2.36260986328125, -2.168701171875, -1.97479248046875, -1.7808837890625, -1.58697509765625, -1.39306640625, -1.19915771484375, -1.0052490234375, -0.81134033203125, -0.617431640625, -0.42352294921875, -0.2296142578125, -0.03570556640625, 0.158203125, 0.35211181640625, 0.5460205078125, 0.73992919921875, 0.933837890625, 1.12774658203125, 1.3216552734375, 1.51556396484375, 1.70947265625, 1.90338134765625, 2.0972900390625, 2.29119873046875, 2.485107421875, 2.67901611328125, 2.8729248046875, 3.06683349609375, 3.2607421875, 3.45465087890625, 3.6485595703125, 3.84246826171875, 4.036376953125, 4.23028564453125, 4.4241943359375, 4.61810302734375, 4.81201171875, 5.00592041015625, 5.1998291015625, 5.39373779296875, 5.587646484375, 5.78155517578125, 5.9754638671875, 6.16937255859375, 6.36328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 10.0, 11.0, 14.0, 19.0, 25.0, 21.0, 29.0, 26.0, 28.0, 30.0, 36.0, 27.0, 23.0, 38.0, 39.0, 56.0, 45.0, 48.0, 41.0, 46.0, 38.0, 37.0, 39.0, 33.0, 27.0, 33.0, 26.0, 26.0, 14.0, 15.0, 12.0, 15.0, 10.0, 5.0, 12.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.212738037109375, -2.13836669921875, -2.063995361328125, -1.9896240234375, -1.915252685546875, -1.84088134765625, -1.766510009765625, -1.692138671875, -1.617767333984375, -1.54339599609375, -1.469024658203125, -1.3946533203125, -1.320281982421875, -1.24591064453125, -1.171539306640625, -1.09716796875, -1.022796630859375, -0.94842529296875, -0.874053955078125, -0.7996826171875, -0.725311279296875, -0.65093994140625, -0.576568603515625, -0.502197265625, -0.427825927734375, -0.35345458984375, -0.279083251953125, -0.2047119140625, -0.130340576171875, -0.05596923828125, 0.018402099609375, 0.0927734375, 0.167144775390625, 0.24151611328125, 0.315887451171875, 0.3902587890625, 0.464630126953125, 0.53900146484375, 0.613372802734375, 0.687744140625, 0.762115478515625, 0.83648681640625, 0.910858154296875, 0.9852294921875, 1.059600830078125, 1.13397216796875, 1.208343505859375, 1.28271484375, 1.357086181640625, 1.43145751953125, 1.505828857421875, 1.5802001953125, 1.654571533203125, 1.72894287109375, 1.803314208984375, 1.877685546875, 1.952056884765625, 2.02642822265625, 2.100799560546875, 2.1751708984375, 2.249542236328125, 2.32391357421875, 2.398284912109375, 2.47265625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 6.0, 11.0, 18.0, 22.0, 41.0, 68.0, 157.0, 382.0, 1034.0, 4263.0, 64106.0, 3976602.0, 139772.0, 5658.0, 1323.0, 432.0, 196.0, 80.0, 32.0, 27.0, 12.0, 13.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.325439453125, -11.97900390625, -11.632568359375, -11.2861328125, -10.939697265625, -10.59326171875, -10.246826171875, -9.900390625, -9.553955078125, -9.20751953125, -8.861083984375, -8.5146484375, -8.168212890625, -7.82177734375, -7.475341796875, -7.12890625, -6.782470703125, -6.43603515625, -6.089599609375, -5.7431640625, -5.396728515625, -5.05029296875, -4.703857421875, -4.357421875, -4.010986328125, -3.66455078125, -3.318115234375, -2.9716796875, -2.625244140625, -2.27880859375, -1.932373046875, -1.5859375, -1.239501953125, -0.89306640625, -0.546630859375, -0.2001953125, 0.146240234375, 0.49267578125, 0.839111328125, 1.185546875, 1.531982421875, 1.87841796875, 2.224853515625, 2.5712890625, 2.917724609375, 3.26416015625, 3.610595703125, 3.95703125, 4.303466796875, 4.64990234375, 4.996337890625, 5.3427734375, 5.689208984375, 6.03564453125, 6.382080078125, 6.728515625, 7.074951171875, 7.42138671875, 7.767822265625, 8.1142578125, 8.460693359375, 8.80712890625, 9.153564453125, 9.5]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 14.0, 11.0, 17.0, 23.0, 36.0, 74.0, 73.0, 136.0, 215.0, 339.0, 484.0, 562.0, 556.0, 476.0, 374.0, 233.0, 137.0, 96.0, 80.0, 40.0, 31.0, 16.0, 16.0, 8.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.91015625, -1.860107421875, -1.81005859375, -1.760009765625, -1.7099609375, -1.659912109375, -1.60986328125, -1.559814453125, -1.509765625, -1.459716796875, -1.40966796875, -1.359619140625, -1.3095703125, -1.259521484375, -1.20947265625, -1.159423828125, -1.109375, -1.059326171875, -1.00927734375, -0.959228515625, -0.9091796875, -0.859130859375, -0.80908203125, -0.759033203125, -0.708984375, -0.658935546875, -0.60888671875, -0.558837890625, -0.5087890625, -0.458740234375, -0.40869140625, -0.358642578125, -0.30859375, -0.258544921875, -0.20849609375, -0.158447265625, -0.1083984375, -0.058349609375, -0.00830078125, 0.041748046875, 0.091796875, 0.141845703125, 0.19189453125, 0.241943359375, 0.2919921875, 0.342041015625, 0.39208984375, 0.442138671875, 0.4921875, 0.542236328125, 0.59228515625, 0.642333984375, 0.6923828125, 0.742431640625, 0.79248046875, 0.842529296875, 0.892578125, 0.942626953125, 0.99267578125, 1.042724609375, 1.0927734375, 1.142822265625, 1.19287109375, 1.242919921875, 1.29296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 7.0, 9.0, 5.0, 7.0, 7.0, 11.0, 10.0, 21.0, 18.0, 16.0, 16.0, 28.0, 20.0, 27.0, 37.0, 23.0, 45.0, 35.0, 30.0, 38.0, 34.0, 26.0, 54.0, 35.0, 40.0, 50.0, 31.0, 31.0, 33.0, 30.0, 21.0, 29.0, 22.0, 19.0, 15.0, 23.0, 15.0, 17.0, 7.0, 10.0, 8.0, 9.0, 7.0, 6.0, 1.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.0933501720428467, -2.023475170135498, -1.9536001682281494, -1.8837251663208008, -1.8138502836227417, -1.743975281715393, -1.6741002798080444, -1.6042252779006958, -1.5343503952026367, -1.464475393295288, -1.3946003913879395, -1.3247253894805908, -1.2548505067825317, -1.184975504875183, -1.1151005029678345, -1.0452255010604858, -0.9753504991531372, -0.9054754972457886, -0.8356005549430847, -0.7657255530357361, -0.6958506107330322, -0.6259756088256836, -0.556100606918335, -0.4862256348133087, -0.41635066270828247, -0.3464756906032562, -0.27660071849823, -0.20672571659088135, -0.1368507444858551, -0.06697577238082886, 0.0028992295265197754, 0.07277420163154602, 0.14264917373657227, 0.2125241458415985, 0.28239911794662476, 0.3522741198539734, 0.42214909195899963, 0.4920240640640259, 0.5618990659713745, 0.6317740678787231, 0.701649010181427, 0.7715240120887756, 0.8413989543914795, 0.9112739562988281, 0.9811489582061768, 1.0510239601135254, 1.120898962020874, 1.190773844718933, 1.2606488466262817, 1.3305238485336304, 1.400398850440979, 1.470273733139038, 1.5401487350463867, 1.6100237369537354, 1.679898738861084, 1.7497737407684326, 1.8196487426757812, 1.8895237445831299, 1.9593987464904785, 2.029273748397827, 2.099148750305176, 2.1690235137939453, 2.238898754119873, 2.3087735176086426, 2.378648519515991]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 10.0, 6.0, 8.0, 9.0, 20.0, 9.0, 17.0, 19.0, 19.0, 19.0, 33.0, 25.0, 31.0, 36.0, 31.0, 39.0, 35.0, 41.0, 46.0, 45.0, 39.0, 41.0, 42.0, 29.0, 45.0, 40.0, 28.0, 35.0, 27.0, 26.0, 18.0, 23.0, 25.0, 18.0, 12.0, 16.0, 8.0, 6.0, 4.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9165236949920654, -2.8275294303894043, -2.738535165786743, -2.649540901184082, -2.560546636581421, -2.4715523719787598, -2.3825583457946777, -2.2935640811920166, -2.2045698165893555, -2.1155755519866943, -2.026581287384033, -1.937587022781372, -1.8485928773880005, -1.7595986127853394, -1.6706043481826782, -1.5816102027893066, -1.492615818977356, -1.4036215543746948, -1.3146272897720337, -1.225633144378662, -1.136638879776001, -1.0476446151733398, -0.9586503505706787, -0.8696561455726624, -0.7806618809700012, -0.6916676163673401, -0.6026734113693237, -0.5136791467666626, -0.42468491196632385, -0.3356906771659851, -0.24669641256332397, -0.15770220756530762, -0.06870794296264648, 0.020286299288272858, 0.1092805415391922, 0.19827479124069214, 0.2872690260410309, 0.37626326084136963, 0.46525752544403076, 0.5542517304420471, 0.6432459950447083, 0.7322402596473694, 0.8212344646453857, 0.9102287292480469, 0.999222993850708, 1.0882172584533691, 1.1772115230560303, 1.2662056684494019, 1.355199933052063, 1.4441941976547241, 1.5331884622573853, 1.6221826076507568, 1.711176872253418, 1.800171136856079, 1.8891654014587402, 1.9781596660614014, 2.0671539306640625, 2.1561481952667236, 2.2451424598693848, 2.334136724472046, 2.423130989074707, 2.512125015258789, 2.6011195182800293, 2.6901135444641113, 2.7791078090667725]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 9.0, 10.0, 9.0, 18.0, 20.0, 34.0, 39.0, 51.0, 76.0, 108.0, 113.0, 151.0, 231.0, 332.0, 444.0, 656.0, 1378.0, 4955.0, 45721.0, 433937.0, 493845.0, 56701.0, 5870.0, 1411.0, 743.0, 467.0, 320.0, 221.0, 167.0, 109.0, 96.0, 82.0, 52.0, 40.0, 30.0, 20.0, 19.0, 18.0, 9.0, 12.0, 12.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.078643798828125, -1.04498291015625, -1.011322021484375, -0.9776611328125, -0.944000244140625, -0.91033935546875, -0.876678466796875, -0.843017578125, -0.809356689453125, -0.77569580078125, -0.742034912109375, -0.7083740234375, -0.674713134765625, -0.64105224609375, -0.607391357421875, -0.57373046875, -0.540069580078125, -0.50640869140625, -0.472747802734375, -0.4390869140625, -0.405426025390625, -0.37176513671875, -0.338104248046875, -0.304443359375, -0.270782470703125, -0.23712158203125, -0.203460693359375, -0.1697998046875, -0.136138916015625, -0.10247802734375, -0.068817138671875, -0.03515625, -0.001495361328125, 0.03216552734375, 0.065826416015625, 0.0994873046875, 0.133148193359375, 0.16680908203125, 0.200469970703125, 0.234130859375, 0.267791748046875, 0.30145263671875, 0.335113525390625, 0.3687744140625, 0.402435302734375, 0.43609619140625, 0.469757080078125, 0.50341796875, 0.537078857421875, 0.57073974609375, 0.604400634765625, 0.6380615234375, 0.671722412109375, 0.70538330078125, 0.739044189453125, 0.772705078125, 0.806365966796875, 0.84002685546875, 0.873687744140625, 0.9073486328125, 0.941009521484375, 0.97467041015625, 1.008331298828125, 1.0419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 8.0, 8.0, 11.0, 6.0, 10.0, 15.0, 11.0, 12.0, 9.0, 14.0, 29.0, 27.0, 27.0, 26.0, 31.0, 44.0, 31.0, 34.0, 38.0, 43.0, 44.0, 39.0, 43.0, 43.0, 44.0, 38.0, 26.0, 27.0, 37.0, 24.0, 30.0, 31.0, 30.0, 18.0, 20.0, 18.0, 10.0, 9.0, 12.0, 8.0, 6.0, 4.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.798828125, -1.741485595703125, -1.68414306640625, -1.626800537109375, -1.5694580078125, -1.512115478515625, -1.45477294921875, -1.397430419921875, -1.340087890625, -1.282745361328125, -1.22540283203125, -1.168060302734375, -1.1107177734375, -1.053375244140625, -0.99603271484375, -0.938690185546875, -0.88134765625, -0.824005126953125, -0.76666259765625, -0.709320068359375, -0.6519775390625, -0.594635009765625, -0.53729248046875, -0.479949951171875, -0.422607421875, -0.365264892578125, -0.30792236328125, -0.250579833984375, -0.1932373046875, -0.135894775390625, -0.07855224609375, -0.021209716796875, 0.0361328125, 0.093475341796875, 0.15081787109375, 0.208160400390625, 0.2655029296875, 0.322845458984375, 0.38018798828125, 0.437530517578125, 0.494873046875, 0.552215576171875, 0.60955810546875, 0.666900634765625, 0.7242431640625, 0.781585693359375, 0.83892822265625, 0.896270751953125, 0.95361328125, 1.010955810546875, 1.06829833984375, 1.125640869140625, 1.1829833984375, 1.240325927734375, 1.29766845703125, 1.355010986328125, 1.412353515625, 1.469696044921875, 1.52703857421875, 1.584381103515625, 1.6417236328125, 1.699066162109375, 1.75640869140625, 1.813751220703125, 1.87109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 13.0, 11.0, 28.0, 30.0, 38.0, 67.0, 122.0, 217.0, 359.0, 630.0, 1178.0, 2118.0, 3801.0, 7072.0, 12673.0, 22808.0, 40823.0, 70476.0, 113660.0, 161513.0, 184121.0, 158634.0, 110589.0, 68758.0, 39339.0, 22102.0, 12159.0, 6785.0, 3725.0, 2026.0, 1143.0, 633.0, 366.0, 197.0, 121.0, 76.0, 41.0, 36.0, 20.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.2165088653564453, -0.20962905883789062, -0.20274925231933594, -0.19586944580078125, -0.18898963928222656, -0.18210983276367188, -0.1752300262451172, -0.1683502197265625, -0.1614704132080078, -0.15459060668945312, -0.14771080017089844, -0.14083099365234375, -0.13395118713378906, -0.12707138061523438, -0.12019157409667969, -0.113311767578125, -0.10643196105957031, -0.09955215454101562, -0.09267234802246094, -0.08579254150390625, -0.07891273498535156, -0.07203292846679688, -0.06515312194824219, -0.0582733154296875, -0.05139350891113281, -0.044513702392578125, -0.03763389587402344, -0.03075408935546875, -0.023874282836914062, -0.016994476318359375, -0.010114669799804688, -0.00323486328125, 0.0036449432373046875, 0.010524749755859375, 0.017404556274414062, 0.02428436279296875, 0.031164169311523438, 0.038043975830078125, 0.04492378234863281, 0.0518035888671875, 0.05868339538574219, 0.06556320190429688, 0.07244300842285156, 0.07932281494140625, 0.08620262145996094, 0.09308242797851562, 0.09996223449707031, 0.106842041015625, 0.11372184753417969, 0.12060165405273438, 0.12748146057128906, 0.13436126708984375, 0.14124107360839844, 0.14812088012695312, 0.1550006866455078, 0.1618804931640625, 0.1687602996826172, 0.17564010620117188, 0.18251991271972656, 0.18939971923828125, 0.19627952575683594, 0.20315933227539062, 0.2100391387939453, 0.2169189453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 15.0, 13.0, 11.0, 14.0, 15.0, 20.0, 18.0, 37.0, 27.0, 32.0, 36.0, 42.0, 37.0, 40.0, 65.0, 45.0, 39.0, 32.0, 43.0, 42.0, 40.0, 31.0, 41.0, 24.0, 31.0, 27.0, 18.0, 27.0, 21.0, 17.0, 17.0, 9.0, 9.0, 9.0, 4.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.67926025390625, -4.5343017578125, -4.38934326171875, -4.244384765625, -4.09942626953125, -3.9544677734375, -3.80950927734375, -3.66455078125, -3.51959228515625, -3.3746337890625, -3.22967529296875, -3.084716796875, -2.93975830078125, -2.7947998046875, -2.64984130859375, -2.5048828125, -2.35992431640625, -2.2149658203125, -2.07000732421875, -1.925048828125, -1.78009033203125, -1.6351318359375, -1.49017333984375, -1.34521484375, -1.20025634765625, -1.0552978515625, -0.91033935546875, -0.765380859375, -0.62042236328125, -0.4754638671875, -0.33050537109375, -0.185546875, -0.04058837890625, 0.1043701171875, 0.24932861328125, 0.394287109375, 0.53924560546875, 0.6842041015625, 0.82916259765625, 0.97412109375, 1.11907958984375, 1.2640380859375, 1.40899658203125, 1.553955078125, 1.69891357421875, 1.8438720703125, 1.98883056640625, 2.1337890625, 2.27874755859375, 2.4237060546875, 2.56866455078125, 2.713623046875, 2.85858154296875, 3.0035400390625, 3.14849853515625, 3.29345703125, 3.43841552734375, 3.5833740234375, 3.72833251953125, 3.873291015625, 4.01824951171875, 4.1632080078125, 4.30816650390625, 4.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 13.0, 22.0, 23.0, 48.0, 84.0, 72.0, 187.0, 238.0, 401.0, 746.0, 1557.0, 4255.0, 19083.0, 202596.0, 737334.0, 66700.0, 9524.0, 2923.0, 1186.0, 596.0, 339.0, 214.0, 121.0, 73.0, 58.0, 51.0, 27.0, 15.0, 15.0, 15.0, 11.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2429656982421875, -0.235443115234375, -0.2279205322265625, -0.22039794921875, -0.2128753662109375, -0.205352783203125, -0.1978302001953125, -0.1903076171875, -0.1827850341796875, -0.175262451171875, -0.1677398681640625, -0.16021728515625, -0.1526947021484375, -0.145172119140625, -0.1376495361328125, -0.130126953125, -0.1226043701171875, -0.115081787109375, -0.1075592041015625, -0.10003662109375, -0.0925140380859375, -0.084991455078125, -0.0774688720703125, -0.0699462890625, -0.0624237060546875, -0.054901123046875, -0.0473785400390625, -0.03985595703125, -0.0323333740234375, -0.024810791015625, -0.0172882080078125, -0.009765625, -0.0022430419921875, 0.005279541015625, 0.0128021240234375, 0.02032470703125, 0.0278472900390625, 0.035369873046875, 0.0428924560546875, 0.0504150390625, 0.0579376220703125, 0.065460205078125, 0.0729827880859375, 0.08050537109375, 0.0880279541015625, 0.095550537109375, 0.1030731201171875, 0.110595703125, 0.1181182861328125, 0.125640869140625, 0.1331634521484375, 0.14068603515625, 0.1482086181640625, 0.155731201171875, 0.1632537841796875, 0.1707763671875, 0.1782989501953125, 0.185821533203125, 0.1933441162109375, 0.20086669921875, 0.2083892822265625, 0.215911865234375, 0.2234344482421875, 0.23095703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 17.0, 27.0, 37.0, 56.0, 80.0, 109.0, 142.0, 144.0, 118.0, 88.0, 60.0, 42.0, 25.0, 16.0, 13.0, 8.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -6.923172622919083e-05, -6.580539047718048e-05, -6.237905472517014e-05, -5.895271897315979e-05, -5.5526383221149445e-05, -5.21000474691391e-05, -4.8673711717128754e-05, -4.524737596511841e-05, -4.182104021310806e-05, -3.839470446109772e-05, -3.496836870908737e-05, -3.1542032957077026e-05, -2.811569720506668e-05, -2.4689361453056335e-05, -2.126302570104599e-05, -1.7836689949035645e-05, -1.4410354197025299e-05, -1.0984018445014954e-05, -7.557682693004608e-06, -4.131346940994263e-06, -7.050111889839172e-07, 2.7213245630264282e-06, 6.147660315036774e-06, 9.573996067047119e-06, 1.3000331819057465e-05, 1.642666757106781e-05, 1.9853003323078156e-05, 2.32793390750885e-05, 2.6705674827098846e-05, 3.0132010579109192e-05, 3.355834633111954e-05, 3.698468208312988e-05, 4.041101783514023e-05, 4.3837353587150574e-05, 4.726368933916092e-05, 5.0690025091171265e-05, 5.411636084318161e-05, 5.7542696595191956e-05, 6.09690323472023e-05, 6.439536809921265e-05, 6.782170385122299e-05, 7.124803960323334e-05, 7.467437535524368e-05, 7.810071110725403e-05, 8.152704685926437e-05, 8.495338261127472e-05, 8.837971836328506e-05, 9.180605411529541e-05, 9.523238986730576e-05, 9.86587256193161e-05, 0.00010208506137132645, 0.00010551139712333679, 0.00010893773287534714, 0.00011236406862735748, 0.00011579040437936783, 0.00011921674013137817, 0.00012264307588338852, 0.00012606941163539886, 0.0001294957473874092, 0.00013292208313941956, 0.0001363484188914299, 0.00013977475464344025, 0.0001432010903954506, 0.00014662742614746094]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 9.0, 5.0, 6.0, 7.0, 7.0, 18.0, 21.0, 30.0, 55.0, 57.0, 115.0, 193.0, 242.0, 390.0, 689.0, 1140.0, 1895.0, 3168.0, 5670.0, 10209.0, 19095.0, 39434.0, 95111.0, 361814.0, 337072.0, 90741.0, 38368.0, 19040.0, 10137.0, 5647.0, 3215.0, 1938.0, 1101.0, 697.0, 420.0, 283.0, 165.0, 113.0, 75.0, 52.0, 27.0, 22.0, 15.0, 10.0, 4.0, 7.0, 5.0, 5.0, 6.0, 0.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1290283203125, -0.1248626708984375, -0.120697021484375, -0.1165313720703125, -0.11236572265625, -0.1082000732421875, -0.104034423828125, -0.0998687744140625, -0.095703125, -0.0915374755859375, -0.087371826171875, -0.0832061767578125, -0.07904052734375, -0.0748748779296875, -0.070709228515625, -0.0665435791015625, -0.0623779296875, -0.0582122802734375, -0.054046630859375, -0.0498809814453125, -0.04571533203125, -0.0415496826171875, -0.037384033203125, -0.0332183837890625, -0.029052734375, -0.0248870849609375, -0.020721435546875, -0.0165557861328125, -0.01239013671875, -0.0082244873046875, -0.004058837890625, 0.0001068115234375, 0.0042724609375, 0.0084381103515625, 0.012603759765625, 0.0167694091796875, 0.02093505859375, 0.0251007080078125, 0.029266357421875, 0.0334320068359375, 0.03759765625, 0.0417633056640625, 0.045928955078125, 0.0500946044921875, 0.05426025390625, 0.0584259033203125, 0.062591552734375, 0.0667572021484375, 0.0709228515625, 0.0750885009765625, 0.079254150390625, 0.0834197998046875, 0.08758544921875, 0.0917510986328125, 0.095916748046875, 0.1000823974609375, 0.104248046875, 0.1084136962890625, 0.112579345703125, 0.1167449951171875, 0.12091064453125, 0.1250762939453125, 0.129241943359375, 0.1334075927734375, 0.1375732421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 5.0, 6.0, 6.0, 4.0, 13.0, 5.0, 12.0, 18.0, 26.0, 35.0, 41.0, 37.0, 49.0, 67.0, 102.0, 133.0, 94.0, 60.0, 42.0, 39.0, 29.0, 23.0, 23.0, 23.0, 20.0, 14.0, 7.0, 8.0, 13.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.05609130859375, -0.054302215576171875, -0.05251312255859375, -0.050724029541015625, -0.0489349365234375, -0.047145843505859375, -0.04535675048828125, -0.043567657470703125, -0.041778564453125, -0.039989471435546875, -0.03820037841796875, -0.036411285400390625, -0.0346221923828125, -0.032833099365234375, -0.03104400634765625, -0.029254913330078125, -0.0274658203125, -0.025676727294921875, -0.02388763427734375, -0.022098541259765625, -0.0203094482421875, -0.018520355224609375, -0.01673126220703125, -0.014942169189453125, -0.013153076171875, -0.011363983154296875, -0.00957489013671875, -0.007785797119140625, -0.0059967041015625, -0.004207611083984375, -0.00241851806640625, -0.000629425048828125, 0.00115966796875, 0.002948760986328125, 0.00473785400390625, 0.006526947021484375, 0.0083160400390625, 0.010105133056640625, 0.01189422607421875, 0.013683319091796875, 0.015472412109375, 0.017261505126953125, 0.01905059814453125, 0.020839691162109375, 0.0226287841796875, 0.024417877197265625, 0.02620697021484375, 0.027996063232421875, 0.02978515625, 0.031574249267578125, 0.03336334228515625, 0.035152435302734375, 0.0369415283203125, 0.038730621337890625, 0.04051971435546875, 0.042308807373046875, 0.044097900390625, 0.045886993408203125, 0.04767608642578125, 0.049465179443359375, 0.0512542724609375, 0.053043365478515625, 0.05483245849609375, 0.056621551513671875, 0.05841064453125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 2.0, 10.0, 2.0, 12.0, 16.0, 13.0, 16.0, 28.0, 19.0, 35.0, 27.0, 49.0, 50.0, 33.0, 40.0, 50.0, 57.0, 47.0, 56.0, 48.0, 59.0, 49.0, 35.0, 35.0, 34.0, 26.0, 32.0, 17.0, 25.0, 11.0, 19.0, 8.0, 8.0, 12.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3707630634307861, -1.3151752948760986, -1.2595875263214111, -1.2039998769760132, -1.1484121084213257, -1.0928243398666382, -1.0372365713119507, -0.981648862361908, -0.9260611534118652, -0.8704733848571777, -0.814885675907135, -0.7592979073524475, -0.7037101984024048, -0.6481224298477173, -0.5925346612930298, -0.5369469523429871, -0.48135918378829956, -0.42577144503593445, -0.37018370628356934, -0.31459593772888184, -0.2590082287788391, -0.2034204602241516, -0.1478327214717865, -0.09224498271942139, -0.036657243967056274, 0.018930498510599136, 0.07451824098825455, 0.13010598719120026, 0.18569372594356537, 0.24128147959709167, 0.2968692183494568, 0.3524569571018219, 0.408044695854187, 0.4636324346065521, 0.5192201733589172, 0.5748079419136047, 0.6303956508636475, 0.685983419418335, 0.7415711879730225, 0.7971588969230652, 0.8527466058731079, 0.9083343744277954, 0.9639220833778381, 1.0195097923278809, 1.0750975608825684, 1.1306853294372559, 1.1862730979919434, 1.2418608665466309, 1.2974486351013184, 1.3530364036560059, 1.4086241722106934, 1.4642118215560913, 1.5197995901107788, 1.5753873586654663, 1.6309751272201538, 1.6865627765655518, 1.7421505451202393, 1.7977383136749268, 1.8533260822296143, 1.9089137315750122, 1.9645015001296997, 2.0200891494750977, 2.075676918029785, 2.1312646865844727, 2.18685245513916]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 6.0, 9.0, 7.0, 12.0, 16.0, 13.0, 18.0, 12.0, 20.0, 19.0, 22.0, 33.0, 28.0, 29.0, 35.0, 42.0, 37.0, 40.0, 42.0, 45.0, 51.0, 42.0, 36.0, 34.0, 38.0, 36.0, 40.0, 29.0, 31.0, 22.0, 29.0, 23.0, 20.0, 13.0, 18.0, 10.0, 15.0, 8.0, 3.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8072359561920166, -1.7508479356765747, -1.6944599151611328, -1.638071894645691, -1.581683874130249, -1.5252959728240967, -1.4689079523086548, -1.412519931793213, -1.356131911277771, -1.299743890762329, -1.2433558702468872, -1.1869678497314453, -1.130579948425293, -1.0741918087005615, -1.0178039073944092, -0.9614158868789673, -0.9050278663635254, -0.8486398458480835, -0.7922518253326416, -0.7358638644218445, -0.6794758439064026, -0.6230878233909607, -0.5666998624801636, -0.5103118419647217, -0.4539238214492798, -0.3975358009338379, -0.3411478102207184, -0.2847598195075989, -0.22837179899215698, -0.1719837784767151, -0.11559578776359558, -0.059207797050476074, -0.0028198957443237305, 0.05356810986995697, 0.10995611548423767, 0.16634412109851837, 0.22273212671279907, 0.27912014722824097, 0.3355081379413605, 0.39189612865448, 0.4482841491699219, 0.5046721696853638, 0.5610601902008057, 0.6174481511116028, 0.6738361716270447, 0.7302241921424866, 0.7866121530532837, 0.8430001735687256, 0.8993881940841675, 0.9557762145996094, 1.0121642351150513, 1.0685522556304932, 1.1249401569366455, 1.181328296661377, 1.2377161979675293, 1.2941042184829712, 1.350492238998413, 1.406880259513855, 1.4632682800292969, 1.5196563005447388, 1.5760443210601807, 1.632432222366333, 1.688820242881775, 1.7452082633972168, 1.8015962839126587]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 14.0, 16.0, 24.0, 27.0, 35.0, 66.0, 95.0, 166.0, 258.0, 388.0, 612.0, 1220.0, 2263.0, 4710.0, 9956.0, 21149.0, 47453.0, 103005.0, 196687.0, 264482.0, 198857.0, 106182.0, 48852.0, 21976.0, 10016.0, 4685.0, 2356.0, 1181.0, 644.0, 418.0, 254.0, 156.0, 103.0, 60.0, 59.0, 32.0, 25.0, 19.0, 9.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.466064453125, -2.38525390625, -2.304443359375, -2.2236328125, -2.142822265625, -2.06201171875, -1.981201171875, -1.900390625, -1.819580078125, -1.73876953125, -1.657958984375, -1.5771484375, -1.496337890625, -1.41552734375, -1.334716796875, -1.25390625, -1.173095703125, -1.09228515625, -1.011474609375, -0.9306640625, -0.849853515625, -0.76904296875, -0.688232421875, -0.607421875, -0.526611328125, -0.44580078125, -0.364990234375, -0.2841796875, -0.203369140625, -0.12255859375, -0.041748046875, 0.0390625, 0.119873046875, 0.20068359375, 0.281494140625, 0.3623046875, 0.443115234375, 0.52392578125, 0.604736328125, 0.685546875, 0.766357421875, 0.84716796875, 0.927978515625, 1.0087890625, 1.089599609375, 1.17041015625, 1.251220703125, 1.33203125, 1.412841796875, 1.49365234375, 1.574462890625, 1.6552734375, 1.736083984375, 1.81689453125, 1.897705078125, 1.978515625, 2.059326171875, 2.14013671875, 2.220947265625, 2.3017578125, 2.382568359375, 2.46337890625, 2.544189453125, 2.625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 10.0, 4.0, 6.0, 8.0, 8.0, 6.0, 12.0, 16.0, 22.0, 16.0, 35.0, 36.0, 32.0, 32.0, 43.0, 38.0, 33.0, 53.0, 47.0, 65.0, 56.0, 46.0, 48.0, 47.0, 50.0, 40.0, 37.0, 29.0, 19.0, 21.0, 25.0, 22.0, 12.0, 6.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68359375, -3.5738525390625, -3.464111328125, -3.3543701171875, -3.24462890625, -3.1348876953125, -3.025146484375, -2.9154052734375, -2.8056640625, -2.6959228515625, -2.586181640625, -2.4764404296875, -2.36669921875, -2.2569580078125, -2.147216796875, -2.0374755859375, -1.927734375, -1.8179931640625, -1.708251953125, -1.5985107421875, -1.48876953125, -1.3790283203125, -1.269287109375, -1.1595458984375, -1.0498046875, -0.9400634765625, -0.830322265625, -0.7205810546875, -0.61083984375, -0.5010986328125, -0.391357421875, -0.2816162109375, -0.171875, -0.0621337890625, 0.047607421875, 0.1573486328125, 0.26708984375, 0.3768310546875, 0.486572265625, 0.5963134765625, 0.7060546875, 0.8157958984375, 0.925537109375, 1.0352783203125, 1.14501953125, 1.2547607421875, 1.364501953125, 1.4742431640625, 1.583984375, 1.6937255859375, 1.803466796875, 1.9132080078125, 2.02294921875, 2.1326904296875, 2.242431640625, 2.3521728515625, 2.4619140625, 2.5716552734375, 2.681396484375, 2.7911376953125, 2.90087890625, 3.0106201171875, 3.120361328125, 3.2301025390625, 3.33984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 11.0, 5.0, 13.0, 12.0, 24.0, 32.0, 43.0, 57.0, 101.0, 159.0, 252.0, 438.0, 943.0, 2587.0, 8961.0, 34049.0, 140279.0, 439860.0, 312711.0, 79956.0, 19348.0, 5328.0, 1768.0, 672.0, 328.0, 217.0, 119.0, 81.0, 61.0, 31.0, 28.0, 12.0, 16.0, 10.0, 9.0, 14.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6953125, -4.53228759765625, -4.3692626953125, -4.20623779296875, -4.043212890625, -3.88018798828125, -3.7171630859375, -3.55413818359375, -3.39111328125, -3.22808837890625, -3.0650634765625, -2.90203857421875, -2.739013671875, -2.57598876953125, -2.4129638671875, -2.24993896484375, -2.0869140625, -1.92388916015625, -1.7608642578125, -1.59783935546875, -1.434814453125, -1.27178955078125, -1.1087646484375, -0.94573974609375, -0.78271484375, -0.61968994140625, -0.4566650390625, -0.29364013671875, -0.130615234375, 0.03240966796875, 0.1954345703125, 0.35845947265625, 0.521484375, 0.68450927734375, 0.8475341796875, 1.01055908203125, 1.173583984375, 1.33660888671875, 1.4996337890625, 1.66265869140625, 1.82568359375, 1.98870849609375, 2.1517333984375, 2.31475830078125, 2.477783203125, 2.64080810546875, 2.8038330078125, 2.96685791015625, 3.1298828125, 3.29290771484375, 3.4559326171875, 3.61895751953125, 3.781982421875, 3.94500732421875, 4.1080322265625, 4.27105712890625, 4.43408203125, 4.59710693359375, 4.7601318359375, 4.92315673828125, 5.086181640625, 5.24920654296875, 5.4122314453125, 5.57525634765625, 5.73828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 5.0, 7.0, 5.0, 11.0, 22.0, 15.0, 14.0, 27.0, 34.0, 27.0, 27.0, 33.0, 38.0, 45.0, 53.0, 46.0, 49.0, 76.0, 50.0, 49.0, 49.0, 46.0, 36.0, 30.0, 28.0, 24.0, 20.0, 17.0, 20.0, 9.0, 16.0, 14.0, 7.0, 10.0, 8.0, 6.0, 0.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.396484375, -3.285430908203125, -3.17437744140625, -3.063323974609375, -2.9522705078125, -2.841217041015625, -2.73016357421875, -2.619110107421875, -2.508056640625, -2.397003173828125, -2.28594970703125, -2.174896240234375, -2.0638427734375, -1.952789306640625, -1.84173583984375, -1.730682373046875, -1.61962890625, -1.508575439453125, -1.39752197265625, -1.286468505859375, -1.1754150390625, -1.064361572265625, -0.95330810546875, -0.842254638671875, -0.731201171875, -0.620147705078125, -0.50909423828125, -0.398040771484375, -0.2869873046875, -0.175933837890625, -0.06488037109375, 0.046173095703125, 0.1572265625, 0.268280029296875, 0.37933349609375, 0.490386962890625, 0.6014404296875, 0.712493896484375, 0.82354736328125, 0.934600830078125, 1.045654296875, 1.156707763671875, 1.26776123046875, 1.378814697265625, 1.4898681640625, 1.600921630859375, 1.71197509765625, 1.823028564453125, 1.93408203125, 2.045135498046875, 2.15618896484375, 2.267242431640625, 2.3782958984375, 2.489349365234375, 2.60040283203125, 2.711456298828125, 2.822509765625, 2.933563232421875, 3.04461669921875, 3.155670166015625, 3.2667236328125, 3.377777099609375, 3.48883056640625, 3.599884033203125, 3.7109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 20.0, 39.0, 57.0, 105.0, 198.0, 417.0, 770.0, 1915.0, 5031.0, 15154.0, 53578.0, 191026.0, 449573.0, 233293.0, 68266.0, 18931.0, 6065.0, 2278.0, 960.0, 426.0, 195.0, 100.0, 57.0, 29.0, 21.0, 16.0, 7.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.1845703125, -1.1560897827148438, -1.1276092529296875, -1.0991287231445312, -1.070648193359375, -1.0421676635742188, -1.0136871337890625, -0.9852066040039062, -0.95672607421875, -0.9282455444335938, -0.8997650146484375, -0.8712844848632812, -0.842803955078125, -0.8143234252929688, -0.7858428955078125, -0.7573623657226562, -0.7288818359375, -0.7004013061523438, -0.6719207763671875, -0.6434402465820312, -0.614959716796875, -0.5864791870117188, -0.5579986572265625, -0.5295181274414062, -0.50103759765625, -0.47255706787109375, -0.4440765380859375, -0.41559600830078125, -0.387115478515625, -0.35863494873046875, -0.3301544189453125, -0.30167388916015625, -0.273193359375, -0.24471282958984375, -0.2162322998046875, -0.18775177001953125, -0.159271240234375, -0.13079071044921875, -0.1023101806640625, -0.07382965087890625, -0.04534912109375, -0.01686859130859375, 0.0116119384765625, 0.04009246826171875, 0.068572998046875, 0.09705352783203125, 0.1255340576171875, 0.15401458740234375, 0.1824951171875, 0.21097564697265625, 0.2394561767578125, 0.26793670654296875, 0.296417236328125, 0.32489776611328125, 0.3533782958984375, 0.38185882568359375, 0.41033935546875, 0.43881988525390625, 0.4673004150390625, 0.49578094482421875, 0.524261474609375, 0.5527420043945312, 0.5812225341796875, 0.6097030639648438, 0.63818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 9.0, 10.0, 14.0, 13.0, 13.0, 20.0, 31.0, 34.0, 56.0, 60.0, 68.0, 87.0, 157.0, 86.0, 57.0, 48.0, 36.0, 36.0, 39.0, 21.0, 27.0, 12.0, 9.0, 11.0, 11.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00018262863159179688, -0.00017763115465641022, -0.00017263367772102356, -0.0001676362007856369, -0.00016263872385025024, -0.00015764124691486359, -0.00015264376997947693, -0.00014764629304409027, -0.0001426488161087036, -0.00013765133917331696, -0.0001326538622379303, -0.00012765638530254364, -0.00012265890836715698, -0.00011766143143177032, -0.00011266395449638367, -0.00010766647756099701, -0.00010266900062561035, -9.76715236902237e-05, -9.267404675483704e-05, -8.767656981945038e-05, -8.267909288406372e-05, -7.768161594867706e-05, -7.26841390132904e-05, -6.768666207790375e-05, -6.268918514251709e-05, -5.769170820713043e-05, -5.2694231271743774e-05, -4.769675433635712e-05, -4.269927740097046e-05, -3.77018004655838e-05, -3.2704323530197144e-05, -2.7706846594810486e-05, -2.2709369659423828e-05, -1.771189272403717e-05, -1.2714415788650513e-05, -7.716938853263855e-06, -2.7194619178771973e-06, 2.2780150175094604e-06, 7.275491952896118e-06, 1.2272968888282776e-05, 1.7270445823669434e-05, 2.226792275905609e-05, 2.726539969444275e-05, 3.226287662982941e-05, 3.7260353565216064e-05, 4.225783050060272e-05, 4.725530743598938e-05, 5.225278437137604e-05, 5.7250261306762695e-05, 6.224773824214935e-05, 6.724521517753601e-05, 7.224269211292267e-05, 7.724016904830933e-05, 8.223764598369598e-05, 8.723512291908264e-05, 9.22325998544693e-05, 9.723007678985596e-05, 0.00010222755372524261, 0.00010722503066062927, 0.00011222250759601593, 0.00011721998453140259, 0.00012221746146678925, 0.0001272149384021759, 0.00013221241533756256, 0.00013720989227294922]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 5.0, 11.0, 23.0, 35.0, 44.0, 71.0, 95.0, 145.0, 253.0, 393.0, 635.0, 1129.0, 2044.0, 3851.0, 8575.0, 23549.0, 80378.0, 268507.0, 440783.0, 149781.0, 42478.0, 13715.0, 5664.0, 2728.0, 1443.0, 785.0, 521.0, 316.0, 218.0, 123.0, 84.0, 50.0, 39.0, 30.0, 22.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.002105712890625, -0.97003173828125, -0.937957763671875, -0.9058837890625, -0.873809814453125, -0.84173583984375, -0.809661865234375, -0.777587890625, -0.745513916015625, -0.71343994140625, -0.681365966796875, -0.6492919921875, -0.617218017578125, -0.58514404296875, -0.553070068359375, -0.52099609375, -0.488922119140625, -0.45684814453125, -0.424774169921875, -0.3927001953125, -0.360626220703125, -0.32855224609375, -0.296478271484375, -0.264404296875, -0.232330322265625, -0.20025634765625, -0.168182373046875, -0.1361083984375, -0.104034423828125, -0.07196044921875, -0.039886474609375, -0.0078125, 0.024261474609375, 0.05633544921875, 0.088409423828125, 0.1204833984375, 0.152557373046875, 0.18463134765625, 0.216705322265625, 0.248779296875, 0.280853271484375, 0.31292724609375, 0.345001220703125, 0.3770751953125, 0.409149169921875, 0.44122314453125, 0.473297119140625, 0.50537109375, 0.537445068359375, 0.56951904296875, 0.601593017578125, 0.6336669921875, 0.665740966796875, 0.69781494140625, 0.729888916015625, 0.761962890625, 0.794036865234375, 0.82611083984375, 0.858184814453125, 0.8902587890625, 0.922332763671875, 0.95440673828125, 0.986480712890625, 1.0185546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 18.0, 28.0, 37.0, 59.0, 98.0, 100.0, 154.0, 135.0, 85.0, 64.0, 62.0, 41.0, 35.0, 14.0, 12.0, 13.0, 6.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5100173950195312, -0.4843902587890625, -0.45876312255859375, -0.433135986328125, -0.40750885009765625, -0.3818817138671875, -0.35625457763671875, -0.33062744140625, -0.30500030517578125, -0.2793731689453125, -0.25374603271484375, -0.228118896484375, -0.20249176025390625, -0.1768646240234375, -0.15123748779296875, -0.1256103515625, -0.09998321533203125, -0.0743560791015625, -0.04872894287109375, -0.023101806640625, 0.00252532958984375, 0.0281524658203125, 0.05377960205078125, 0.07940673828125, 0.10503387451171875, 0.1306610107421875, 0.15628814697265625, 0.181915283203125, 0.20754241943359375, 0.2331695556640625, 0.25879669189453125, 0.284423828125, 0.31005096435546875, 0.3356781005859375, 0.36130523681640625, 0.386932373046875, 0.41255950927734375, 0.4381866455078125, 0.46381378173828125, 0.48944091796875, 0.5150680541992188, 0.5406951904296875, 0.5663223266601562, 0.591949462890625, 0.6175765991210938, 0.6432037353515625, 0.6688308715820312, 0.6944580078125, 0.7200851440429688, 0.7457122802734375, 0.7713394165039062, 0.796966552734375, 0.8225936889648438, 0.8482208251953125, 0.8738479614257812, 0.89947509765625, 0.9251022338867188, 0.9507293701171875, 0.9763565063476562, 1.001983642578125, 1.0276107788085938, 1.0532379150390625, 1.0788650512695312, 1.1044921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 20.0, 15.0, 32.0, 56.0, 72.0, 85.0, 84.0, 105.0, 94.0, 109.0, 90.0, 64.0, 52.0, 37.0, 26.0, 17.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.922094345092773, -9.714754104614258, -9.507413864135742, -9.300073623657227, -9.092733383178711, -8.885393142700195, -8.67805290222168, -8.470712661743164, -8.263372421264648, -8.056032180786133, -7.848691940307617, -7.641351699829102, -7.434011459350586, -7.22667121887207, -7.019330978393555, -6.811990737915039, -6.604650497436523, -6.397310256958008, -6.189970016479492, -5.982629776000977, -5.775289535522461, -5.567949295043945, -5.36060905456543, -5.153268814086914, -4.945929050445557, -4.738588809967041, -4.531248569488525, -4.32390832901001, -4.116568088531494, -3.9092278480529785, -3.701887607574463, -3.4945473670959473, -3.2872071266174316, -3.079866886138916, -2.8725266456604004, -2.6651864051818848, -2.457846164703369, -2.2505059242248535, -2.043165683746338, -1.8358255624771118, -1.6284853219985962, -1.4211450815200806, -1.213804841041565, -1.0064647197723389, -0.7991244196891785, -0.5917842388153076, -0.384443998336792, -0.17710375785827637, 0.030236482620239258, 0.2375767081975937, 0.4449169337749481, 0.6522571444511414, 0.859597384929657, 1.0669375658035278, 1.2742778062820435, 1.481618046760559, 1.6889582872390747, 1.8962985277175903, 2.1036386489868164, 2.310978889465332, 2.5183191299438477, 2.7256593704223633, 2.932999610900879, 3.1403398513793945, 3.34768009185791]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 12.0, 10.0, 13.0, 7.0, 10.0, 14.0, 30.0, 29.0, 25.0, 27.0, 29.0, 29.0, 42.0, 31.0, 44.0, 42.0, 38.0, 45.0, 51.0, 41.0, 35.0, 33.0, 29.0, 37.0, 35.0, 36.0, 33.0, 25.0, 15.0, 17.0, 16.0, 25.0, 16.0, 14.0, 16.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.669668197631836, -5.494604110717773, -5.319540500640869, -5.144476413726807, -4.969412326812744, -4.79434871673584, -4.619284629821777, -4.444220542907715, -4.269156455993652, -4.09409236907959, -3.9190285205841064, -3.743964672088623, -3.5689005851745605, -3.393836736679077, -3.2187728881835938, -3.0437088012695312, -2.868645191192627, -2.6935813426971436, -2.518517255783081, -2.3434534072875977, -2.168389320373535, -1.9933254718780518, -1.8182616233825684, -1.6431976556777954, -1.4681336879730225, -1.2930697202682495, -1.1180057525634766, -0.9429419040679932, -0.7678779363632202, -0.5928139686584473, -0.41775012016296387, -0.24268615245819092, -0.06762218475341797, 0.10744175314903259, 0.28250569105148315, 0.45756959915161133, 0.6326335668563843, 0.8076975345611572, 0.9827613830566406, 1.1578253507614136, 1.3328893184661865, 1.5079532861709595, 1.6830172538757324, 1.8580811023712158, 2.033144950866699, 2.2082090377807617, 2.383272886276245, 2.5583367347717285, 2.733400821685791, 2.9084646701812744, 3.083528757095337, 3.2585926055908203, 3.433656692504883, 3.608720541000366, 3.7837843894958496, 3.958848476409912, 4.133912086486816, 4.308976173400879, 4.484039783477783, 4.659103870391846, 4.834167957305908, 5.0092315673828125, 5.184295654296875, 5.3593597412109375, 5.534423828125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 9.0, 8.0, 13.0, 19.0, 23.0, 26.0, 46.0, 67.0, 68.0, 112.0, 162.0, 184.0, 319.0, 450.0, 647.0, 917.0, 1361.0, 2064.0, 3046.0, 4385.0, 6128.0, 1014167.0, 5252.0, 3486.0, 2458.0, 1596.0, 1081.0, 727.0, 543.0, 364.0, 237.0, 168.0, 122.0, 105.0, 68.0, 47.0, 28.0, 22.0, 22.0, 21.0, 12.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.356604099273682, -5.200021266937256, -5.04343843460083, -4.8868560791015625, -4.730273246765137, -4.573690414428711, -4.417107582092285, -4.260524749755859, -4.103941917419434, -3.947359085083008, -3.790776491165161, -3.6341936588287354, -3.4776110649108887, -3.321028232574463, -3.164445400238037, -3.0078625679016113, -2.8512802124023438, -2.694697380065918, -2.5381147861480713, -2.3815319538116455, -2.224949359893799, -2.068366527557373, -1.9117836952209473, -1.755200982093811, -1.5986182689666748, -1.4420355558395386, -1.2854528427124023, -1.1288700103759766, -0.9722872972488403, -0.8157045841217041, -0.6591218113899231, -0.5025390386581421, -0.34595584869384766, -0.18937310576438904, -0.03279036283493042, 0.1237923800945282, 0.2803751230239868, 0.43695783615112305, 0.593540608882904, 0.7501233816146851, 0.9067060947418213, 1.0632888078689575, 1.2198715209960938, 1.3764543533325195, 1.5330370664596558, 1.689619779586792, 1.8462026119232178, 2.0027852058410645, 2.1593680381774902, 2.315950870513916, 2.4725334644317627, 2.6291162967681885, 2.785698890686035, 2.942281723022461, 3.0988645553588867, 3.2554473876953125, 3.412029981613159, 3.568612813949585, 3.7251954078674316, 3.8817782402038574, 4.038361072540283, 4.194943428039551, 4.351526260375977, 4.508109092712402, 4.664691925048828]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 12.0, 12.0, 33.0, 62.0, 91.0, 177.0, 402.0, 1098.0, 3886.0, 19816.0, 51054424.0, 360975.0, 23030.0, 4727.0, 1152.0, 400.0, 192.0, 101.0, 54.0, 36.0, 25.0, 18.0, 17.0, 10.0, 9.0, 9.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.578125, -21.893598556518555, -21.209070205688477, -20.52454376220703, -19.840017318725586, -19.15549087524414, -18.470962524414062, -17.786436080932617, -17.101909637451172, -16.417383193969727, -15.732855796813965, -15.048328399658203, -14.363801956176758, -13.679274559020996, -12.994747161865234, -12.310220718383789, -11.625692367553711, -10.94116497039795, -10.256638526916504, -9.572111129760742, -8.887584686279297, -8.203057289123535, -7.518529891967773, -6.83400297164917, -6.149476051330566, -5.464949131011963, -4.780422210693359, -4.095894813537598, -3.411367893218994, -2.7268409729003906, -2.042313575744629, -1.3577866554260254, -0.6732616424560547, 0.011265397071838379, 0.6957924365997314, 1.380319595336914, 2.0648465156555176, 2.749373435974121, 3.433900833129883, 4.118427753448486, 4.80295467376709, 5.487481594085693, 6.172008514404297, 6.856535911560059, 7.541062831878662, 8.225589752197266, 8.910117149353027, 9.594644546508789, 10.279170989990234, 10.963698387145996, 11.648224830627441, 12.332752227783203, 13.017278671264648, 13.70180606842041, 14.386333465576172, 15.070859909057617, 15.755387306213379, 16.43991470336914, 17.124441146850586, 17.80896759033203, 18.49349594116211, 19.178022384643555, 19.862548828125, 20.547077178955078, 21.231603622436523]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 7.0, 14.0, 29.0, 38.0, 58.0, 84.0, 179.0, 240.0, 413.0, 668.0, 992.0, 1668.0, 2665.0, 4456.0, 7385.0, 12070.0, 19861.0, 32954.0, 52972.0, 85209.0, 131278.0, 195884.0, 274241.0, 352376.0, 2214180.0, 1737724.0, 350106.0, 271839.0, 193038.0, 129204.0, 83484.0, 52256.0, 32472.0, 20165.0, 11994.0, 7600.0, 4446.0, 2784.0, 1664.0, 1045.0, 634.0, 394.0, 264.0, 151.0, 85.0, 59.0, 43.0, 20.0, 23.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.0751953125, -1.0415802001953125, -1.007965087890625, -0.9743499755859375, -0.94073486328125, -0.9071197509765625, -0.873504638671875, -0.8398895263671875, -0.8062744140625, -0.7726593017578125, -0.739044189453125, -0.7054290771484375, -0.67181396484375, -0.6381988525390625, -0.604583740234375, -0.5709686279296875, -0.537353515625, -0.5037384033203125, -0.470123291015625, -0.4365081787109375, -0.40289306640625, -0.3692779541015625, -0.335662841796875, -0.3020477294921875, -0.2684326171875, -0.2348175048828125, -0.201202392578125, -0.1675872802734375, -0.13397216796875, -0.1003570556640625, -0.066741943359375, -0.0331268310546875, 0.00048828125, 0.0341033935546875, 0.067718505859375, 0.1013336181640625, 0.13494873046875, 0.1685638427734375, 0.202178955078125, 0.2357940673828125, 0.2694091796875, 0.3030242919921875, 0.336639404296875, 0.3702545166015625, 0.40386962890625, 0.4374847412109375, 0.471099853515625, 0.5047149658203125, 0.538330078125, 0.5719451904296875, 0.605560302734375, 0.6391754150390625, 0.67279052734375, 0.7064056396484375, 0.740020751953125, 0.7736358642578125, 0.8072509765625, 0.8408660888671875, 0.874481201171875, 0.9080963134765625, 0.94171142578125, 0.9753265380859375, 1.008941650390625, 1.0425567626953125, 1.076171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 8.0, 7.0, 16.0, 10.0, 14.0, 13.0, 16.0, 19.0, 22.0, 21.0, 38.0, 32.0, 45.0, 33.0, 35.0, 40.0, 34.0, 45.0, 1069.0, 48.0, 39.0, 35.0, 39.0, 41.0, 48.0, 30.0, 32.0, 28.0, 31.0, 19.0, 18.0, 10.0, 17.0, 11.0, 11.0, 8.0, 10.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.171875, -20.501953125, -19.83203125, -19.162109375, -18.4921875, -17.822265625, -17.15234375, -16.482421875, -15.8125, -15.142578125, -14.47265625, -13.802734375, -13.1328125, -12.462890625, -11.79296875, -11.123046875, -10.453125, -9.783203125, -9.11328125, -8.443359375, -7.7734375, -7.103515625, -6.43359375, -5.763671875, -5.09375, -4.423828125, -3.75390625, -3.083984375, -2.4140625, -1.744140625, -1.07421875, -0.404296875, 0.265625, 0.935546875, 1.60546875, 2.275390625, 2.9453125, 3.615234375, 4.28515625, 4.955078125, 5.625, 6.294921875, 6.96484375, 7.634765625, 8.3046875, 8.974609375, 9.64453125, 10.314453125, 10.984375, 11.654296875, 12.32421875, 12.994140625, 13.6640625, 14.333984375, 15.00390625, 15.673828125, 16.34375, 17.013671875, 17.68359375, 18.353515625, 19.0234375, 19.693359375, 20.36328125, 21.033203125, 21.703125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 9.0, 14.0, 28.0, 41.0, 68.0, 122.0, 191.0, 290.0, 533.0, 910.0, 1530.0, 2441.0, 4301.0, 7139.0, 12065.0, 19858.0, 31770.0, 50113.0, 77739.0, 117357.0, 169262.0, 231628.0, 295689.0, 364862.0, 3445359.0, 395785.0, 301765.0, 238808.0, 176560.0, 123434.0, 82247.0, 53530.0, 33673.0, 20562.0, 12654.0, 7668.0, 4664.0, 2670.0, 1625.0, 997.0, 558.0, 366.0, 223.0, 121.0, 93.0, 45.0, 26.0, 18.0, 12.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.994842529296875, -0.96429443359375, -0.933746337890625, -0.9031982421875, -0.872650146484375, -0.84210205078125, -0.811553955078125, -0.781005859375, -0.750457763671875, -0.71990966796875, -0.689361572265625, -0.6588134765625, -0.628265380859375, -0.59771728515625, -0.567169189453125, -0.53662109375, -0.506072998046875, -0.47552490234375, -0.444976806640625, -0.4144287109375, -0.383880615234375, -0.35333251953125, -0.322784423828125, -0.292236328125, -0.261688232421875, -0.23114013671875, -0.200592041015625, -0.1700439453125, -0.139495849609375, -0.10894775390625, -0.078399658203125, -0.0478515625, -0.017303466796875, 0.01324462890625, 0.043792724609375, 0.0743408203125, 0.104888916015625, 0.13543701171875, 0.165985107421875, 0.196533203125, 0.227081298828125, 0.25762939453125, 0.288177490234375, 0.3187255859375, 0.349273681640625, 0.37982177734375, 0.410369873046875, 0.44091796875, 0.471466064453125, 0.50201416015625, 0.532562255859375, 0.5631103515625, 0.593658447265625, 0.62420654296875, 0.654754638671875, 0.685302734375, 0.715850830078125, 0.74639892578125, 0.776947021484375, 0.8074951171875, 0.838043212890625, 0.86859130859375, 0.899139404296875, 0.9296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 4.0, 13.0, 9.0, 10.0, 16.0, 10.0, 19.0, 20.0, 19.0, 19.0, 30.0, 32.0, 33.0, 47.0, 42.0, 39.0, 36.0, 43.0, 928.0, 169.0, 32.0, 51.0, 27.0, 37.0, 30.0, 31.0, 26.0, 25.0, 26.0, 28.0, 31.0, 22.0, 21.0, 17.0, 10.0, 7.0, 10.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.5390625, -13.099365234375, -12.65966796875, -12.219970703125, -11.7802734375, -11.340576171875, -10.90087890625, -10.461181640625, -10.021484375, -9.581787109375, -9.14208984375, -8.702392578125, -8.2626953125, -7.822998046875, -7.38330078125, -6.943603515625, -6.50390625, -6.064208984375, -5.62451171875, -5.184814453125, -4.7451171875, -4.305419921875, -3.86572265625, -3.426025390625, -2.986328125, -2.546630859375, -2.10693359375, -1.667236328125, -1.2275390625, -0.787841796875, -0.34814453125, 0.091552734375, 0.53125, 0.970947265625, 1.41064453125, 1.850341796875, 2.2900390625, 2.729736328125, 3.16943359375, 3.609130859375, 4.048828125, 4.488525390625, 4.92822265625, 5.367919921875, 5.8076171875, 6.247314453125, 6.68701171875, 7.126708984375, 7.56640625, 8.006103515625, 8.44580078125, 8.885498046875, 9.3251953125, 9.764892578125, 10.20458984375, 10.644287109375, 11.083984375, 11.523681640625, 11.96337890625, 12.403076171875, 12.8427734375, 13.282470703125, 13.72216796875, 14.161865234375, 14.6015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 24.0, 36.0, 52.0, 81.0, 90.0, 145.0, 231.0, 356.0, 504.0, 741.0, 1198.0, 1716.0, 2798.0, 4442.0, 7057.0, 11145.0, 17601.0, 27596.0, 43571.0, 67225.0, 106965.0, 5425731.0, 308621.0, 94843.0, 60954.0, 39549.0, 24829.0, 15668.0, 9888.0, 6194.0, 3943.0, 2589.0, 1659.0, 1122.0, 758.0, 478.0, 352.0, 191.0, 128.0, 99.0, 68.0, 51.0, 41.0, 19.0, 20.0, 13.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1015625, -2.02880859375, -1.9560546875, -1.88330078125, -1.810546875, -1.73779296875, -1.6650390625, -1.59228515625, -1.51953125, -1.44677734375, -1.3740234375, -1.30126953125, -1.228515625, -1.15576171875, -1.0830078125, -1.01025390625, -0.9375, -0.86474609375, -0.7919921875, -0.71923828125, -0.646484375, -0.57373046875, -0.5009765625, -0.42822265625, -0.35546875, -0.28271484375, -0.2099609375, -0.13720703125, -0.064453125, 0.00830078125, 0.0810546875, 0.15380859375, 0.2265625, 0.29931640625, 0.3720703125, 0.44482421875, 0.517578125, 0.59033203125, 0.6630859375, 0.73583984375, 0.80859375, 0.88134765625, 0.9541015625, 1.02685546875, 1.099609375, 1.17236328125, 1.2451171875, 1.31787109375, 1.390625, 1.46337890625, 1.5361328125, 1.60888671875, 1.681640625, 1.75439453125, 1.8271484375, 1.89990234375, 1.97265625, 2.04541015625, 2.1181640625, 2.19091796875, 2.263671875, 2.33642578125, 2.4091796875, 2.48193359375, 2.5546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 3.0, 11.0, 13.0, 16.0, 18.0, 22.0, 25.0, 21.0, 29.0, 23.0, 18.0, 20.0, 35.0, 30.0, 49.0, 35.0, 36.0, 135.0, 953.0, 42.0, 48.0, 37.0, 42.0, 41.0, 31.0, 31.0, 28.0, 26.0, 28.0, 20.0, 29.0, 18.0, 21.0, 10.0, 11.0, 11.0, 9.0, 7.0, 5.0, 6.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.25, -10.9312744140625, -10.612548828125, -10.2938232421875, -9.97509765625, -9.6563720703125, -9.337646484375, -9.0189208984375, -8.7001953125, -8.3814697265625, -8.062744140625, -7.7440185546875, -7.42529296875, -7.1065673828125, -6.787841796875, -6.4691162109375, -6.150390625, -5.8316650390625, -5.512939453125, -5.1942138671875, -4.87548828125, -4.5567626953125, -4.238037109375, -3.9193115234375, -3.6005859375, -3.2818603515625, -2.963134765625, -2.6444091796875, -2.32568359375, -2.0069580078125, -1.688232421875, -1.3695068359375, -1.05078125, -0.7320556640625, -0.413330078125, -0.0946044921875, 0.22412109375, 0.5428466796875, 0.861572265625, 1.1802978515625, 1.4990234375, 1.8177490234375, 2.136474609375, 2.4552001953125, 2.77392578125, 3.0926513671875, 3.411376953125, 3.7301025390625, 4.048828125, 4.3675537109375, 4.686279296875, 5.0050048828125, 5.32373046875, 5.6424560546875, 5.961181640625, 6.2799072265625, 6.5986328125, 6.9173583984375, 7.236083984375, 7.5548095703125, 7.87353515625, 8.1922607421875, 8.510986328125, 8.8297119140625, 9.1484375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 14.0, 7.0, 22.0, 58.0, 157.0, 288.0, 236.0, 104.0, 53.0, 31.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.218788146972656, -23.16107177734375, -22.103357315063477, -21.04564094543457, -19.987924575805664, -18.93021011352539, -17.872493743896484, -16.814777374267578, -15.757061958312988, -14.699346542358398, -13.641630172729492, -12.583914756774902, -11.526199340820312, -10.468482971191406, -9.410767555236816, -8.353052139282227, -7.29533576965332, -6.237619876861572, -5.179903984069824, -4.122188568115234, -3.0644726753234863, -2.0067567825317383, -0.9490413665771484, 0.10867452621459961, 1.1663904190063477, 2.2241063117980957, 3.2818219661712646, 4.339537620544434, 5.397253513336182, 6.45496940612793, 7.5126848220825195, 8.57040023803711, 9.628116607666016, 10.685832023620605, 11.743548393249512, 12.801263809204102, 13.858980178833008, 14.916695594787598, 15.974411010742188, 17.032127380371094, 18.08984375, 19.147560119628906, 20.20527458190918, 21.262990951538086, 22.320707321166992, 23.378421783447266, 24.436138153076172, 25.493854522705078, 26.55156898498535, 27.609285354614258, 28.66699981689453, 29.724716186523438, 30.782432556152344, 31.84014892578125, 32.897865295410156, 33.9555778503418, 35.0132942199707, 36.07101058959961, 37.128726959228516, 38.186439514160156, 39.24415588378906, 40.30187225341797, 41.359588623046875, 42.41730499267578, 43.47502136230469]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 12.0, 4.0, 10.0, 11.0, 8.0, 12.0, 8.0, 16.0, 18.0, 20.0, 22.0, 21.0, 20.0, 39.0, 32.0, 29.0, 37.0, 40.0, 27.0, 39.0, 42.0, 50.0, 45.0, 30.0, 42.0, 40.0, 41.0, 40.0, 28.0, 31.0, 25.0, 19.0, 13.0, 16.0, 14.0, 19.0, 16.0, 6.0, 10.0, 14.0, 8.0, 1.0, 5.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.749069213867188, -13.299906730651855, -12.85074520111084, -12.401582717895508, -11.952421188354492, -11.50325870513916, -11.054097175598145, -10.604934692382812, -10.155773162841797, -9.706610679626465, -9.25744915008545, -8.808286666870117, -8.359125137329102, -7.9099626541137695, -7.460801124572754, -7.011638641357422, -6.562476634979248, -6.113314628601074, -5.6641526222229, -5.214990615844727, -4.765828609466553, -4.316666603088379, -3.867504358291626, -3.418342351913452, -2.9691803455352783, -2.5200183391571045, -2.0708563327789307, -1.6216942071914673, -1.1725322008132935, -0.7233700752258301, -0.27420806884765625, 0.17495393753051758, 0.6241159439086914, 1.0732779502868652, 1.522439956665039, 1.9716020822525024, 2.4207639694213867, 2.8699262142181396, 3.3190882205963135, 3.7682502269744873, 4.217411994934082, 4.666574001312256, 5.11573600769043, 5.5648980140686035, 6.014060020446777, 6.463222503662109, 6.912384033203125, 7.361546516418457, 7.810708522796631, 8.259870529174805, 8.709033012390137, 9.158194541931152, 9.607357025146484, 10.0565185546875, 10.505681037902832, 10.954842567443848, 11.40400505065918, 11.853167533874512, 12.302329063415527, 12.75149154663086, 13.200653076171875, 13.649815559387207, 14.098977088928223, 14.548139572143555, 14.99730110168457]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 11.0, 6.0, 15.0, 26.0, 29.0, 45.0, 62.0, 112.0, 140.0, 181.0, 324.0, 518.0, 805.0, 1334.0, 2338.0, 3854.0, 7087.0, 14015.0, 31299.0, 98012.0, 3839985.0, 120875.0, 35881.0, 15868.0, 8348.0, 4653.0, 2918.0, 1792.0, 1196.0, 772.0, 550.0, 357.0, 269.0, 179.0, 122.0, 84.0, 59.0, 50.0, 32.0, 21.0, 14.0, 11.0, 17.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.348388671875, -0.3366050720214844, -0.32482147216796875, -0.3130378723144531, -0.3012542724609375, -0.2894706726074219, -0.27768707275390625, -0.2659034729003906, -0.254119873046875, -0.24233627319335938, -0.23055267333984375, -0.21876907348632812, -0.2069854736328125, -0.19520187377929688, -0.18341827392578125, -0.17163467407226562, -0.15985107421875, -0.14806747436523438, -0.13628387451171875, -0.12450027465820312, -0.1127166748046875, -0.10093307495117188, -0.08914947509765625, -0.07736587524414062, -0.065582275390625, -0.053798675537109375, -0.04201507568359375, -0.030231475830078125, -0.0184478759765625, -0.006664276123046875, 0.00511932373046875, 0.016902923583984375, 0.0286865234375, 0.040470123291015625, 0.05225372314453125, 0.06403732299804688, 0.0758209228515625, 0.08760452270507812, 0.09938812255859375, 0.11117172241210938, 0.122955322265625, 0.13473892211914062, 0.14652252197265625, 0.15830612182617188, 0.1700897216796875, 0.18187332153320312, 0.19365692138671875, 0.20544052124023438, 0.21722412109375, 0.22900772094726562, 0.24079132080078125, 0.2525749206542969, 0.2643585205078125, 0.2761421203613281, 0.28792572021484375, 0.2997093200683594, 0.311492919921875, 0.3232765197753906, 0.33506011962890625, 0.3468437194824219, 0.3586273193359375, 0.3704109191894531, 0.38219451904296875, 0.3939781188964844, 0.40576171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 8.0, 10.0, 11.0, 12.0, 12.0, 22.0, 778.0, 18.0, 15.0, 8.0, 11.0, 12.0, 8.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.106689453125, -0.10329532623291016, -0.09990119934082031, -0.09650707244873047, -0.09311294555664062, -0.08971881866455078, -0.08632469177246094, -0.0829305648803711, -0.07953643798828125, -0.0761423110961914, -0.07274818420410156, -0.06935405731201172, -0.06595993041992188, -0.06256580352783203, -0.05917167663574219, -0.055777549743652344, -0.0523834228515625, -0.048989295959472656, -0.04559516906738281, -0.04220104217529297, -0.038806915283203125, -0.03541278839111328, -0.03201866149902344, -0.028624534606933594, -0.02523040771484375, -0.021836280822753906, -0.018442153930664062, -0.015048027038574219, -0.011653900146484375, -0.008259773254394531, -0.0048656463623046875, -0.0014715194702148438, 0.001922607421875, 0.005316734313964844, 0.008710861206054688, 0.012104988098144531, 0.015499114990234375, 0.01889324188232422, 0.022287368774414062, 0.025681495666503906, 0.02907562255859375, 0.032469749450683594, 0.03586387634277344, 0.03925800323486328, 0.042652130126953125, 0.04604625701904297, 0.04944038391113281, 0.052834510803222656, 0.0562286376953125, 0.059622764587402344, 0.06301689147949219, 0.06641101837158203, 0.06980514526367188, 0.07319927215576172, 0.07659339904785156, 0.0799875259399414, 0.08338165283203125, 0.0867757797241211, 0.09016990661621094, 0.09356403350830078, 0.09695816040039062, 0.10035228729248047, 0.10374641418457031, 0.10714054107666016, 0.11053466796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 8.0, 22.0, 34.0, 45.0, 61.0, 106.0, 182.0, 302.0, 505.0, 977.0, 1877.0, 3996.0, 8621.0, 21329.0, 59016.0, 199417.0, 1109286.0, 2362597.0, 296018.0, 81470.0, 27941.0, 10739.0, 4910.0, 2247.0, 1086.0, 601.0, 344.0, 181.0, 117.0, 70.0, 51.0, 39.0, 18.0, 16.0, 10.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.29009246826171875, -0.2801361083984375, -0.27017974853515625, -0.260223388671875, -0.25026702880859375, -0.2403106689453125, -0.23035430908203125, -0.22039794921875, -0.21044158935546875, -0.2004852294921875, -0.19052886962890625, -0.180572509765625, -0.17061614990234375, -0.1606597900390625, -0.15070343017578125, -0.1407470703125, -0.13079071044921875, -0.1208343505859375, -0.11087799072265625, -0.100921630859375, -0.09096527099609375, -0.0810089111328125, -0.07105255126953125, -0.06109619140625, -0.05113983154296875, -0.0411834716796875, -0.03122711181640625, -0.021270751953125, -0.01131439208984375, -0.0013580322265625, 0.00859832763671875, 0.0185546875, 0.02851104736328125, 0.0384674072265625, 0.04842376708984375, 0.058380126953125, 0.06833648681640625, 0.0782928466796875, 0.08824920654296875, 0.09820556640625, 0.10816192626953125, 0.1181182861328125, 0.12807464599609375, 0.138031005859375, 0.14798736572265625, 0.1579437255859375, 0.16790008544921875, 0.1778564453125, 0.18781280517578125, 0.1977691650390625, 0.20772552490234375, 0.217681884765625, 0.22763824462890625, 0.2375946044921875, 0.24755096435546875, 0.25750732421875, 0.26746368408203125, 0.2774200439453125, 0.28737640380859375, 0.297332763671875, 0.30728912353515625, 0.3172454833984375, 0.32720184326171875, 0.337158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 7.0, 12.0, 14.0, 20.0, 27.0, 26.0, 35.0, 47.0, 46.0, 72.0, 91.0, 114.0, 162.0, 218.0, 313.0, 722.0, 852.0, 344.0, 213.0, 149.0, 119.0, 94.0, 87.0, 72.0, 33.0, 45.0, 32.0, 18.0, 22.0, 19.0, 10.0, 3.0, 4.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.14377593994140625, -0.1389923095703125, -0.13420867919921875, -0.129425048828125, -0.12464141845703125, -0.1198577880859375, -0.11507415771484375, -0.11029052734375, -0.10550689697265625, -0.1007232666015625, -0.09593963623046875, -0.091156005859375, -0.08637237548828125, -0.0815887451171875, -0.07680511474609375, -0.072021484375, -0.06723785400390625, -0.0624542236328125, -0.05767059326171875, -0.052886962890625, -0.04810333251953125, -0.0433197021484375, -0.03853607177734375, -0.03375244140625, -0.02896881103515625, -0.0241851806640625, -0.01940155029296875, -0.014617919921875, -0.00983428955078125, -0.0050506591796875, -0.00026702880859375, 0.0045166015625, 0.00930023193359375, 0.0140838623046875, 0.01886749267578125, 0.023651123046875, 0.02843475341796875, 0.0332183837890625, 0.03800201416015625, 0.04278564453125, 0.04756927490234375, 0.0523529052734375, 0.05713653564453125, 0.061920166015625, 0.06670379638671875, 0.0714874267578125, 0.07627105712890625, 0.0810546875, 0.08583831787109375, 0.0906219482421875, 0.09540557861328125, 0.100189208984375, 0.10497283935546875, 0.1097564697265625, 0.11454010009765625, 0.11932373046875, 0.12410736083984375, 0.1288909912109375, 0.13367462158203125, 0.138458251953125, 0.14324188232421875, 0.1480255126953125, 0.15280914306640625, 0.1575927734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 11.0, 11.0, 26.0, 70.0, 134.0, 214.0, 208.0, 166.0, 80.0, 38.0, 22.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0877388715744019, -1.0405055284500122, -0.9932721853256226, -0.9460387825965881, -0.8988054394721985, -0.8515720963478088, -0.8043386936187744, -0.7571053504943848, -0.7098720073699951, -0.6626386642456055, -0.6154053211212158, -0.5681719183921814, -0.5209385752677917, -0.4737052321434021, -0.42647185921669006, -0.379238486289978, -0.3320051431655884, -0.28477180004119873, -0.2375384271144867, -0.19030506908893585, -0.143071711063385, -0.09583835303783417, -0.048604995012283325, -0.001371622085571289, 0.04586172103881836, 0.0930950790643692, 0.14032843708992004, 0.1875617951154709, 0.23479515314102173, 0.2820284962654114, 0.3292618691921234, 0.37649524211883545, 0.42372870445251465, 0.4709620475769043, 0.518195390701294, 0.5654287934303284, 0.612662136554718, 0.6598954796791077, 0.7071288824081421, 0.7543622255325317, 0.8015955686569214, 0.848828911781311, 0.8960622549057007, 0.9432956576347351, 0.9905290007591248, 1.0377624034881592, 1.0849957466125488, 1.1322290897369385, 1.1794624328613281, 1.2266957759857178, 1.2739291191101074, 1.321162462234497, 1.3683958053588867, 1.415629267692566, 1.4628626108169556, 1.5100959539413452, 1.5573292970657349, 1.6045626401901245, 1.6517959833145142, 1.6990293264389038, 1.746262788772583, 1.7934961318969727, 1.8407294750213623, 1.887962818145752, 1.9351961612701416]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 15.0, 12.0, 24.0, 33.0, 36.0, 27.0, 40.0, 38.0, 43.0, 54.0, 45.0, 45.0, 59.0, 47.0, 63.0, 47.0, 42.0, 54.0, 42.0, 22.0, 26.0, 21.0, 20.0, 20.0, 19.0, 10.0, 17.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.9560815691947937, -0.9309221506118774, -0.9057627320289612, -0.8806033134460449, -0.8554439544677734, -0.8302845358848572, -0.8051251173019409, -0.7799656987190247, -0.7548062801361084, -0.7296468615531921, -0.7044874429702759, -0.6793280839920044, -0.6541686654090881, -0.6290092468261719, -0.6038498282432556, -0.5786904096603394, -0.5535310506820679, -0.5283716320991516, -0.5032122135162354, -0.4780528247356415, -0.4528934359550476, -0.42773401737213135, -0.4025745987892151, -0.37741518020629883, -0.35225579142570496, -0.3270963728427887, -0.3019369840621948, -0.27677756547927856, -0.2516181468963623, -0.22645875811576843, -0.20129933953285217, -0.1761399358510971, -0.15098059177398682, -0.12582118809223175, -0.10066177695989609, -0.07550236582756042, -0.05034296214580536, -0.025183558464050293, -2.4139881134033203e-05, 0.025135263800621033, 0.0502946674823761, 0.07545407116413116, 0.10061348229646683, 0.1257728934288025, 0.15093229711055756, 0.17609170079231262, 0.20125111937522888, 0.22641052305698395, 0.251569926738739, 0.2767293453216553, 0.30188873410224915, 0.3270481526851654, 0.3522075414657593, 0.37736696004867554, 0.4025263786315918, 0.42768579721450806, 0.45284518599510193, 0.4780046045780182, 0.5031639933586121, 0.5283234119415283, 0.5534828305244446, 0.5786422491073608, 0.6038016080856323, 0.6289610266685486, 0.6541204452514648]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 15.0, 15.0, 26.0, 31.0, 39.0, 67.0, 85.0, 133.0, 157.0, 276.0, 371.0, 527.0, 843.0, 1283.0, 2107.0, 3382.0, 5410.0, 9503.0, 17799.0, 42850.0, 617070.0, 277746.0, 32062.0, 15278.0, 8187.0, 4832.0, 2980.0, 1856.0, 1145.0, 780.0, 526.0, 342.0, 254.0, 167.0, 117.0, 79.0, 53.0, 52.0, 35.0, 27.0, 15.0, 9.0, 15.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24570465087890625, -0.2377471923828125, -0.22978973388671875, -0.221832275390625, -0.21387481689453125, -0.2059173583984375, -0.19795989990234375, -0.19000244140625, -0.18204498291015625, -0.1740875244140625, -0.16613006591796875, -0.158172607421875, -0.15021514892578125, -0.1422576904296875, -0.13430023193359375, -0.1263427734375, -0.11838531494140625, -0.1104278564453125, -0.10247039794921875, -0.094512939453125, -0.08655548095703125, -0.0785980224609375, -0.07064056396484375, -0.06268310546875, -0.05472564697265625, -0.0467681884765625, -0.03881072998046875, -0.030853271484375, -0.02289581298828125, -0.0149383544921875, -0.00698089599609375, 0.0009765625, 0.00893402099609375, 0.0168914794921875, 0.02484893798828125, 0.032806396484375, 0.04076385498046875, 0.0487213134765625, 0.05667877197265625, 0.06463623046875, 0.07259368896484375, 0.0805511474609375, 0.08850860595703125, 0.096466064453125, 0.10442352294921875, 0.1123809814453125, 0.12033843994140625, 0.1282958984375, 0.13625335693359375, 0.1442108154296875, 0.15216827392578125, 0.160125732421875, 0.16808319091796875, 0.1760406494140625, 0.18399810791015625, 0.19195556640625, 0.19991302490234375, 0.2078704833984375, 0.21582794189453125, 0.223785400390625, 0.23174285888671875, 0.2397003173828125, 0.24765777587890625, 0.255615234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 1.0, 9.0, 3.0, 8.0, 6.0, 10.0, 15.0, 15.0, 37.0, 151.0, 308.0, 243.0, 79.0, 22.0, 17.0, 13.0, 9.0, 11.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10239887237548828, -0.09896278381347656, -0.09552669525146484, -0.09209060668945312, -0.0886545181274414, -0.08521842956542969, -0.08178234100341797, -0.07834625244140625, -0.07491016387939453, -0.07147407531738281, -0.0680379867553711, -0.06460189819335938, -0.061165809631347656, -0.05772972106933594, -0.05429363250732422, -0.0508575439453125, -0.04742145538330078, -0.04398536682128906, -0.040549278259277344, -0.037113189697265625, -0.033677101135253906, -0.030241012573242188, -0.02680492401123047, -0.02336883544921875, -0.01993274688720703, -0.016496658325195312, -0.013060569763183594, -0.009624481201171875, -0.006188392639160156, -0.0027523040771484375, 0.0006837844848632812, 0.004119873046875, 0.007555961608886719, 0.010992050170898438, 0.014428138732910156, 0.017864227294921875, 0.021300315856933594, 0.024736404418945312, 0.02817249298095703, 0.03160858154296875, 0.03504467010498047, 0.03848075866699219, 0.041916847229003906, 0.045352935791015625, 0.048789024353027344, 0.05222511291503906, 0.05566120147705078, 0.0590972900390625, 0.06253337860107422, 0.06596946716308594, 0.06940555572509766, 0.07284164428710938, 0.0762777328491211, 0.07971382141113281, 0.08314990997314453, 0.08658599853515625, 0.09002208709716797, 0.09345817565917969, 0.0968942642211914, 0.10033035278320312, 0.10376644134521484, 0.10720252990722656, 0.11063861846923828, 0.11407470703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 5.0, 16.0, 21.0, 36.0, 83.0, 143.0, 330.0, 733.0, 1942.0, 5998.0, 20283.0, 79778.0, 318449.0, 448735.0, 126972.0, 31241.0, 8992.0, 2877.0, 1029.0, 458.0, 190.0, 115.0, 47.0, 16.0, 20.0, 15.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4912109375, -0.4754486083984375, -0.459686279296875, -0.4439239501953125, -0.42816162109375, -0.4123992919921875, -0.396636962890625, -0.3808746337890625, -0.3651123046875, -0.3493499755859375, -0.333587646484375, -0.3178253173828125, -0.30206298828125, -0.2863006591796875, -0.270538330078125, -0.2547760009765625, -0.239013671875, -0.2232513427734375, -0.207489013671875, -0.1917266845703125, -0.17596435546875, -0.1602020263671875, -0.144439697265625, -0.1286773681640625, -0.1129150390625, -0.0971527099609375, -0.081390380859375, -0.0656280517578125, -0.04986572265625, -0.0341033935546875, -0.018341064453125, -0.0025787353515625, 0.01318359375, 0.0289459228515625, 0.044708251953125, 0.0604705810546875, 0.07623291015625, 0.0919952392578125, 0.107757568359375, 0.1235198974609375, 0.1392822265625, 0.1550445556640625, 0.170806884765625, 0.1865692138671875, 0.20233154296875, 0.2180938720703125, 0.233856201171875, 0.2496185302734375, 0.265380859375, 0.2811431884765625, 0.296905517578125, 0.3126678466796875, 0.32843017578125, 0.3441925048828125, 0.359954833984375, 0.3757171630859375, 0.3914794921875, 0.4072418212890625, 0.423004150390625, 0.4387664794921875, 0.45452880859375, 0.4702911376953125, 0.486053466796875, 0.5018157958984375, 0.517578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 6.0, 12.0, 9.0, 6.0, 11.0, 27.0, 27.0, 31.0, 24.0, 39.0, 39.0, 36.0, 39.0, 47.0, 35.0, 34.0, 38.0, 41.0, 44.0, 32.0, 38.0, 34.0, 29.0, 28.0, 35.0, 30.0, 35.0, 28.0, 28.0, 21.0, 13.0, 11.0, 14.0, 18.0, 6.0, 7.0, 6.0, 10.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.373046875, -0.3599891662597656, -0.34693145751953125, -0.3338737487792969, -0.3208160400390625, -0.3077583312988281, -0.29470062255859375, -0.2816429138183594, -0.268585205078125, -0.2555274963378906, -0.24246978759765625, -0.22941207885742188, -0.2163543701171875, -0.20329666137695312, -0.19023895263671875, -0.17718124389648438, -0.16412353515625, -0.15106582641601562, -0.13800811767578125, -0.12495040893554688, -0.1118927001953125, -0.09883499145507812, -0.08577728271484375, -0.07271957397460938, -0.059661865234375, -0.046604156494140625, -0.03354644775390625, -0.020488739013671875, -0.0074310302734375, 0.005626678466796875, 0.01868438720703125, 0.031742095947265625, 0.0447998046875, 0.057857513427734375, 0.07091522216796875, 0.08397293090820312, 0.0970306396484375, 0.11008834838867188, 0.12314605712890625, 0.13620376586914062, 0.149261474609375, 0.16231918334960938, 0.17537689208984375, 0.18843460083007812, 0.2014923095703125, 0.21455001831054688, 0.22760772705078125, 0.24066543579101562, 0.25372314453125, 0.2667808532714844, 0.27983856201171875, 0.2928962707519531, 0.3059539794921875, 0.3190116882324219, 0.33206939697265625, 0.3451271057128906, 0.358184814453125, 0.3712425231933594, 0.38430023193359375, 0.3973579406738281, 0.4104156494140625, 0.4234733581542969, 0.43653106689453125, 0.4495887756347656, 0.462646484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 6.0, 19.0, 20.0, 47.0, 115.0, 349.0, 1490.0, 20258.0, 1018514.0, 6420.0, 869.0, 242.0, 98.0, 53.0, 20.0, 9.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06597900390625, -1.0255126953125, -0.98504638671875, -0.944580078125, -0.90411376953125, -0.8636474609375, -0.82318115234375, -0.78271484375, -0.74224853515625, -0.7017822265625, -0.66131591796875, -0.620849609375, -0.58038330078125, -0.5399169921875, -0.49945068359375, -0.458984375, -0.41851806640625, -0.3780517578125, -0.33758544921875, -0.297119140625, -0.25665283203125, -0.2161865234375, -0.17572021484375, -0.13525390625, -0.09478759765625, -0.0543212890625, -0.01385498046875, 0.026611328125, 0.06707763671875, 0.1075439453125, 0.14801025390625, 0.1884765625, 0.22894287109375, 0.2694091796875, 0.30987548828125, 0.350341796875, 0.39080810546875, 0.4312744140625, 0.47174072265625, 0.51220703125, 0.55267333984375, 0.5931396484375, 0.63360595703125, 0.674072265625, 0.71453857421875, 0.7550048828125, 0.79547119140625, 0.8359375, 0.87640380859375, 0.9168701171875, 0.95733642578125, 0.997802734375, 1.03826904296875, 1.0787353515625, 1.11920166015625, 1.15966796875, 1.20013427734375, 1.2406005859375, 1.28106689453125, 1.321533203125, 1.36199951171875, 1.4024658203125, 1.44293212890625, 1.4833984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 14.0, 15.0, 18.0, 19.0, 15.0, 41.0, 53.0, 59.0, 57.0, 63.0, 73.0, 84.0, 65.0, 66.0, 75.0, 50.0, 48.0, 34.0, 34.0, 19.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.574920654296875e-05, -2.4784356355667114e-05, -2.381950616836548e-05, -2.2854655981063843e-05, -2.1889805793762207e-05, -2.092495560646057e-05, -1.9960105419158936e-05, -1.89952552318573e-05, -1.8030405044555664e-05, -1.706555485725403e-05, -1.6100704669952393e-05, -1.5135854482650757e-05, -1.4171004295349121e-05, -1.3206154108047485e-05, -1.224130392074585e-05, -1.1276453733444214e-05, -1.0311603546142578e-05, -9.346753358840942e-06, -8.381903171539307e-06, -7.417052984237671e-06, -6.452202796936035e-06, -5.487352609634399e-06, -4.522502422332764e-06, -3.557652235031128e-06, -2.592802047729492e-06, -1.6279518604278564e-06, -6.631016731262207e-07, 3.0174851417541504e-07, 1.2665987014770508e-06, 2.2314488887786865e-06, 3.1962990760803223e-06, 4.161149263381958e-06, 5.125999450683594e-06, 6.0908496379852295e-06, 7.055699825286865e-06, 8.020550012588501e-06, 8.985400199890137e-06, 9.950250387191772e-06, 1.0915100574493408e-05, 1.1879950761795044e-05, 1.284480094909668e-05, 1.3809651136398315e-05, 1.4774501323699951e-05, 1.5739351511001587e-05, 1.6704201698303223e-05, 1.766905188560486e-05, 1.8633902072906494e-05, 1.959875226020813e-05, 2.0563602447509766e-05, 2.15284526348114e-05, 2.2493302822113037e-05, 2.3458153009414673e-05, 2.442300319671631e-05, 2.5387853384017944e-05, 2.635270357131958e-05, 2.7317553758621216e-05, 2.828240394592285e-05, 2.9247254133224487e-05, 3.0212104320526123e-05, 3.117695450782776e-05, 3.2141804695129395e-05, 3.310665488243103e-05, 3.4071505069732666e-05, 3.50363552570343e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 7.0, 17.0, 12.0, 23.0, 34.0, 54.0, 87.0, 115.0, 159.0, 244.0, 313.0, 581.0, 936.0, 1543.0, 2870.0, 5570.0, 12027.0, 31639.0, 113897.0, 572434.0, 223442.0, 49213.0, 17006.0, 7470.0, 3652.0, 2009.0, 1155.0, 672.0, 441.0, 290.0, 198.0, 127.0, 89.0, 70.0, 44.0, 25.0, 25.0, 16.0, 13.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.1934814453125, -0.18806076049804688, -0.18264007568359375, -0.17721939086914062, -0.1717987060546875, -0.16637802124023438, -0.16095733642578125, -0.15553665161132812, -0.150115966796875, -0.14469528198242188, -0.13927459716796875, -0.13385391235351562, -0.1284332275390625, -0.12301254272460938, -0.11759185791015625, -0.11217117309570312, -0.10675048828125, -0.10132980346679688, -0.09590911865234375, -0.09048843383789062, -0.0850677490234375, -0.07964706420898438, -0.07422637939453125, -0.06880569458007812, -0.063385009765625, -0.057964324951171875, -0.05254364013671875, -0.047122955322265625, -0.0417022705078125, -0.036281585693359375, -0.03086090087890625, -0.025440216064453125, -0.02001953125, -0.014598846435546875, -0.00917816162109375, -0.003757476806640625, 0.0016632080078125, 0.007083892822265625, 0.01250457763671875, 0.017925262451171875, 0.023345947265625, 0.028766632080078125, 0.03418731689453125, 0.039608001708984375, 0.0450286865234375, 0.050449371337890625, 0.05587005615234375, 0.061290740966796875, 0.06671142578125, 0.07213211059570312, 0.07755279541015625, 0.08297348022460938, 0.0883941650390625, 0.09381484985351562, 0.09923553466796875, 0.10465621948242188, 0.110076904296875, 0.11549758911132812, 0.12091827392578125, 0.12633895874023438, 0.1317596435546875, 0.13718032836914062, 0.14260101318359375, 0.14802169799804688, 0.1534423828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 18.0, 22.0, 39.0, 32.0, 56.0, 69.0, 104.0, 128.0, 109.0, 102.0, 65.0, 55.0, 41.0, 33.0, 33.0, 13.0, 9.0, 11.0, 5.0, 8.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2693595886230469, -0.26064300537109375, -0.2519264221191406, -0.2432098388671875, -0.23449325561523438, -0.22577667236328125, -0.21706008911132812, -0.208343505859375, -0.19962692260742188, -0.19091033935546875, -0.18219375610351562, -0.1734771728515625, -0.16476058959960938, -0.15604400634765625, -0.14732742309570312, -0.13861083984375, -0.12989425659179688, -0.12117767333984375, -0.11246109008789062, -0.1037445068359375, -0.09502792358398438, -0.08631134033203125, -0.07759475708007812, -0.068878173828125, -0.060161590576171875, -0.05144500732421875, -0.042728424072265625, -0.0340118408203125, -0.025295257568359375, -0.01657867431640625, -0.007862091064453125, 0.0008544921875, 0.009571075439453125, 0.01828765869140625, 0.027004241943359375, 0.0357208251953125, 0.044437408447265625, 0.05315399169921875, 0.061870574951171875, 0.070587158203125, 0.07930374145507812, 0.08802032470703125, 0.09673690795898438, 0.1054534912109375, 0.11417007446289062, 0.12288665771484375, 0.13160324096679688, 0.14031982421875, 0.14903640747070312, 0.15775299072265625, 0.16646957397460938, 0.1751861572265625, 0.18390274047851562, 0.19261932373046875, 0.20133590698242188, 0.210052490234375, 0.21876907348632812, 0.22748565673828125, 0.23620223999023438, 0.2449188232421875, 0.2536354064941406, 0.26235198974609375, 0.2710685729980469, 0.27978515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 24.0, 42.0, 96.0, 196.0, 255.0, 164.0, 86.0, 46.0, 29.0, 14.0, 12.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.376052379608154, -5.219544410705566, -5.0630364418029785, -4.906528472900391, -4.750020980834961, -4.593513011932373, -4.437005043029785, -4.280497074127197, -4.123989105224609, -3.9674811363220215, -3.8109731674194336, -3.654465436935425, -3.497957468032837, -3.341449499130249, -3.1849417686462402, -3.0284337997436523, -2.8719258308410645, -2.7154178619384766, -2.5589098930358887, -2.40240216255188, -2.245894193649292, -2.089386224746704, -1.9328783750534058, -1.7763705253601074, -1.6198625564575195, -1.4633545875549316, -1.3068467378616333, -1.150338888168335, -0.9938309192657471, -0.837323009967804, -0.6808151006698608, -0.5243072509765625, -0.3677988052368164, -0.2112908959388733, -0.054782986640930176, 0.10172492265701294, 0.25823283195495605, 0.41474074125289917, 0.5712486505508423, 0.7277565002441406, 0.8842644691467285, 1.0407724380493164, 1.1972802877426147, 1.353788137435913, 1.510296106338501, 1.6668040752410889, 1.8233119249343872, 1.9798197746276855, 2.1363277435302734, 2.2928357124328613, 2.449343681335449, 2.605851411819458, 2.762359380722046, 2.918867349624634, 3.0753750801086426, 3.2318830490112305, 3.3883910179138184, 3.5448989868164062, 3.701406955718994, 3.857914686203003, 4.014422416687012, 4.1709303855896, 4.3274383544921875, 4.483946323394775, 4.640454292297363]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 1.0, 6.0, 5.0, 7.0, 11.0, 17.0, 36.0, 63.0, 111.0, 122.0, 171.0, 130.0, 115.0, 70.0, 35.0, 23.0, 14.0, 11.0, 8.0, 4.0, 2.0, 1.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.360021591186523, -9.090184211730957, -8.820345878601074, -8.550508499145508, -8.280671119689941, -8.010833740234375, -7.740995407104492, -7.471158027648926, -7.201320171356201, -6.931482315063477, -6.66164493560791, -6.3918070793151855, -6.121969223022461, -5.8521318435668945, -5.58229398727417, -5.312456130981445, -5.042618751525879, -4.772780895233154, -4.502943515777588, -4.233105659484863, -3.9632680416107178, -3.6934304237365723, -3.4235925674438477, -3.153754949569702, -2.8839173316955566, -2.614079713821411, -2.3442420959472656, -2.074404239654541, -1.8045666217803955, -1.53472900390625, -1.264891266822815, -0.9950535297393799, -0.7252163887023926, -0.4553787112236023, -0.185541033744812, 0.08429664373397827, 0.35413432121276855, 0.6239719390869141, 0.8938096761703491, 1.1636474132537842, 1.4334850311279297, 1.7033226490020752, 1.9731603860855103, 2.2429981231689453, 2.512835741043091, 2.7826733589172363, 3.052511215209961, 3.3223488330841064, 3.592186450958252, 3.8620240688323975, 4.131861686706543, 4.401699542999268, 4.671537399291992, 4.941374778747559, 5.211212635040283, 5.481050491333008, 5.750887870788574, 6.020725727081299, 6.290563106536865, 6.56040096282959, 6.830238342285156, 7.100076198577881, 7.3699140548706055, 7.639751434326172, 7.9095892906188965]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 20.0, 25.0, 34.0, 41.0, 73.0, 86.0, 116.0, 183.0, 230.0, 428.0, 630.0, 972.0, 1651.0, 2943.0, 6031.0, 15129.0, 73639.0, 3932661.0, 125063.0, 19464.0, 6863.0, 3339.0, 1810.0, 964.0, 649.0, 365.0, 267.0, 167.0, 136.0, 95.0, 59.0, 28.0, 18.0, 26.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.9587631225585938, -0.9302215576171875, -0.9016799926757812, -0.873138427734375, -0.8445968627929688, -0.8160552978515625, -0.7875137329101562, -0.75897216796875, -0.7304306030273438, -0.7018890380859375, -0.6733474731445312, -0.644805908203125, -0.6162643432617188, -0.5877227783203125, -0.5591812133789062, -0.5306396484375, -0.5020980834960938, -0.4735565185546875, -0.44501495361328125, -0.416473388671875, -0.38793182373046875, -0.3593902587890625, -0.33084869384765625, -0.30230712890625, -0.27376556396484375, -0.2452239990234375, -0.21668243408203125, -0.188140869140625, -0.15959930419921875, -0.1310577392578125, -0.10251617431640625, -0.073974609375, -0.04543304443359375, -0.0168914794921875, 0.01165008544921875, 0.040191650390625, 0.06873321533203125, 0.0972747802734375, 0.12581634521484375, 0.15435791015625, 0.18289947509765625, 0.2114410400390625, 0.23998260498046875, 0.268524169921875, 0.29706573486328125, 0.3256072998046875, 0.35414886474609375, 0.3826904296875, 0.41123199462890625, 0.4397735595703125, 0.46831512451171875, 0.496856689453125, 0.5253982543945312, 0.5539398193359375, 0.5824813842773438, 0.61102294921875, 0.6395645141601562, 0.6681060791015625, 0.6966476440429688, 0.725189208984375, 0.7537307739257812, 0.7822723388671875, 0.8108139038085938, 0.83935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 6.0, 11.0, 7.0, 21.0, 14.0, 37.0, 74.0, 114.0, 182.0, 162.0, 124.0, 70.0, 47.0, 24.0, 15.0, 11.0, 9.0, 3.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.11114501953125, -0.10814285278320312, -0.10514068603515625, -0.10213851928710938, -0.0991363525390625, -0.09613418579101562, -0.09313201904296875, -0.09012985229492188, -0.087127685546875, -0.08412551879882812, -0.08112335205078125, -0.07812118530273438, -0.0751190185546875, -0.07211685180664062, -0.06911468505859375, -0.06611251831054688, -0.0631103515625, -0.060108184814453125, -0.05710601806640625, -0.054103851318359375, -0.0511016845703125, -0.048099517822265625, -0.04509735107421875, -0.042095184326171875, -0.039093017578125, -0.036090850830078125, -0.03308868408203125, -0.030086517333984375, -0.0270843505859375, -0.024082183837890625, -0.02108001708984375, -0.018077850341796875, -0.01507568359375, -0.012073516845703125, -0.00907135009765625, -0.006069183349609375, -0.0030670166015625, -6.4849853515625e-05, 0.00293731689453125, 0.005939483642578125, 0.008941650390625, 0.011943817138671875, 0.01494598388671875, 0.017948150634765625, 0.0209503173828125, 0.023952484130859375, 0.02695465087890625, 0.029956817626953125, 0.032958984375, 0.035961151123046875, 0.03896331787109375, 0.041965484619140625, 0.0449676513671875, 0.047969818115234375, 0.05097198486328125, 0.053974151611328125, 0.056976318359375, 0.059978485107421875, 0.06298065185546875, 0.06598281860351562, 0.0689849853515625, 0.07198715209960938, 0.07498931884765625, 0.07799148559570312, 0.08099365234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 13.0, 14.0, 6.0, 21.0, 17.0, 31.0, 45.0, 64.0, 109.0, 174.0, 238.0, 403.0, 693.0, 1222.0, 1987.0, 3693.0, 7436.0, 16587.0, 52951.0, 439660.0, 3497630.0, 120282.0, 28559.0, 10835.0, 5037.0, 2703.0, 1564.0, 830.0, 532.0, 333.0, 208.0, 133.0, 85.0, 59.0, 36.0, 24.0, 19.0, 15.0, 11.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.68212890625, -0.6616134643554688, -0.6410980224609375, -0.6205825805664062, -0.600067138671875, -0.5795516967773438, -0.5590362548828125, -0.5385208129882812, -0.51800537109375, -0.49748992919921875, -0.4769744873046875, -0.45645904541015625, -0.435943603515625, -0.41542816162109375, -0.3949127197265625, -0.37439727783203125, -0.3538818359375, -0.33336639404296875, -0.3128509521484375, -0.29233551025390625, -0.271820068359375, -0.25130462646484375, -0.2307891845703125, -0.21027374267578125, -0.18975830078125, -0.16924285888671875, -0.1487274169921875, -0.12821197509765625, -0.107696533203125, -0.08718109130859375, -0.0666656494140625, -0.04615020751953125, -0.025634765625, -0.00511932373046875, 0.0153961181640625, 0.03591156005859375, 0.056427001953125, 0.07694244384765625, 0.0974578857421875, 0.11797332763671875, 0.13848876953125, 0.15900421142578125, 0.1795196533203125, 0.20003509521484375, 0.220550537109375, 0.24106597900390625, 0.2615814208984375, 0.28209686279296875, 0.3026123046875, 0.32312774658203125, 0.3436431884765625, 0.36415863037109375, 0.384674072265625, 0.40518951416015625, 0.4257049560546875, 0.44622039794921875, 0.46673583984375, 0.48725128173828125, 0.5077667236328125, 0.5282821655273438, 0.548797607421875, 0.5693130493164062, 0.5898284912109375, 0.6103439331054688, 0.630859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 5.0, 4.0, 7.0, 11.0, 14.0, 14.0, 41.0, 51.0, 86.0, 166.0, 404.0, 2112.0, 618.0, 206.0, 99.0, 61.0, 33.0, 33.0, 14.0, 14.0, 13.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1583251953125, -0.15346908569335938, -0.14861297607421875, -0.14375686645507812, -0.1389007568359375, -0.13404464721679688, -0.12918853759765625, -0.12433242797851562, -0.119476318359375, -0.11462020874023438, -0.10976409912109375, -0.10490798950195312, -0.1000518798828125, -0.09519577026367188, -0.09033966064453125, -0.08548355102539062, -0.08062744140625, -0.07577133178710938, -0.07091522216796875, -0.06605911254882812, -0.0612030029296875, -0.056346893310546875, -0.05149078369140625, -0.046634674072265625, -0.041778564453125, -0.036922454833984375, -0.03206634521484375, -0.027210235595703125, -0.0223541259765625, -0.017498016357421875, -0.01264190673828125, -0.007785797119140625, -0.0029296875, 0.001926422119140625, 0.00678253173828125, 0.011638641357421875, 0.0164947509765625, 0.021350860595703125, 0.02620697021484375, 0.031063079833984375, 0.035919189453125, 0.040775299072265625, 0.04563140869140625, 0.050487518310546875, 0.0553436279296875, 0.060199737548828125, 0.06505584716796875, 0.06991195678710938, 0.07476806640625, 0.07962417602539062, 0.08448028564453125, 0.08933639526367188, 0.0941925048828125, 0.09904861450195312, 0.10390472412109375, 0.10876083374023438, 0.113616943359375, 0.11847305297851562, 0.12332916259765625, 0.12818527221679688, 0.1330413818359375, 0.13789749145507812, 0.14275360107421875, 0.14760971069335938, 0.1524658203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 9.0, 23.0, 43.0, 96.0, 260.0, 253.0, 149.0, 68.0, 42.0, 22.0, 16.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4395490288734436, -0.41229909658432007, -0.38504916429519653, -0.357799232006073, -0.33054929971694946, -0.3032993674278259, -0.27604940533638, -0.24879947304725647, -0.22154954075813293, -0.1942996084690094, -0.16704967617988586, -0.13979972898960114, -0.1125497967004776, -0.08529986441135406, -0.058049917221069336, -0.0307999849319458, -0.0035500526428222656, 0.023699883371591568, 0.0509498193860054, 0.07819975912570953, 0.10544969141483307, 0.1326996237039566, 0.15994957089424133, 0.18719950318336487, 0.2144494354724884, 0.24169936776161194, 0.2689493000507355, 0.2961992621421814, 0.32344919443130493, 0.35069912672042847, 0.377949059009552, 0.40519899129867554, 0.4324488639831543, 0.45969879627227783, 0.48694872856140137, 0.5141986608505249, 0.5414485931396484, 0.568698525428772, 0.5959484577178955, 0.623198390007019, 0.6504483222961426, 0.6776982545852661, 0.7049481868743896, 0.7321981191635132, 0.7594480514526367, 0.7866979837417603, 0.8139479160308838, 0.8411978483200073, 0.8684478402137756, 0.8956977725028992, 0.9229477047920227, 0.9501976370811462, 0.9774475693702698, 1.004697561264038, 1.0319474935531616, 1.0591974258422852, 1.0864473581314087, 1.1136972904205322, 1.1409472227096558, 1.1681971549987793, 1.1954470872879028, 1.2226970195770264, 1.24994695186615, 1.2771968841552734, 1.304446816444397]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 11.0, 8.0, 23.0, 19.0, 35.0, 49.0, 75.0, 86.0, 126.0, 107.0, 112.0, 92.0, 63.0, 58.0, 42.0, 24.0, 17.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.908355712890625, -0.8805968165397644, -0.852837860584259, -0.8250789642333984, -0.7973200678825378, -0.7695611715316772, -0.7418022155761719, -0.7140433192253113, -0.6862844228744507, -0.6585255265235901, -0.6307665705680847, -0.6030076742172241, -0.5752487778663635, -0.5474898815155029, -0.5197309255599976, -0.49197202920913696, -0.4642130732536316, -0.4364541471004486, -0.408695250749588, -0.38093632459640503, -0.35317742824554443, -0.32541850209236145, -0.29765957593917847, -0.26990067958831787, -0.2421417534351349, -0.2143828421831131, -0.1866239309310913, -0.15886500477790833, -0.13110609352588654, -0.10334718227386475, -0.07558825612068176, -0.04782934486865997, -0.020070433616638184, 0.007688481360673904, 0.03544739633798599, 0.06320631504058838, 0.09096522629261017, 0.11872413754463196, 0.14648306369781494, 0.17424197494983673, 0.20200088620185852, 0.2297597974538803, 0.2575187087059021, 0.2852776348590851, 0.31303656101226807, 0.34079545736312866, 0.36855438351631165, 0.39631330966949463, 0.4240722060203552, 0.4518311321735382, 0.4795900285243988, 0.5073489546775818, 0.5351078510284424, 0.5628668069839478, 0.5906257033348083, 0.618384599685669, 0.6461435556411743, 0.6739024519920349, 0.7016614079475403, 0.7294203042984009, 0.7571792006492615, 0.7849380970001221, 0.8126970529556274, 0.840455949306488, 0.8682148456573486]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 8.0, 11.0, 11.0, 21.0, 19.0, 34.0, 44.0, 78.0, 119.0, 152.0, 306.0, 472.0, 770.0, 1399.0, 2538.0, 4939.0, 10475.0, 27300.0, 108675.0, 639848.0, 188055.0, 36651.0, 13491.0, 6099.0, 3012.0, 1662.0, 894.0, 548.0, 302.0, 223.0, 131.0, 77.0, 46.0, 40.0, 22.0, 14.0, 19.0, 13.0, 8.0, 4.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.476318359375, -0.46172332763671875, -0.4471282958984375, -0.43253326416015625, -0.417938232421875, -0.40334320068359375, -0.3887481689453125, -0.37415313720703125, -0.35955810546875, -0.34496307373046875, -0.3303680419921875, -0.31577301025390625, -0.301177978515625, -0.28658294677734375, -0.2719879150390625, -0.25739288330078125, -0.2427978515625, -0.22820281982421875, -0.2136077880859375, -0.19901275634765625, -0.184417724609375, -0.16982269287109375, -0.1552276611328125, -0.14063262939453125, -0.12603759765625, -0.11144256591796875, -0.0968475341796875, -0.08225250244140625, -0.067657470703125, -0.05306243896484375, -0.0384674072265625, -0.02387237548828125, -0.00927734375, 0.00531768798828125, 0.0199127197265625, 0.03450775146484375, 0.049102783203125, 0.06369781494140625, 0.0782928466796875, 0.09288787841796875, 0.10748291015625, 0.12207794189453125, 0.1366729736328125, 0.15126800537109375, 0.165863037109375, 0.18045806884765625, 0.1950531005859375, 0.20964813232421875, 0.2242431640625, 0.23883819580078125, 0.2534332275390625, 0.26802825927734375, 0.282623291015625, 0.29721832275390625, 0.3118133544921875, 0.32640838623046875, 0.34100341796875, 0.35559844970703125, 0.3701934814453125, 0.38478851318359375, 0.399383544921875, 0.41397857666015625, 0.4285736083984375, 0.44316864013671875, 0.457763671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 8.0, 4.0, 1.0, 4.0, 13.0, 10.0, 10.0, 13.0, 9.0, 30.0, 41.0, 69.0, 77.0, 111.0, 124.0, 117.0, 88.0, 79.0, 43.0, 39.0, 21.0, 22.0, 12.0, 9.0, 7.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.05644989013671875, -0.0545501708984375, -0.05265045166015625, -0.050750732421875, -0.04885101318359375, -0.0469512939453125, -0.04505157470703125, -0.04315185546875, -0.04125213623046875, -0.0393524169921875, -0.03745269775390625, -0.035552978515625, -0.03365325927734375, -0.0317535400390625, -0.02985382080078125, -0.0279541015625, -0.02605438232421875, -0.0241546630859375, -0.02225494384765625, -0.020355224609375, -0.01845550537109375, -0.0165557861328125, -0.01465606689453125, -0.01275634765625, -0.01085662841796875, -0.0089569091796875, -0.00705718994140625, -0.005157470703125, -0.00325775146484375, -0.0013580322265625, 0.00054168701171875, 0.00244140625, 0.00434112548828125, 0.0062408447265625, 0.00814056396484375, 0.010040283203125, 0.01194000244140625, 0.0138397216796875, 0.01573944091796875, 0.01763916015625, 0.01953887939453125, 0.0214385986328125, 0.02333831787109375, 0.025238037109375, 0.02713775634765625, 0.0290374755859375, 0.03093719482421875, 0.0328369140625, 0.03473663330078125, 0.0366363525390625, 0.03853607177734375, 0.040435791015625, 0.04233551025390625, 0.0442352294921875, 0.04613494873046875, 0.04803466796875, 0.04993438720703125, 0.0518341064453125, 0.05373382568359375, 0.055633544921875, 0.05753326416015625, 0.0594329833984375, 0.06133270263671875, 0.063232421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 21.0, 30.0, 60.0, 102.0, 178.0, 339.0, 635.0, 1328.0, 2688.0, 5640.0, 11692.0, 25889.0, 59455.0, 143310.0, 293367.0, 275523.0, 129492.0, 53638.0, 23942.0, 11004.0, 5000.0, 2526.0, 1254.0, 618.0, 353.0, 179.0, 124.0, 58.0, 36.0, 15.0, 20.0, 6.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.225830078125, -0.21802520751953125, -0.2102203369140625, -0.20241546630859375, -0.194610595703125, -0.18680572509765625, -0.1790008544921875, -0.17119598388671875, -0.16339111328125, -0.15558624267578125, -0.1477813720703125, -0.13997650146484375, -0.132171630859375, -0.12436676025390625, -0.1165618896484375, -0.10875701904296875, -0.1009521484375, -0.09314727783203125, -0.0853424072265625, -0.07753753662109375, -0.069732666015625, -0.06192779541015625, -0.0541229248046875, -0.04631805419921875, -0.03851318359375, -0.03070831298828125, -0.0229034423828125, -0.01509857177734375, -0.007293701171875, 0.00051116943359375, 0.0083160400390625, 0.01612091064453125, 0.02392578125, 0.03173065185546875, 0.0395355224609375, 0.04734039306640625, 0.055145263671875, 0.06295013427734375, 0.0707550048828125, 0.07855987548828125, 0.08636474609375, 0.09416961669921875, 0.1019744873046875, 0.10977935791015625, 0.117584228515625, 0.12538909912109375, 0.1331939697265625, 0.14099884033203125, 0.1488037109375, 0.15660858154296875, 0.1644134521484375, 0.17221832275390625, 0.180023193359375, 0.18782806396484375, 0.1956329345703125, 0.20343780517578125, 0.21124267578125, 0.21904754638671875, 0.2268524169921875, 0.23465728759765625, 0.242462158203125, 0.25026702880859375, 0.2580718994140625, 0.26587677001953125, 0.273681640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 13.0, 9.0, 9.0, 11.0, 11.0, 8.0, 16.0, 15.0, 14.0, 14.0, 26.0, 22.0, 25.0, 36.0, 25.0, 24.0, 29.0, 33.0, 33.0, 30.0, 41.0, 35.0, 30.0, 47.0, 39.0, 40.0, 30.0, 26.0, 32.0, 21.0, 27.0, 30.0, 23.0, 20.0, 17.0, 19.0, 12.0, 16.0, 9.0, 14.0, 14.0, 8.0, 7.0, 6.0, 5.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1827392578125, -0.17677688598632812, -0.17081451416015625, -0.16485214233398438, -0.1588897705078125, -0.15292739868164062, -0.14696502685546875, -0.14100265502929688, -0.135040283203125, -0.12907791137695312, -0.12311553955078125, -0.11715316772460938, -0.1111907958984375, -0.10522842407226562, -0.09926605224609375, -0.09330368041992188, -0.08734130859375, -0.08137893676757812, -0.07541656494140625, -0.06945419311523438, -0.0634918212890625, -0.057529449462890625, -0.05156707763671875, -0.045604705810546875, -0.039642333984375, -0.033679962158203125, -0.02771759033203125, -0.021755218505859375, -0.0157928466796875, -0.009830474853515625, -0.00386810302734375, 0.002094268798828125, 0.008056640625, 0.014019012451171875, 0.01998138427734375, 0.025943756103515625, 0.0319061279296875, 0.037868499755859375, 0.04383087158203125, 0.049793243408203125, 0.055755615234375, 0.061717987060546875, 0.06768035888671875, 0.07364273071289062, 0.0796051025390625, 0.08556747436523438, 0.09152984619140625, 0.09749221801757812, 0.10345458984375, 0.10941696166992188, 0.11537933349609375, 0.12134170532226562, 0.1273040771484375, 0.13326644897460938, 0.13922882080078125, 0.14519119262695312, 0.151153564453125, 0.15711593627929688, 0.16307830810546875, 0.16904067993164062, 0.1750030517578125, 0.18096542358398438, 0.18692779541015625, 0.19289016723632812, 0.1988525390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 15.0, 12.0, 15.0, 19.0, 41.0, 59.0, 103.0, 197.0, 572.0, 2089.0, 26256.0, 1006044.0, 10960.0, 1366.0, 418.0, 152.0, 76.0, 44.0, 31.0, 17.0, 14.0, 11.0, 12.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3192901611328125, -1.277252197265625, -1.2352142333984375, -1.19317626953125, -1.1511383056640625, -1.109100341796875, -1.0670623779296875, -1.0250244140625, -0.9829864501953125, -0.940948486328125, -0.8989105224609375, -0.85687255859375, -0.8148345947265625, -0.772796630859375, -0.7307586669921875, -0.688720703125, -0.6466827392578125, -0.604644775390625, -0.5626068115234375, -0.52056884765625, -0.4785308837890625, -0.436492919921875, -0.3944549560546875, -0.3524169921875, -0.3103790283203125, -0.268341064453125, -0.2263031005859375, -0.18426513671875, -0.1422271728515625, -0.100189208984375, -0.0581512451171875, -0.01611328125, 0.0259246826171875, 0.067962646484375, 0.1100006103515625, 0.15203857421875, 0.1940765380859375, 0.236114501953125, 0.2781524658203125, 0.3201904296875, 0.3622283935546875, 0.404266357421875, 0.4463043212890625, 0.48834228515625, 0.5303802490234375, 0.572418212890625, 0.6144561767578125, 0.656494140625, 0.6985321044921875, 0.740570068359375, 0.7826080322265625, 0.82464599609375, 0.8666839599609375, 0.908721923828125, 0.9507598876953125, 0.9927978515625, 1.0348358154296875, 1.076873779296875, 1.1189117431640625, 1.16094970703125, 1.2029876708984375, 1.245025634765625, 1.2870635986328125, 1.3291015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 3.0, 8.0, 5.0, 11.0, 15.0, 18.0, 17.0, 31.0, 34.0, 73.0, 85.0, 98.0, 119.0, 117.0, 103.0, 54.0, 44.0, 29.0, 32.0, 18.0, 26.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.479024887084961e-05, -6.268173456192017e-05, -6.057322025299072e-05, -5.846470594406128e-05, -5.6356191635131836e-05, -5.424767732620239e-05, -5.213916301727295e-05, -5.0030648708343506e-05, -4.792213439941406e-05, -4.581362009048462e-05, -4.3705105781555176e-05, -4.159659147262573e-05, -3.948807716369629e-05, -3.7379562854766846e-05, -3.52710485458374e-05, -3.316253423690796e-05, -3.1054019927978516e-05, -2.8945505619049072e-05, -2.683699131011963e-05, -2.4728477001190186e-05, -2.2619962692260742e-05, -2.05114483833313e-05, -1.8402934074401855e-05, -1.6294419765472412e-05, -1.4185905456542969e-05, -1.2077391147613525e-05, -9.968876838684082e-06, -7.860362529754639e-06, -5.751848220825195e-06, -3.643333911895752e-06, -1.5348196029663086e-06, 5.736947059631348e-07, 2.682209014892578e-06, 4.7907233238220215e-06, 6.899237632751465e-06, 9.007751941680908e-06, 1.1116266250610352e-05, 1.3224780559539795e-05, 1.5333294868469238e-05, 1.744180917739868e-05, 1.9550323486328125e-05, 2.165883779525757e-05, 2.3767352104187012e-05, 2.5875866413116455e-05, 2.79843807220459e-05, 3.0092895030975342e-05, 3.2201409339904785e-05, 3.430992364883423e-05, 3.641843795776367e-05, 3.8526952266693115e-05, 4.063546657562256e-05, 4.2743980884552e-05, 4.4852495193481445e-05, 4.696100950241089e-05, 4.906952381134033e-05, 5.1178038120269775e-05, 5.328655242919922e-05, 5.539506673812866e-05, 5.7503581047058105e-05, 5.961209535598755e-05, 6.172060966491699e-05, 6.382912397384644e-05, 6.593763828277588e-05, 6.804615259170532e-05, 7.015466690063477e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 6.0, 19.0, 24.0, 24.0, 54.0, 68.0, 93.0, 145.0, 196.0, 254.0, 458.0, 656.0, 997.0, 1659.0, 2670.0, 4762.0, 9175.0, 22628.0, 170903.0, 732382.0, 69011.0, 15628.0, 7165.0, 3706.0, 2121.0, 1272.0, 826.0, 533.0, 342.0, 235.0, 147.0, 130.0, 80.0, 43.0, 30.0, 31.0, 16.0, 16.0, 12.0, 7.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3892631530761719, -0.37642669677734375, -0.3635902404785156, -0.3507537841796875, -0.3379173278808594, -0.32508087158203125, -0.3122444152832031, -0.299407958984375, -0.2865715026855469, -0.27373504638671875, -0.2608985900878906, -0.2480621337890625, -0.23522567749023438, -0.22238922119140625, -0.20955276489257812, -0.19671630859375, -0.18387985229492188, -0.17104339599609375, -0.15820693969726562, -0.1453704833984375, -0.13253402709960938, -0.11969757080078125, -0.10686111450195312, -0.094024658203125, -0.08118820190429688, -0.06835174560546875, -0.055515289306640625, -0.0426788330078125, -0.029842376708984375, -0.01700592041015625, -0.004169464111328125, 0.0086669921875, 0.021503448486328125, 0.03433990478515625, 0.047176361083984375, 0.0600128173828125, 0.07284927368164062, 0.08568572998046875, 0.09852218627929688, 0.111358642578125, 0.12419509887695312, 0.13703155517578125, 0.14986801147460938, 0.1627044677734375, 0.17554092407226562, 0.18837738037109375, 0.20121383666992188, 0.21405029296875, 0.22688674926757812, 0.23972320556640625, 0.2525596618652344, 0.2653961181640625, 0.2782325744628906, 0.29106903076171875, 0.3039054870605469, 0.316741943359375, 0.3295783996582031, 0.34241485595703125, 0.3552513122558594, 0.3680877685546875, 0.3809242248535156, 0.39376068115234375, 0.4065971374511719, 0.41943359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 6.0, 14.0, 15.0, 26.0, 64.0, 124.0, 211.0, 201.0, 151.0, 72.0, 20.0, 15.0, 12.0, 10.0, 5.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4139518737792969, -0.39968109130859375, -0.3854103088378906, -0.3711395263671875, -0.3568687438964844, -0.34259796142578125, -0.3283271789550781, -0.314056396484375, -0.2997856140136719, -0.28551483154296875, -0.2712440490722656, -0.2569732666015625, -0.24270248413085938, -0.22843170166015625, -0.21416091918945312, -0.19989013671875, -0.18561935424804688, -0.17134857177734375, -0.15707778930664062, -0.1428070068359375, -0.12853622436523438, -0.11426544189453125, -0.09999465942382812, -0.085723876953125, -0.07145309448242188, -0.05718231201171875, -0.042911529541015625, -0.0286407470703125, -0.014369964599609375, -9.918212890625e-05, 0.014171600341796875, 0.0284423828125, 0.042713165283203125, 0.05698394775390625, 0.07125473022460938, 0.0855255126953125, 0.09979629516601562, 0.11406707763671875, 0.12833786010742188, 0.142608642578125, 0.15687942504882812, 0.17115020751953125, 0.18542098999023438, 0.1996917724609375, 0.21396255493164062, 0.22823333740234375, 0.24250411987304688, 0.25677490234375, 0.2710456848144531, 0.28531646728515625, 0.2995872497558594, 0.3138580322265625, 0.3281288146972656, 0.34239959716796875, 0.3566703796386719, 0.370941162109375, 0.3852119445800781, 0.39948272705078125, 0.4137535095214844, 0.4280242919921875, 0.4422950744628906, 0.45656585693359375, 0.4708366394042969, 0.485107421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 13.0, 14.0, 18.0, 41.0, 88.0, 172.0, 232.0, 189.0, 87.0, 48.0, 39.0, 15.0, 6.0, 10.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7499608993530273, -1.6612286567687988, -1.5724964141845703, -1.4837641716003418, -1.3950319290161133, -1.3062996864318848, -1.2175674438476562, -1.1288352012634277, -1.0401029586791992, -0.9513707160949707, -0.8626384735107422, -0.7739062309265137, -0.6851739883422852, -0.5964417457580566, -0.5077094435691833, -0.41897720098495483, -0.33024489879608154, -0.24151265621185303, -0.15278039872646332, -0.06404814124107361, 0.024684101343154907, 0.11341634392738342, 0.20214861631393433, 0.29088085889816284, 0.37961310148239136, 0.4683453440666199, 0.5570775866508484, 0.6458098888397217, 0.7345421314239502, 0.8232743740081787, 0.9120066165924072, 1.0007388591766357, 1.0894711017608643, 1.1782033443450928, 1.2669355869293213, 1.3556678295135498, 1.4444000720977783, 1.5331323146820068, 1.6218645572662354, 1.7105967998504639, 1.7993290424346924, 1.888061285018921, 1.9767935276031494, 2.065525770187378, 2.1542580127716064, 2.242990255355835, 2.3317224979400635, 2.420454740524292, 2.5091872215270996, 2.597919464111328, 2.6866517066955566, 2.775383949279785, 2.8641161918640137, 2.952848434448242, 3.0415806770324707, 3.130312919616699, 3.2190451622009277, 3.3077774047851562, 3.3965096473693848, 3.4852418899536133, 3.573974132537842, 3.6627063751220703, 3.751438617706299, 3.8401708602905273, 3.928903102874756]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 12.0, 7.0, 12.0, 17.0, 35.0, 38.0, 43.0, 78.0, 84.0, 97.0, 95.0, 112.0, 95.0, 68.0, 46.0, 39.0, 31.0, 21.0, 14.0, 11.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0156478881835938, -2.9194695949554443, -2.823291301727295, -2.7271127700805664, -2.630934476852417, -2.5347561836242676, -2.438577890396118, -2.3423995971679688, -2.2462210655212402, -2.150042772293091, -2.0538644790649414, -1.9576860666275024, -1.8615076541900635, -1.765329360961914, -1.6691510677337646, -1.5729726552963257, -1.4767943620681763, -1.3806160688400269, -1.284437656402588, -1.1882593631744385, -1.0920809507369995, -0.9959026575088501, -0.8997243046760559, -0.8035459518432617, -0.7073675990104675, -0.6111892461776733, -0.5150108933448792, -0.41883257031440735, -0.32265421748161316, -0.22647586464881897, -0.13029754161834717, -0.03411918878555298, 0.06205916404724121, 0.1582375168800354, 0.2544158697128296, 0.3505941927433014, 0.4467725455760956, 0.5429508686065674, 0.6391292214393616, 0.7353075742721558, 0.83148592710495, 0.9276642799377441, 1.0238425731658936, 1.1200209856033325, 1.216199278831482, 1.312377691268921, 1.4085559844970703, 1.5047342777252197, 1.6009126901626587, 1.697090983390808, 1.793269395828247, 1.8894476890563965, 1.9856261014938354, 2.0818045139312744, 2.177982807159424, 2.2741611003875732, 2.3703393936157227, 2.466517686843872, 2.5626959800720215, 2.65887451171875, 2.7550528049468994, 2.851231098175049, 2.9474093914031982, 3.0435876846313477, 3.139766216278076]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 8.0, 8.0, 15.0, 22.0, 23.0, 42.0, 45.0, 63.0, 73.0, 120.0, 138.0, 225.0, 271.0, 404.0, 514.0, 802.0, 1154.0, 1748.0, 2934.0, 5463.0, 11340.0, 29159.0, 127369.0, 3656487.0, 281260.0, 42271.0, 14787.0, 6792.0, 3657.0, 2175.0, 1383.0, 970.0, 695.0, 486.0, 374.0, 278.0, 195.0, 129.0, 109.0, 78.0, 49.0, 46.0, 35.0, 24.0, 12.0, 10.0, 5.0, 8.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7509765625, -0.7279815673828125, -0.704986572265625, -0.6819915771484375, -0.65899658203125, -0.6360015869140625, -0.613006591796875, -0.5900115966796875, -0.5670166015625, -0.5440216064453125, -0.521026611328125, -0.4980316162109375, -0.47503662109375, -0.4520416259765625, -0.429046630859375, -0.4060516357421875, -0.383056640625, -0.3600616455078125, -0.337066650390625, -0.3140716552734375, -0.29107666015625, -0.2680816650390625, -0.245086669921875, -0.2220916748046875, -0.1990966796875, -0.1761016845703125, -0.153106689453125, -0.1301116943359375, -0.10711669921875, -0.0841217041015625, -0.061126708984375, -0.0381317138671875, -0.01513671875, 0.0078582763671875, 0.030853271484375, 0.0538482666015625, 0.07684326171875, 0.0998382568359375, 0.122833251953125, 0.1458282470703125, 0.1688232421875, 0.1918182373046875, 0.214813232421875, 0.2378082275390625, 0.26080322265625, 0.2837982177734375, 0.306793212890625, 0.3297882080078125, 0.352783203125, 0.3757781982421875, 0.398773193359375, 0.4217681884765625, 0.44476318359375, 0.4677581787109375, 0.490753173828125, 0.5137481689453125, 0.5367431640625, 0.5597381591796875, 0.582733154296875, 0.6057281494140625, 0.62872314453125, 0.6517181396484375, 0.674713134765625, 0.6977081298828125, 0.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 10.0, 7.0, 7.0, 17.0, 15.0, 23.0, 45.0, 46.0, 75.0, 73.0, 89.0, 99.0, 100.0, 80.0, 68.0, 54.0, 26.0, 30.0, 15.0, 14.0, 14.0, 15.0, 5.0, 8.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0604248046875, -0.05862998962402344, -0.056835174560546875, -0.05504035949707031, -0.05324554443359375, -0.05145072937011719, -0.049655914306640625, -0.04786109924316406, -0.0460662841796875, -0.04427146911621094, -0.042476654052734375, -0.04068183898925781, -0.03888702392578125, -0.03709220886230469, -0.035297393798828125, -0.03350257873535156, -0.031707763671875, -0.029912948608398438, -0.028118133544921875, -0.026323318481445312, -0.02452850341796875, -0.022733688354492188, -0.020938873291015625, -0.019144058227539062, -0.0173492431640625, -0.015554428100585938, -0.013759613037109375, -0.011964797973632812, -0.01016998291015625, -0.008375167846679688, -0.006580352783203125, -0.0047855377197265625, -0.00299072265625, -0.0011959075927734375, 0.000598907470703125, 0.0023937225341796875, 0.00418853759765625, 0.0059833526611328125, 0.007778167724609375, 0.009572982788085938, 0.0113677978515625, 0.013162612915039062, 0.014957427978515625, 0.016752243041992188, 0.01854705810546875, 0.020341873168945312, 0.022136688232421875, 0.023931503295898438, 0.025726318359375, 0.027521133422851562, 0.029315948486328125, 0.031110763549804688, 0.03290557861328125, 0.03470039367675781, 0.036495208740234375, 0.03829002380371094, 0.0400848388671875, 0.04187965393066406, 0.043674468994140625, 0.04546928405761719, 0.04726409912109375, 0.04905891418457031, 0.050853729248046875, 0.05264854431152344, 0.054443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 17.0, 21.0, 48.0, 78.0, 189.0, 707.0, 6484.0, 4006361.0, 177178.0, 2511.0, 396.0, 122.0, 73.0, 31.0, 11.0, 15.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.1962890625, -2.095703125, -1.9951171875, -1.89453125, -1.7939453125, -1.693359375, -1.5927734375, -1.4921875, -1.3916015625, -1.291015625, -1.1904296875, -1.08984375, -0.9892578125, -0.888671875, -0.7880859375, -0.6875, -0.5869140625, -0.486328125, -0.3857421875, -0.28515625, -0.1845703125, -0.083984375, 0.0166015625, 0.1171875, 0.2177734375, 0.318359375, 0.4189453125, 0.51953125, 0.6201171875, 0.720703125, 0.8212890625, 0.921875, 1.0224609375, 1.123046875, 1.2236328125, 1.32421875, 1.4248046875, 1.525390625, 1.6259765625, 1.7265625, 1.8271484375, 1.927734375, 2.0283203125, 2.12890625, 2.2294921875, 2.330078125, 2.4306640625, 2.53125, 2.6318359375, 2.732421875, 2.8330078125, 2.93359375, 3.0341796875, 3.134765625, 3.2353515625, 3.3359375, 3.4365234375, 3.537109375, 3.6376953125, 3.73828125, 3.8388671875, 3.939453125, 4.0400390625, 4.140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 14.0, 17.0, 21.0, 49.0, 93.0, 179.0, 503.0, 2112.0, 636.0, 191.0, 99.0, 56.0, 33.0, 20.0, 8.0, 10.0, 5.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.300537109375, -0.2936420440673828, -0.2867469787597656, -0.27985191345214844, -0.27295684814453125, -0.26606178283691406, -0.2591667175292969, -0.2522716522216797, -0.2453765869140625, -0.2384815216064453, -0.23158645629882812, -0.22469139099121094, -0.21779632568359375, -0.21090126037597656, -0.20400619506835938, -0.1971111297607422, -0.190216064453125, -0.1833209991455078, -0.17642593383789062, -0.16953086853027344, -0.16263580322265625, -0.15574073791503906, -0.14884567260742188, -0.1419506072998047, -0.1350555419921875, -0.1281604766845703, -0.12126541137695312, -0.11437034606933594, -0.10747528076171875, -0.10058021545410156, -0.09368515014648438, -0.08679008483886719, -0.07989501953125, -0.07299995422363281, -0.06610488891601562, -0.05920982360839844, -0.05231475830078125, -0.04541969299316406, -0.038524627685546875, -0.03162956237792969, -0.0247344970703125, -0.017839431762695312, -0.010944366455078125, -0.0040493011474609375, 0.00284576416015625, 0.009740829467773438, 0.016635894775390625, 0.023530960083007812, 0.030426025390625, 0.03732109069824219, 0.044216156005859375, 0.05111122131347656, 0.05800628662109375, 0.06490135192871094, 0.07179641723632812, 0.07869148254394531, 0.0855865478515625, 0.09248161315917969, 0.09937667846679688, 0.10627174377441406, 0.11316680908203125, 0.12006187438964844, 0.12695693969726562, 0.1338520050048828, 0.1407470703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 15.0, 32.0, 49.0, 103.0, 197.0, 264.0, 181.0, 85.0, 30.0, 16.0, 4.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7906152606010437, -0.7568397521972656, -0.7230641841888428, -0.6892886757850647, -0.6555131673812866, -0.6217376589775085, -0.5879621505737305, -0.5541865825653076, -0.5204110741615295, -0.48663556575775146, -0.452860027551651, -0.41908448934555054, -0.38530898094177246, -0.3515334725379944, -0.3177579343318939, -0.28398239612579346, -0.2502068877220154, -0.2164313644170761, -0.18265584111213684, -0.14888031780719757, -0.1151047945022583, -0.08132927119731903, -0.04755374789237976, -0.01377822458744049, 0.01999729871749878, 0.05377282202243805, 0.08754834532737732, 0.12132386863231659, 0.15509939193725586, 0.18887491524219513, 0.2226504385471344, 0.25642597675323486, 0.29020142555236816, 0.32397693395614624, 0.3577524721622467, 0.39152801036834717, 0.42530351877212524, 0.4590790271759033, 0.4928545653820038, 0.5266301035881042, 0.5604056119918823, 0.5941811203956604, 0.6279566287994385, 0.6617321968078613, 0.6955077052116394, 0.7292832136154175, 0.7630587816238403, 0.7968342900276184, 0.8306097984313965, 0.8643853068351746, 0.8981608152389526, 0.9319363832473755, 0.9657118916511536, 0.9994874000549316, 1.0332629680633545, 1.0670384168624878, 1.1008139848709106, 1.1345895528793335, 1.1683650016784668, 1.2021405696868896, 1.2359161376953125, 1.2696915864944458, 1.3034671545028687, 1.337242603302002, 1.3710181713104248]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 15.0, 17.0, 28.0, 29.0, 42.0, 56.0, 77.0, 85.0, 109.0, 98.0, 75.0, 73.0, 75.0, 57.0, 36.0, 35.0, 20.0, 14.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0533130168914795, -1.0257294178009033, -0.9981458187103271, -0.970562219619751, -0.9429786205291748, -0.9153950214385986, -0.8878114223480225, -0.8602278232574463, -0.8326442241668701, -0.805060625076294, -0.7774770259857178, -0.7498934268951416, -0.7223098278045654, -0.6947262287139893, -0.6671426296234131, -0.6395590305328369, -0.6119754910469055, -0.5843918919563293, -0.5568082928657532, -0.529224693775177, -0.5016410946846008, -0.47405749559402466, -0.4464739263057709, -0.4188903272151947, -0.39130672812461853, -0.36372312903404236, -0.3361395299434662, -0.3085559606552124, -0.28097236156463623, -0.25338876247406006, -0.2258051633834839, -0.19822156429290771, -0.17063796520233154, -0.14305436611175537, -0.1154707744717598, -0.08788718283176422, -0.06030358374118805, -0.03271998465061188, -0.005136400461196899, 0.022447198629379272, 0.050030797719955444, 0.07761439681053162, 0.10519798845052719, 0.13278158009052277, 0.16036517918109894, 0.1879487782716751, 0.2155323624610901, 0.24311596155166626, 0.27069956064224243, 0.2982831597328186, 0.3258667588233948, 0.35345035791397095, 0.3810339570045471, 0.4086175560951233, 0.4362011253833771, 0.46378472447395325, 0.4913683235645294, 0.5189518928527832, 0.5465354919433594, 0.5741190910339355, 0.6017026901245117, 0.6292862892150879, 0.6568698883056641, 0.6844534873962402, 0.7120370864868164]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 7.0, 6.0, 7.0, 15.0, 20.0, 18.0, 12.0, 20.0, 28.0, 22.0, 36.0, 36.0, 43.0, 68.0, 128.0, 480.0, 4972.0, 621346.0, 416257.0, 4107.0, 487.0, 117.0, 58.0, 46.0, 26.0, 32.0, 30.0, 30.0, 25.0, 15.0, 10.0, 8.0, 9.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7392578125, -1.68121337890625, -1.6231689453125, -1.56512451171875, -1.507080078125, -1.44903564453125, -1.3909912109375, -1.33294677734375, -1.27490234375, -1.21685791015625, -1.1588134765625, -1.10076904296875, -1.042724609375, -0.98468017578125, -0.9266357421875, -0.86859130859375, -0.810546875, -0.75250244140625, -0.6944580078125, -0.63641357421875, -0.578369140625, -0.52032470703125, -0.4622802734375, -0.40423583984375, -0.34619140625, -0.28814697265625, -0.2301025390625, -0.17205810546875, -0.114013671875, -0.05596923828125, 0.0020751953125, 0.06011962890625, 0.1181640625, 0.17620849609375, 0.2342529296875, 0.29229736328125, 0.350341796875, 0.40838623046875, 0.4664306640625, 0.52447509765625, 0.58251953125, 0.64056396484375, 0.6986083984375, 0.75665283203125, 0.814697265625, 0.87274169921875, 0.9307861328125, 0.98883056640625, 1.046875, 1.10491943359375, 1.1629638671875, 1.22100830078125, 1.279052734375, 1.33709716796875, 1.3951416015625, 1.45318603515625, 1.51123046875, 1.56927490234375, 1.6273193359375, 1.68536376953125, 1.743408203125, 1.80145263671875, 1.8594970703125, 1.91754150390625, 1.9755859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 11.0, 52.0, 126.0, 271.0, 307.0, 157.0, 51.0, 18.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3176288604736328, -0.3115272521972656, -0.30542564392089844, -0.29932403564453125, -0.29322242736816406, -0.2871208190917969, -0.2810192108154297, -0.2749176025390625, -0.2688159942626953, -0.2627143859863281, -0.25661277770996094, -0.25051116943359375, -0.24440956115722656, -0.23830795288085938, -0.2322063446044922, -0.226104736328125, -0.2200031280517578, -0.21390151977539062, -0.20779991149902344, -0.20169830322265625, -0.19559669494628906, -0.18949508666992188, -0.1833934783935547, -0.1772918701171875, -0.1711902618408203, -0.16508865356445312, -0.15898704528808594, -0.15288543701171875, -0.14678382873535156, -0.14068222045898438, -0.1345806121826172, -0.12847900390625, -0.12237739562988281, -0.11627578735351562, -0.11017417907714844, -0.10407257080078125, -0.09797096252441406, -0.09186935424804688, -0.08576774597167969, -0.0796661376953125, -0.07356452941894531, -0.06746292114257812, -0.06136131286621094, -0.05525970458984375, -0.04915809631347656, -0.043056488037109375, -0.03695487976074219, -0.030853271484375, -0.024751663208007812, -0.018650054931640625, -0.012548446655273438, -0.00644683837890625, -0.0003452301025390625, 0.005756378173828125, 0.011857986450195312, 0.0179595947265625, 0.024061203002929688, 0.030162811279296875, 0.03626441955566406, 0.04236602783203125, 0.04846763610839844, 0.054569244384765625, 0.06067085266113281, 0.0667724609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 11.0, 11.0, 13.0, 11.0, 23.0, 30.0, 39.0, 64.0, 58.0, 90.0, 159.0, 271.0, 457.0, 962.0, 2161.0, 5278.0, 14657.0, 44481.0, 168924.0, 480036.0, 239904.0, 60565.0, 18618.0, 6506.0, 2618.0, 1225.0, 542.0, 294.0, 165.0, 99.0, 79.0, 46.0, 39.0, 32.0, 27.0, 15.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4399528503417969, -0.42458343505859375, -0.4092140197753906, -0.3938446044921875, -0.3784751892089844, -0.36310577392578125, -0.3477363586425781, -0.332366943359375, -0.3169975280761719, -0.30162811279296875, -0.2862586975097656, -0.2708892822265625, -0.2555198669433594, -0.24015045166015625, -0.22478103637695312, -0.20941162109375, -0.19404220581054688, -0.17867279052734375, -0.16330337524414062, -0.1479339599609375, -0.13256454467773438, -0.11719512939453125, -0.10182571411132812, -0.086456298828125, -0.07108688354492188, -0.05571746826171875, -0.040348052978515625, -0.0249786376953125, -0.009609222412109375, 0.00576019287109375, 0.021129608154296875, 0.0364990234375, 0.051868438720703125, 0.06723785400390625, 0.08260726928710938, 0.0979766845703125, 0.11334609985351562, 0.12871551513671875, 0.14408493041992188, 0.159454345703125, 0.17482376098632812, 0.19019317626953125, 0.20556259155273438, 0.2209320068359375, 0.23630142211914062, 0.25167083740234375, 0.2670402526855469, 0.28240966796875, 0.2977790832519531, 0.31314849853515625, 0.3285179138183594, 0.3438873291015625, 0.3592567443847656, 0.37462615966796875, 0.3899955749511719, 0.405364990234375, 0.4207344055175781, 0.43610382080078125, 0.4514732360839844, 0.4668426513671875, 0.4822120666503906, 0.49758148193359375, 0.5129508972167969, 0.5283203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 10.0, 5.0, 13.0, 11.0, 13.0, 9.0, 21.0, 24.0, 25.0, 31.0, 40.0, 35.0, 28.0, 37.0, 46.0, 53.0, 43.0, 49.0, 41.0, 47.0, 45.0, 40.0, 44.0, 43.0, 31.0, 37.0, 26.0, 26.0, 27.0, 15.0, 14.0, 12.0, 12.0, 12.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.303466796875, -0.2940330505371094, -0.28459930419921875, -0.2751655578613281, -0.2657318115234375, -0.2562980651855469, -0.24686431884765625, -0.23743057250976562, -0.227996826171875, -0.21856307983398438, -0.20912933349609375, -0.19969558715820312, -0.1902618408203125, -0.18082809448242188, -0.17139434814453125, -0.16196060180664062, -0.15252685546875, -0.14309310913085938, -0.13365936279296875, -0.12422561645507812, -0.1147918701171875, -0.10535812377929688, -0.09592437744140625, -0.08649063110351562, -0.077056884765625, -0.06762313842773438, -0.05818939208984375, -0.048755645751953125, -0.0393218994140625, -0.029888153076171875, -0.02045440673828125, -0.011020660400390625, -0.0015869140625, 0.007846832275390625, 0.01728057861328125, 0.026714324951171875, 0.0361480712890625, 0.045581817626953125, 0.05501556396484375, 0.06444931030273438, 0.073883056640625, 0.08331680297851562, 0.09275054931640625, 0.10218429565429688, 0.1116180419921875, 0.12105178833007812, 0.13048553466796875, 0.13991928100585938, 0.14935302734375, 0.15878677368164062, 0.16822052001953125, 0.17765426635742188, 0.1870880126953125, 0.19652175903320312, 0.20595550537109375, 0.21538925170898438, 0.224822998046875, 0.23425674438476562, 0.24369049072265625, 0.2531242370605469, 0.2625579833984375, 0.2719917297363281, 0.28142547607421875, 0.2908592224121094, 0.30029296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 4.0, 15.0, 18.0, 24.0, 39.0, 71.0, 126.0, 206.0, 372.0, 811.0, 2125.0, 7493.0, 39120.0, 376623.0, 548305.0, 58624.0, 9966.0, 2592.0, 1003.0, 452.0, 247.0, 107.0, 81.0, 35.0, 34.0, 14.0, 12.0, 8.0, 6.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.44873046875, -0.4338226318359375, -0.418914794921875, -0.4040069580078125, -0.38909912109375, -0.3741912841796875, -0.359283447265625, -0.3443756103515625, -0.3294677734375, -0.3145599365234375, -0.299652099609375, -0.2847442626953125, -0.26983642578125, -0.2549285888671875, -0.240020751953125, -0.2251129150390625, -0.210205078125, -0.1952972412109375, -0.180389404296875, -0.1654815673828125, -0.15057373046875, -0.1356658935546875, -0.120758056640625, -0.1058502197265625, -0.0909423828125, -0.0760345458984375, -0.061126708984375, -0.0462188720703125, -0.03131103515625, -0.0164031982421875, -0.001495361328125, 0.0134124755859375, 0.0283203125, 0.0432281494140625, 0.058135986328125, 0.0730438232421875, 0.08795166015625, 0.1028594970703125, 0.117767333984375, 0.1326751708984375, 0.1475830078125, 0.1624908447265625, 0.177398681640625, 0.1923065185546875, 0.20721435546875, 0.2221221923828125, 0.237030029296875, 0.2519378662109375, 0.266845703125, 0.2817535400390625, 0.296661376953125, 0.3115692138671875, 0.32647705078125, 0.3413848876953125, 0.356292724609375, 0.3712005615234375, 0.3861083984375, 0.4010162353515625, 0.415924072265625, 0.4308319091796875, 0.44573974609375, 0.4606475830078125, 0.475555419921875, 0.4904632568359375, 0.50537109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 8.0, 14.0, 11.0, 13.0, 15.0, 27.0, 36.0, 37.0, 48.0, 65.0, 68.0, 72.0, 75.0, 74.0, 69.0, 49.0, 57.0, 43.0, 40.0, 22.0, 33.0, 28.0, 19.0, 10.0, 13.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.266334533691406e-05, -3.144238144159317e-05, -3.0221417546272278e-05, -2.9000453650951385e-05, -2.7779489755630493e-05, -2.65585258603096e-05, -2.533756196498871e-05, -2.4116598069667816e-05, -2.2895634174346924e-05, -2.167467027902603e-05, -2.045370638370514e-05, -1.9232742488384247e-05, -1.8011778593063354e-05, -1.6790814697742462e-05, -1.556985080242157e-05, -1.4348886907100677e-05, -1.3127923011779785e-05, -1.1906959116458893e-05, -1.0685995221138e-05, -9.465031325817108e-06, -8.244067430496216e-06, -7.0231035351753235e-06, -5.802139639854431e-06, -4.581175744533539e-06, -3.3602118492126465e-06, -2.139247953891754e-06, -9.182840585708618e-07, 3.026798367500305e-07, 1.5236437320709229e-06, 2.744607627391815e-06, 3.9655715227127075e-06, 5.1865354180336e-06, 6.407499313354492e-06, 7.6284632086753845e-06, 8.849427103996277e-06, 1.007039099931717e-05, 1.1291354894638062e-05, 1.2512318789958954e-05, 1.3733282685279846e-05, 1.4954246580600739e-05, 1.617521047592163e-05, 1.7396174371242523e-05, 1.8617138266563416e-05, 1.9838102161884308e-05, 2.10590660572052e-05, 2.2280029952526093e-05, 2.3500993847846985e-05, 2.4721957743167877e-05, 2.594292163848877e-05, 2.7163885533809662e-05, 2.8384849429130554e-05, 2.9605813324451447e-05, 3.082677721977234e-05, 3.204774111509323e-05, 3.3268705010414124e-05, 3.4489668905735016e-05, 3.571063280105591e-05, 3.69315966963768e-05, 3.815256059169769e-05, 3.9373524487018585e-05, 4.059448838233948e-05, 4.181545227766037e-05, 4.303641617298126e-05, 4.4257380068302155e-05, 4.547834396362305e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 7.0, 17.0, 23.0, 37.0, 59.0, 106.0, 219.0, 402.0, 769.0, 1852.0, 4938.0, 16722.0, 88881.0, 640518.0, 246410.0, 33682.0, 8567.0, 2928.0, 1226.0, 536.0, 276.0, 151.0, 89.0, 41.0, 36.0, 16.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.68115234375, -0.6644287109375, -0.647705078125, -0.6309814453125, -0.6142578125, -0.5975341796875, -0.580810546875, -0.5640869140625, -0.54736328125, -0.5306396484375, -0.513916015625, -0.4971923828125, -0.48046875, -0.4637451171875, -0.447021484375, -0.4302978515625, -0.41357421875, -0.3968505859375, -0.380126953125, -0.3634033203125, -0.3466796875, -0.3299560546875, -0.313232421875, -0.2965087890625, -0.27978515625, -0.2630615234375, -0.246337890625, -0.2296142578125, -0.212890625, -0.1961669921875, -0.179443359375, -0.1627197265625, -0.14599609375, -0.1292724609375, -0.112548828125, -0.0958251953125, -0.0791015625, -0.0623779296875, -0.045654296875, -0.0289306640625, -0.01220703125, 0.0045166015625, 0.021240234375, 0.0379638671875, 0.0546875, 0.0714111328125, 0.088134765625, 0.1048583984375, 0.12158203125, 0.1383056640625, 0.155029296875, 0.1717529296875, 0.1884765625, 0.2052001953125, 0.221923828125, 0.2386474609375, 0.25537109375, 0.2720947265625, 0.288818359375, 0.3055419921875, 0.322265625, 0.3389892578125, 0.355712890625, 0.3724365234375, 0.38916015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 4.0, 8.0, 11.0, 15.0, 21.0, 41.0, 60.0, 86.0, 100.0, 92.0, 108.0, 121.0, 99.0, 72.0, 42.0, 32.0, 19.0, 19.0, 14.0, 8.0, 9.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349853515625, -0.3402214050292969, -0.33058929443359375, -0.3209571838378906, -0.3113250732421875, -0.3016929626464844, -0.29206085205078125, -0.2824287414550781, -0.272796630859375, -0.2631645202636719, -0.25353240966796875, -0.24390029907226562, -0.2342681884765625, -0.22463607788085938, -0.21500396728515625, -0.20537185668945312, -0.19573974609375, -0.18610763549804688, -0.17647552490234375, -0.16684341430664062, -0.1572113037109375, -0.14757919311523438, -0.13794708251953125, -0.12831497192382812, -0.118682861328125, -0.10905075073242188, -0.09941864013671875, -0.08978652954101562, -0.0801544189453125, -0.07052230834960938, -0.06089019775390625, -0.051258087158203125, -0.0416259765625, -0.031993865966796875, -0.02236175537109375, -0.012729644775390625, -0.0030975341796875, 0.006534576416015625, 0.01616668701171875, 0.025798797607421875, 0.035430908203125, 0.045063018798828125, 0.05469512939453125, 0.06432723999023438, 0.0739593505859375, 0.08359146118164062, 0.09322357177734375, 0.10285568237304688, 0.11248779296875, 0.12211990356445312, 0.13175201416015625, 0.14138412475585938, 0.1510162353515625, 0.16064834594726562, 0.17028045654296875, 0.17991256713867188, 0.189544677734375, 0.19917678833007812, 0.20880889892578125, 0.21844100952148438, 0.2280731201171875, 0.23770523071289062, 0.24733734130859375, 0.2569694519042969, 0.2666015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 15.0, 56.0, 285.0, 366.0, 167.0, 63.0, 20.0, 9.0, 10.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.080022811889648, -9.851767539978027, -9.623512268066406, -9.395256996154785, -9.167001724243164, -8.93874740600586, -8.710491180419922, -8.482236862182617, -8.253981590270996, -8.025726318359375, -7.797471046447754, -7.569215774536133, -7.34096097946167, -7.112705707550049, -6.884450435638428, -6.656195163726807, -6.4279398918151855, -6.1996846199035645, -5.971429347991943, -5.7431745529174805, -5.514919281005859, -5.286664009094238, -5.058408737182617, -4.830153465270996, -4.601898193359375, -4.373642921447754, -4.145387649536133, -3.917132616043091, -3.688877582550049, -3.4606223106384277, -3.2323670387268066, -3.0041117668151855, -2.775857448577881, -2.5476021766662598, -2.3193471431732178, -2.0910918712615967, -1.8628367185592651, -1.6345815658569336, -1.4063262939453125, -1.178071141242981, -0.9498159885406494, -0.7215608358383179, -0.49330562353134155, -0.26505041122436523, -0.03679525852203369, 0.19145989418029785, 0.41971516609191895, 0.6479703187942505, 0.876225471496582, 1.1044806241989136, 1.3327357769012451, 1.5609910488128662, 1.7892462015151978, 2.0175013542175293, 2.2457566261291504, 2.4740118980407715, 2.7022669315338135, 2.9305222034454346, 3.1587772369384766, 3.3870325088500977, 3.6152877807617188, 3.8435428142547607, 4.071798324584961, 4.300053119659424, 4.528308391571045]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 23.0, 25.0, 34.0, 42.0, 51.0, 48.0, 58.0, 53.0, 57.0, 68.0, 67.0, 66.0, 68.0, 42.0, 49.0, 31.0, 35.0, 38.0, 20.0, 15.0, 18.0, 17.0, 12.0, 7.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3112001419067383, -3.2188661098480225, -3.1265320777893066, -3.034198045730591, -2.941864013671875, -2.849529981613159, -2.7571959495544434, -2.6648621559143066, -2.5725278854370117, -2.480193853378296, -2.38785982131958, -2.2955257892608643, -2.2031917572021484, -2.1108577251434326, -2.018523693084717, -1.9261897802352905, -1.8338558673858643, -1.7415218353271484, -1.6491878032684326, -1.5568537712097168, -1.464519739151001, -1.3721857070922852, -1.2798517942428589, -1.187517762184143, -1.0951837301254272, -1.0028496980667114, -0.9105156660079956, -0.8181816935539246, -0.7258476614952087, -0.6335136294364929, -0.5411796569824219, -0.44884562492370605, -0.35651159286499023, -0.2641775608062744, -0.17184355854988098, -0.07950955629348755, 0.012824475765228271, 0.10515850782394409, 0.19749248027801514, 0.28982651233673096, 0.3821605443954468, 0.4744945764541626, 0.5668286085128784, 0.6591625809669495, 0.7514966130256653, 0.8438306450843811, 0.9361646175384521, 1.028498649597168, 1.1208326816558838, 1.2131667137145996, 1.3055007457733154, 1.3978347778320312, 1.490168809890747, 1.582502841949463, 1.6748367547988892, 1.767170786857605, 1.8595048189163208, 1.9518388509750366, 2.044172763824463, 2.1365067958831787, 2.2288408279418945, 2.3211748600006104, 2.413508892059326, 2.505842924118042, 2.598176956176758]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 9.0, 16.0, 10.0, 8.0, 12.0, 15.0, 28.0, 32.0, 13.0, 41.0, 50.0, 43.0, 62.0, 85.0, 176.0, 299.0, 772.0, 3283.0, 34103.0, 4096432.0, 52742.0, 4391.0, 973.0, 308.0, 166.0, 65.0, 41.0, 27.0, 16.0, 13.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.177734375, -3.095306396484375, -3.01287841796875, -2.930450439453125, -2.8480224609375, -2.765594482421875, -2.68316650390625, -2.600738525390625, -2.518310546875, -2.435882568359375, -2.35345458984375, -2.271026611328125, -2.1885986328125, -2.106170654296875, -2.02374267578125, -1.941314697265625, -1.85888671875, -1.776458740234375, -1.69403076171875, -1.611602783203125, -1.5291748046875, -1.446746826171875, -1.36431884765625, -1.281890869140625, -1.199462890625, -1.117034912109375, -1.03460693359375, -0.952178955078125, -0.8697509765625, -0.787322998046875, -0.70489501953125, -0.622467041015625, -0.5400390625, -0.457611083984375, -0.37518310546875, -0.292755126953125, -0.2103271484375, -0.127899169921875, -0.04547119140625, 0.036956787109375, 0.119384765625, 0.201812744140625, 0.28424072265625, 0.366668701171875, 0.4490966796875, 0.531524658203125, 0.61395263671875, 0.696380615234375, 0.77880859375, 0.861236572265625, 0.94366455078125, 1.026092529296875, 1.1085205078125, 1.190948486328125, 1.27337646484375, 1.355804443359375, 1.438232421875, 1.520660400390625, 1.60308837890625, 1.685516357421875, 1.7679443359375, 1.850372314453125, 1.93280029296875, 2.015228271484375, 2.09765625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 9.0, 12.0, 33.0, 61.0, 89.0, 132.0, 175.0, 199.0, 125.0, 77.0, 46.0, 26.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.266357421875, -0.26067066192626953, -0.25498390197753906, -0.2492971420288086, -0.24361038208007812, -0.23792362213134766, -0.2322368621826172, -0.22655010223388672, -0.22086334228515625, -0.21517658233642578, -0.2094898223876953, -0.20380306243896484, -0.19811630249023438, -0.1924295425415039, -0.18674278259277344, -0.18105602264404297, -0.1753692626953125, -0.16968250274658203, -0.16399574279785156, -0.1583089828491211, -0.15262222290039062, -0.14693546295166016, -0.1412487030029297, -0.13556194305419922, -0.12987518310546875, -0.12418842315673828, -0.11850166320800781, -0.11281490325927734, -0.10712814331054688, -0.1014413833618164, -0.09575462341308594, -0.09006786346435547, -0.084381103515625, -0.07869434356689453, -0.07300758361816406, -0.0673208236694336, -0.061634063720703125, -0.055947303771972656, -0.05026054382324219, -0.04457378387451172, -0.03888702392578125, -0.03320026397705078, -0.027513504028320312, -0.021826744079589844, -0.016139984130859375, -0.010453224182128906, -0.0047664642333984375, 0.0009202957153320312, 0.0066070556640625, 0.012293815612792969, 0.017980575561523438, 0.023667335510253906, 0.029354095458984375, 0.035040855407714844, 0.04072761535644531, 0.04641437530517578, 0.05210113525390625, 0.05778789520263672, 0.06347465515136719, 0.06916141510009766, 0.07484817504882812, 0.0805349349975586, 0.08622169494628906, 0.09190845489501953, 0.09759521484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 10.0, 7.0, 7.0, 13.0, 8.0, 18.0, 13.0, 11.0, 27.0, 24.0, 34.0, 29.0, 31.0, 37.0, 56.0, 79.0, 109.0, 198.0, 299.0, 927.0, 10919.0, 4112000.0, 66101.0, 2218.0, 468.0, 190.0, 113.0, 74.0, 46.0, 30.0, 28.0, 20.0, 21.0, 19.0, 16.0, 10.0, 12.0, 9.0, 9.0, 9.0, 4.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.375, -4.2451171875, -4.115234375, -3.9853515625, -3.85546875, -3.7255859375, -3.595703125, -3.4658203125, -3.3359375, -3.2060546875, -3.076171875, -2.9462890625, -2.81640625, -2.6865234375, -2.556640625, -2.4267578125, -2.296875, -2.1669921875, -2.037109375, -1.9072265625, -1.77734375, -1.6474609375, -1.517578125, -1.3876953125, -1.2578125, -1.1279296875, -0.998046875, -0.8681640625, -0.73828125, -0.6083984375, -0.478515625, -0.3486328125, -0.21875, -0.0888671875, 0.041015625, 0.1708984375, 0.30078125, 0.4306640625, 0.560546875, 0.6904296875, 0.8203125, 0.9501953125, 1.080078125, 1.2099609375, 1.33984375, 1.4697265625, 1.599609375, 1.7294921875, 1.859375, 1.9892578125, 2.119140625, 2.2490234375, 2.37890625, 2.5087890625, 2.638671875, 2.7685546875, 2.8984375, 3.0283203125, 3.158203125, 3.2880859375, 3.41796875, 3.5478515625, 3.677734375, 3.8076171875, 3.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 24.0, 94.0, 595.0, 2933.0, 298.0, 85.0, 27.0, 11.0, 7.0, 6.0, 1.0, 2.0], "bins": [-1.3115234375, -1.2878150939941406, -1.2641067504882812, -1.2403984069824219, -1.2166900634765625, -1.1929817199707031, -1.1692733764648438, -1.1455650329589844, -1.121856689453125, -1.0981483459472656, -1.0744400024414062, -1.0507316589355469, -1.0270233154296875, -1.0033149719238281, -0.9796066284179688, -0.9558982849121094, -0.93218994140625, -0.9084815979003906, -0.8847732543945312, -0.8610649108886719, -0.8373565673828125, -0.8136482238769531, -0.7899398803710938, -0.7662315368652344, -0.742523193359375, -0.7188148498535156, -0.6951065063476562, -0.6713981628417969, -0.6476898193359375, -0.6239814758300781, -0.6002731323242188, -0.5765647888183594, -0.5528564453125, -0.5291481018066406, -0.5054397583007812, -0.4817314147949219, -0.4580230712890625, -0.4343147277832031, -0.41060638427734375, -0.3868980407714844, -0.363189697265625, -0.3394813537597656, -0.31577301025390625, -0.2920646667480469, -0.2683563232421875, -0.24464797973632812, -0.22093963623046875, -0.19723129272460938, -0.17352294921875, -0.14981460571289062, -0.12610626220703125, -0.10239791870117188, -0.0786895751953125, -0.054981231689453125, -0.03127288818359375, -0.007564544677734375, 0.016143798828125, 0.039852142333984375, 0.06356048583984375, 0.08726882934570312, 0.1109771728515625, 0.13468551635742188, 0.15839385986328125, 0.18210220336914062, 0.205810546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 41.0, 788.0, 162.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.56743049621582, -9.027774810791016, -8.488119125366211, -7.94846248626709, -7.408806800842285, -6.8691511154174805, -6.329494953155518, -5.789838790893555, -5.25018310546875, -4.710527420043945, -4.170871257781982, -3.6312153339385986, -3.091559410095215, -2.551903486251831, -2.0122475624084473, -1.4725916385650635, -0.9329357147216797, -0.3932797908782959, 0.1463761329650879, 0.6860320568084717, 1.2256879806518555, 1.7653439044952393, 2.304999828338623, 2.844655752182007, 3.3843116760253906, 3.9239675998687744, 4.463623523712158, 5.003279685974121, 5.542935371398926, 6.0825910568237305, 6.622247219085693, 7.161903381347656, 7.701560974121094, 8.241216659545898, 8.780872344970703, 9.320528984069824, 9.860184669494629, 10.399840354919434, 10.939496994018555, 11.47915267944336, 12.018808364868164, 12.558464050292969, 13.098119735717773, 13.637776374816895, 14.1774320602417, 14.717087745666504, 15.256744384765625, 15.79640007019043, 16.336055755615234, 16.87571144104004, 17.415367126464844, 17.95502281188965, 18.494678497314453, 19.03433609008789, 19.573991775512695, 20.1136474609375, 20.653303146362305, 21.19295883178711, 21.732614517211914, 22.27227020263672, 22.811927795410156, 23.35158348083496, 23.891239166259766, 24.43089485168457, 24.970550537109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 11.0, 25.0, 30.0, 48.0, 85.0, 121.0, 119.0, 130.0, 105.0, 113.0, 80.0, 54.0, 37.0, 21.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875815391540527, -3.0876879692077637, -2.9877943992614746, -2.8879008293151855, -2.7880072593688965, -2.6881136894226074, -2.5882201194763184, -2.4883265495300293, -2.3884329795837402, -2.288539409637451, -2.188645839691162, -2.088752269744873, -1.988858699798584, -1.888965129852295, -1.7890715599060059, -1.6891779899597168, -1.5892845392227173, -1.4893909692764282, -1.3894973993301392, -1.28960382938385, -1.189710259437561, -1.089816689491272, -0.9899231791496277, -0.8900296092033386, -0.7901360392570496, -0.6902424693107605, -0.5903488993644714, -0.49045535922050476, -0.3905617892742157, -0.29066821932792664, -0.19077467918395996, -0.0908811092376709, 0.009012460708618164, 0.10890602320432663, 0.2087995857000351, 0.30869314074516296, 0.408586710691452, 0.5084803104400635, 0.6083738207817078, 0.7082673907279968, 0.8081609606742859, 0.908054530620575, 1.0079480409622192, 1.1078416109085083, 1.2077351808547974, 1.3076287508010864, 1.4075223207473755, 1.5074158906936646, 1.6073094606399536, 1.7072030305862427, 1.8070966005325317, 1.9069901704788208, 2.0068836212158203, 2.1067771911621094, 2.2066707611083984, 2.3065643310546875, 2.4064579010009766, 2.5063514709472656, 2.6062450408935547, 2.7061386108398438, 2.806032180786133, 2.905925750732422, 3.005819320678711, 3.105712890625, 3.205606460571289]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 14.0, 22.0, 19.0, 25.0, 33.0, 51.0, 50.0, 99.0, 310.0, 1166.0, 8578.0, 355019.0, 668276.0, 12803.0, 1397.0, 333.0, 121.0, 60.0, 45.0, 40.0, 16.0, 18.0, 18.0, 5.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.937225341796875, -2.85101318359375, -2.764801025390625, -2.6785888671875, -2.592376708984375, -2.50616455078125, -2.419952392578125, -2.333740234375, -2.247528076171875, -2.16131591796875, -2.075103759765625, -1.9888916015625, -1.902679443359375, -1.81646728515625, -1.730255126953125, -1.64404296875, -1.557830810546875, -1.47161865234375, -1.385406494140625, -1.2991943359375, -1.212982177734375, -1.12677001953125, -1.040557861328125, -0.954345703125, -0.868133544921875, -0.78192138671875, -0.695709228515625, -0.6094970703125, -0.523284912109375, -0.43707275390625, -0.350860595703125, -0.2646484375, -0.178436279296875, -0.09222412109375, -0.006011962890625, 0.0802001953125, 0.166412353515625, 0.25262451171875, 0.338836669921875, 0.425048828125, 0.511260986328125, 0.59747314453125, 0.683685302734375, 0.7698974609375, 0.856109619140625, 0.94232177734375, 1.028533935546875, 1.11474609375, 1.200958251953125, 1.28717041015625, 1.373382568359375, 1.4595947265625, 1.545806884765625, 1.63201904296875, 1.718231201171875, 1.804443359375, 1.890655517578125, 1.97686767578125, 2.063079833984375, 2.1492919921875, 2.235504150390625, 2.32171630859375, 2.407928466796875, 2.494140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 11.0, 19.0, 37.0, 77.0, 123.0, 160.0, 195.0, 155.0, 84.0, 69.0, 38.0, 16.0, 15.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3994140625, -0.39132118225097656, -0.3832283020019531, -0.3751354217529297, -0.36704254150390625, -0.3589496612548828, -0.3508567810058594, -0.34276390075683594, -0.3346710205078125, -0.32657814025878906, -0.3184852600097656, -0.3103923797607422, -0.30229949951171875, -0.2942066192626953, -0.2861137390136719, -0.27802085876464844, -0.269927978515625, -0.26183509826660156, -0.2537422180175781, -0.2456493377685547, -0.23755645751953125, -0.2294635772705078, -0.22137069702148438, -0.21327781677246094, -0.2051849365234375, -0.19709205627441406, -0.18899917602539062, -0.1809062957763672, -0.17281341552734375, -0.1647205352783203, -0.15662765502929688, -0.14853477478027344, -0.14044189453125, -0.13234901428222656, -0.12425613403320312, -0.11616325378417969, -0.10807037353515625, -0.09997749328613281, -0.09188461303710938, -0.08379173278808594, -0.0756988525390625, -0.06760597229003906, -0.059513092041015625, -0.05142021179199219, -0.04332733154296875, -0.03523445129394531, -0.027141571044921875, -0.019048690795898438, -0.010955810546875, -0.0028629302978515625, 0.005229949951171875, 0.013322830200195312, 0.02141571044921875, 0.029508590698242188, 0.037601470947265625, 0.04569435119628906, 0.0537872314453125, 0.06188011169433594, 0.06997299194335938, 0.07806587219238281, 0.08615875244140625, 0.09425163269042969, 0.10234451293945312, 0.11043739318847656, 0.1185302734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 10.0, 10.0, 12.0, 13.0, 30.0, 42.0, 42.0, 79.0, 89.0, 145.0, 195.0, 391.0, 677.0, 1262.0, 2447.0, 5535.0, 14266.0, 41198.0, 142844.0, 465026.0, 266369.0, 70055.0, 22394.0, 8285.0, 3408.0, 1501.0, 847.0, 481.0, 255.0, 193.0, 133.0, 84.0, 76.0, 47.0, 30.0, 23.0, 16.0, 11.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6298828125, -0.6106338500976562, -0.5913848876953125, -0.5721359252929688, -0.552886962890625, -0.5336380004882812, -0.5143890380859375, -0.49514007568359375, -0.47589111328125, -0.45664215087890625, -0.4373931884765625, -0.41814422607421875, -0.398895263671875, -0.37964630126953125, -0.3603973388671875, -0.34114837646484375, -0.3218994140625, -0.30265045166015625, -0.2834014892578125, -0.26415252685546875, -0.244903564453125, -0.22565460205078125, -0.2064056396484375, -0.18715667724609375, -0.16790771484375, -0.14865875244140625, -0.1294097900390625, -0.11016082763671875, -0.090911865234375, -0.07166290283203125, -0.0524139404296875, -0.03316497802734375, -0.013916015625, 0.00533294677734375, 0.0245819091796875, 0.04383087158203125, 0.063079833984375, 0.08232879638671875, 0.1015777587890625, 0.12082672119140625, 0.14007568359375, 0.15932464599609375, 0.1785736083984375, 0.19782257080078125, 0.217071533203125, 0.23632049560546875, 0.2555694580078125, 0.27481842041015625, 0.2940673828125, 0.31331634521484375, 0.3325653076171875, 0.35181427001953125, 0.371063232421875, 0.39031219482421875, 0.4095611572265625, 0.42881011962890625, 0.44805908203125, 0.46730804443359375, 0.4865570068359375, 0.5058059692382812, 0.525054931640625, 0.5443038940429688, 0.5635528564453125, 0.5828018188476562, 0.60205078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 7.0, 2.0, 8.0, 5.0, 8.0, 16.0, 13.0, 11.0, 24.0, 23.0, 42.0, 19.0, 35.0, 36.0, 40.0, 55.0, 50.0, 47.0, 51.0, 54.0, 44.0, 48.0, 34.0, 41.0, 42.0, 30.0, 39.0, 26.0, 28.0, 24.0, 23.0, 16.0, 13.0, 15.0, 5.0, 11.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.4886436462402344, -0.47435760498046875, -0.4600715637207031, -0.4457855224609375, -0.4314994812011719, -0.41721343994140625, -0.4029273986816406, -0.388641357421875, -0.3743553161621094, -0.36006927490234375, -0.3457832336425781, -0.3314971923828125, -0.3172111511230469, -0.30292510986328125, -0.2886390686035156, -0.27435302734375, -0.2600669860839844, -0.24578094482421875, -0.23149490356445312, -0.2172088623046875, -0.20292282104492188, -0.18863677978515625, -0.17435073852539062, -0.160064697265625, -0.14577865600585938, -0.13149261474609375, -0.11720657348632812, -0.1029205322265625, -0.08863449096679688, -0.07434844970703125, -0.060062408447265625, -0.0457763671875, -0.031490325927734375, -0.01720428466796875, -0.002918243408203125, 0.0113677978515625, 0.025653839111328125, 0.03993988037109375, 0.054225921630859375, 0.068511962890625, 0.08279800415039062, 0.09708404541015625, 0.11137008666992188, 0.1256561279296875, 0.13994216918945312, 0.15422821044921875, 0.16851425170898438, 0.18280029296875, 0.19708633422851562, 0.21137237548828125, 0.22565841674804688, 0.2399444580078125, 0.2542304992675781, 0.26851654052734375, 0.2828025817871094, 0.297088623046875, 0.3113746643066406, 0.32566070556640625, 0.3399467468261719, 0.3542327880859375, 0.3685188293457031, 0.38280487060546875, 0.3970909118652344, 0.411376953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 13.0, 8.0, 11.0, 24.0, 32.0, 60.0, 79.0, 143.0, 278.0, 577.0, 1268.0, 3097.0, 9703.0, 61933.0, 879486.0, 75487.0, 10412.0, 3312.0, 1305.0, 608.0, 284.0, 156.0, 85.0, 62.0, 24.0, 23.0, 20.0, 20.0, 11.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0458984375, -1.0104827880859375, -0.975067138671875, -0.9396514892578125, -0.90423583984375, -0.8688201904296875, -0.833404541015625, -0.7979888916015625, -0.7625732421875, -0.7271575927734375, -0.691741943359375, -0.6563262939453125, -0.62091064453125, -0.5854949951171875, -0.550079345703125, -0.5146636962890625, -0.479248046875, -0.4438323974609375, -0.408416748046875, -0.3730010986328125, -0.33758544921875, -0.3021697998046875, -0.266754150390625, -0.2313385009765625, -0.1959228515625, -0.1605072021484375, -0.125091552734375, -0.0896759033203125, -0.05426025390625, -0.0188446044921875, 0.016571044921875, 0.0519866943359375, 0.08740234375, 0.1228179931640625, 0.158233642578125, 0.1936492919921875, 0.22906494140625, 0.2644805908203125, 0.299896240234375, 0.3353118896484375, 0.3707275390625, 0.4061431884765625, 0.441558837890625, 0.4769744873046875, 0.51239013671875, 0.5478057861328125, 0.583221435546875, 0.6186370849609375, 0.654052734375, 0.6894683837890625, 0.724884033203125, 0.7602996826171875, 0.79571533203125, 0.8311309814453125, 0.866546630859375, 0.9019622802734375, 0.9373779296875, 0.9727935791015625, 1.008209228515625, 1.0436248779296875, 1.07904052734375, 1.1144561767578125, 1.149871826171875, 1.1852874755859375, 1.220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 18.0, 35.0, 45.0, 112.0, 208.0, 221.0, 160.0, 82.0, 49.0, 17.0, 12.0, 13.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020051002502441406, -0.00019514933228492737, -0.00018978863954544067, -0.00018442794680595398, -0.00017906725406646729, -0.0001737065613269806, -0.0001683458685874939, -0.0001629851758480072, -0.0001576244831085205, -0.0001522637903690338, -0.00014690309762954712, -0.00014154240489006042, -0.00013618171215057373, -0.00013082101941108704, -0.00012546032667160034, -0.00012009963393211365, -0.00011473894119262695, -0.00010937824845314026, -0.00010401755571365356, -9.865686297416687e-05, -9.329617023468018e-05, -8.793547749519348e-05, -8.257478475570679e-05, -7.721409201622009e-05, -7.18533992767334e-05, -6.64927065372467e-05, -6.113201379776001e-05, -5.5771321058273315e-05, -5.041062831878662e-05, -4.504993557929993e-05, -3.968924283981323e-05, -3.432855010032654e-05, -2.8967857360839844e-05, -2.360716462135315e-05, -1.8246471881866455e-05, -1.288577914237976e-05, -7.525086402893066e-06, -2.164393663406372e-06, 3.1962990760803223e-06, 8.556991815567017e-06, 1.3917684555053711e-05, 1.9278377294540405e-05, 2.46390700340271e-05, 2.9999762773513794e-05, 3.536045551300049e-05, 4.072114825248718e-05, 4.608184099197388e-05, 5.144253373146057e-05, 5.6803226470947266e-05, 6.216391921043396e-05, 6.752461194992065e-05, 7.288530468940735e-05, 7.824599742889404e-05, 8.360669016838074e-05, 8.896738290786743e-05, 9.432807564735413e-05, 9.968876838684082e-05, 0.00010504946112632751, 0.00011041015386581421, 0.0001157708466053009, 0.0001211315393447876, 0.0001264922320842743, 0.00013185292482376099, 0.00013721361756324768, 0.00014257431030273438]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 21.0, 33.0, 38.0, 57.0, 90.0, 168.0, 218.0, 493.0, 843.0, 1708.0, 3633.0, 9871.0, 39291.0, 461478.0, 473434.0, 39772.0, 9754.0, 3737.0, 1754.0, 913.0, 490.0, 267.0, 163.0, 102.0, 57.0, 39.0, 30.0, 18.0, 16.0, 10.0, 8.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.974609375, -0.948272705078125, -0.92193603515625, -0.895599365234375, -0.8692626953125, -0.842926025390625, -0.81658935546875, -0.790252685546875, -0.763916015625, -0.737579345703125, -0.71124267578125, -0.684906005859375, -0.6585693359375, -0.632232666015625, -0.60589599609375, -0.579559326171875, -0.55322265625, -0.526885986328125, -0.50054931640625, -0.474212646484375, -0.4478759765625, -0.421539306640625, -0.39520263671875, -0.368865966796875, -0.342529296875, -0.316192626953125, -0.28985595703125, -0.263519287109375, -0.2371826171875, -0.210845947265625, -0.18450927734375, -0.158172607421875, -0.1318359375, -0.105499267578125, -0.07916259765625, -0.052825927734375, -0.0264892578125, -0.000152587890625, 0.02618408203125, 0.052520751953125, 0.078857421875, 0.105194091796875, 0.13153076171875, 0.157867431640625, 0.1842041015625, 0.210540771484375, 0.23687744140625, 0.263214111328125, 0.28955078125, 0.315887451171875, 0.34222412109375, 0.368560791015625, 0.3948974609375, 0.421234130859375, 0.44757080078125, 0.473907470703125, 0.500244140625, 0.526580810546875, 0.55291748046875, 0.579254150390625, 0.6055908203125, 0.631927490234375, 0.65826416015625, 0.684600830078125, 0.7109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 3.0, 5.0, 6.0, 10.0, 6.0, 17.0, 24.0, 39.0, 61.0, 52.0, 74.0, 84.0, 108.0, 103.0, 88.0, 73.0, 55.0, 54.0, 28.0, 29.0, 19.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.316162109375, -0.3053016662597656, -0.29444122314453125, -0.2835807800292969, -0.2727203369140625, -0.2618598937988281, -0.25099945068359375, -0.24013900756835938, -0.229278564453125, -0.21841812133789062, -0.20755767822265625, -0.19669723510742188, -0.1858367919921875, -0.17497634887695312, -0.16411590576171875, -0.15325546264648438, -0.14239501953125, -0.13153457641601562, -0.12067413330078125, -0.10981369018554688, -0.0989532470703125, -0.08809280395507812, -0.07723236083984375, -0.06637191772460938, -0.055511474609375, -0.044651031494140625, -0.03379058837890625, -0.022930145263671875, -0.0120697021484375, -0.001209259033203125, 0.00965118408203125, 0.020511627197265625, 0.0313720703125, 0.042232513427734375, 0.05309295654296875, 0.06395339965820312, 0.0748138427734375, 0.08567428588867188, 0.09653472900390625, 0.10739517211914062, 0.118255615234375, 0.12911605834960938, 0.13997650146484375, 0.15083694458007812, 0.1616973876953125, 0.17255783081054688, 0.18341827392578125, 0.19427871704101562, 0.20513916015625, 0.21599960327148438, 0.22686004638671875, 0.23772048950195312, 0.2485809326171875, 0.2594413757324219, 0.27030181884765625, 0.2811622619628906, 0.292022705078125, 0.3028831481933594, 0.31374359130859375, 0.3246040344238281, 0.3354644775390625, 0.3463249206542969, 0.35718536376953125, 0.3680458068847656, 0.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 11.0, 7.0, 24.0, 37.0, 84.0, 191.0, 234.0, 177.0, 108.0, 52.0, 29.0, 14.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.231497764587402, -7.038308143615723, -6.845118045806885, -6.651928424835205, -6.458738803863525, -6.2655487060546875, -6.072359085083008, -5.879169464111328, -5.68597936630249, -5.4927897453308105, -5.299599647521973, -5.106410026550293, -4.913220405578613, -4.720030307769775, -4.526840686798096, -4.333650588989258, -4.140460968017578, -3.9472711086273193, -3.7540814876556396, -3.560891628265381, -3.367701768875122, -3.1745119094848633, -2.9813222885131836, -2.788132429122925, -2.594943046569824, -2.4017531871795654, -2.2085635662078857, -2.015373706817627, -1.8221838474273682, -1.628994107246399, -1.4358043670654297, -1.242614507675171, -1.049424648284912, -0.8562348484992981, -0.6630450487136841, -0.46985530853271484, -0.27666550874710083, -0.08347570896148682, 0.10971403121948242, 0.3029038906097412, 0.49609363079071045, 0.6892834305763245, 0.8824732303619385, 1.0756629705429077, 1.268852710723877, 1.4620425701141357, 1.655232310295105, 1.8484221696853638, 2.041611909866333, 2.234801769256592, 2.4279913902282715, 2.6211812496185303, 2.814371109008789, 3.0075607299804688, 3.2007505893707275, 3.3939404487609863, 3.587130069732666, 3.780319929122925, 3.9735095500946045, 4.166699409484863, 4.359889030456543, 4.553079128265381, 4.7462687492370605, 4.939458847045898, 5.132648468017578]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 13.0, 9.0, 10.0, 14.0, 20.0, 16.0, 39.0, 42.0, 30.0, 41.0, 49.0, 63.0, 50.0, 46.0, 56.0, 54.0, 42.0, 44.0, 41.0, 45.0, 44.0, 24.0, 36.0, 30.0, 27.0, 25.0, 13.0, 9.0, 9.0, 18.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.9997143745422363, -3.894901752471924, -3.7900888919830322, -3.6852762699127197, -3.5804636478424072, -3.4756507873535156, -3.370838165283203, -3.2660255432128906, -3.161212921142578, -3.0564002990722656, -2.951587438583374, -2.8467748165130615, -2.741962194442749, -2.6371493339538574, -2.532336711883545, -2.4275240898132324, -2.32271146774292, -2.2178988456726074, -2.113085985183716, -2.0082733631134033, -1.9034607410430908, -1.7986479997634888, -1.6938352584838867, -1.5890226364135742, -1.4842097759246826, -1.3793970346450806, -1.274584412574768, -1.169771671295166, -1.0649590492248535, -0.9601463079452515, -0.8553336262702942, -0.7505209445953369, -0.6457083225250244, -0.5408956408500671, -0.43608295917510986, -0.3312702476978302, -0.22645756602287292, -0.12164485454559326, -0.016832172870635986, 0.08798050880432129, 0.19279319047927856, 0.29760587215423584, 0.4024185538291931, 0.5072312355041504, 0.6120439767837524, 0.7168566584587097, 0.821669340133667, 0.9264820218086243, 1.0312947034835815, 1.1361074447631836, 1.240920066833496, 1.3457328081130981, 1.4505454301834106, 1.5553581714630127, 1.6601707935333252, 1.7649835348129272, 1.8697962760925293, 1.9746090173721313, 2.0794217586517334, 2.184234380722046, 2.2890470027923584, 2.39385986328125, 2.4986724853515625, 2.603485107421875, 2.7082977294921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 8.0, 2.0, 6.0, 7.0, 2.0, 6.0, 8.0, 9.0, 3.0, 6.0, 17.0, 9.0, 10.0, 11.0, 14.0, 26.0, 22.0, 28.0, 29.0, 46.0, 53.0, 86.0, 93.0, 141.0, 312.0, 524.0, 1119.0, 3005.0, 9602.0, 51533.0, 3799528.0, 295582.0, 23896.0, 5595.0, 1765.0, 648.0, 266.0, 141.0, 60.0, 31.0, 16.0, 9.0, 4.0, 3.0, 3.0], "bins": [-3.408203125, -3.3397369384765625, -3.271270751953125, -3.2028045654296875, -3.13433837890625, -3.0658721923828125, -2.997406005859375, -2.9289398193359375, -2.8604736328125, -2.7920074462890625, -2.723541259765625, -2.6550750732421875, -2.58660888671875, -2.5181427001953125, -2.449676513671875, -2.3812103271484375, -2.312744140625, -2.2442779541015625, -2.175811767578125, -2.1073455810546875, -2.03887939453125, -1.9704132080078125, -1.901947021484375, -1.8334808349609375, -1.7650146484375, -1.6965484619140625, -1.628082275390625, -1.5596160888671875, -1.49114990234375, -1.4226837158203125, -1.354217529296875, -1.2857513427734375, -1.21728515625, -1.1488189697265625, -1.080352783203125, -1.0118865966796875, -0.94342041015625, -0.8749542236328125, -0.806488037109375, -0.7380218505859375, -0.6695556640625, -0.6010894775390625, -0.532623291015625, -0.4641571044921875, -0.39569091796875, -0.3272247314453125, -0.258758544921875, -0.1902923583984375, -0.121826171875, -0.0533599853515625, 0.015106201171875, 0.0835723876953125, 0.15203857421875, 0.2205047607421875, 0.288970947265625, 0.3574371337890625, 0.4259033203125, 0.4943695068359375, 0.562835693359375, 0.6313018798828125, 0.69976806640625, 0.7682342529296875, 0.836700439453125, 0.9051666259765625, 0.9736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 22.0, 37.0, 57.0, 102.0, 127.0, 154.0, 125.0, 123.0, 104.0, 60.0, 36.0, 18.0, 12.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.391357421875, -0.3835258483886719, -0.37569427490234375, -0.3678627014160156, -0.3600311279296875, -0.3521995544433594, -0.34436798095703125, -0.3365364074707031, -0.328704833984375, -0.3208732604980469, -0.31304168701171875, -0.3052101135253906, -0.2973785400390625, -0.2895469665527344, -0.28171539306640625, -0.2738838195800781, -0.26605224609375, -0.2582206726074219, -0.25038909912109375, -0.24255752563476562, -0.2347259521484375, -0.22689437866210938, -0.21906280517578125, -0.21123123168945312, -0.203399658203125, -0.19556808471679688, -0.18773651123046875, -0.17990493774414062, -0.1720733642578125, -0.16424179077148438, -0.15641021728515625, -0.14857864379882812, -0.1407470703125, -0.13291549682617188, -0.12508392333984375, -0.11725234985351562, -0.1094207763671875, -0.10158920288085938, -0.09375762939453125, -0.08592605590820312, -0.078094482421875, -0.07026290893554688, -0.06243133544921875, -0.054599761962890625, -0.0467681884765625, -0.038936614990234375, -0.03110504150390625, -0.023273468017578125, -0.01544189453125, -0.007610321044921875, 0.00022125244140625, 0.008052825927734375, 0.0158843994140625, 0.023715972900390625, 0.03154754638671875, 0.039379119873046875, 0.047210693359375, 0.055042266845703125, 0.06287384033203125, 0.07070541381835938, 0.0785369873046875, 0.08636856079101562, 0.09420013427734375, 0.10203170776367188, 0.10986328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 13.0, 23.0, 25.0, 46.0, 54.0, 90.0, 133.0, 173.0, 243.0, 422.0, 752.0, 1589.0, 4762.0, 25408.0, 667425.0, 3442101.0, 41114.0, 6367.0, 1683.0, 725.0, 421.0, 215.0, 154.0, 94.0, 55.0, 56.0, 48.0, 22.0, 17.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7834625244140625, -1.712432861328125, -1.6414031982421875, -1.57037353515625, -1.4993438720703125, -1.428314208984375, -1.3572845458984375, -1.2862548828125, -1.2152252197265625, -1.144195556640625, -1.0731658935546875, -1.00213623046875, -0.9311065673828125, -0.860076904296875, -0.7890472412109375, -0.718017578125, -0.6469879150390625, -0.575958251953125, -0.5049285888671875, -0.43389892578125, -0.3628692626953125, -0.291839599609375, -0.2208099365234375, -0.1497802734375, -0.0787506103515625, -0.007720947265625, 0.0633087158203125, 0.13433837890625, 0.2053680419921875, 0.276397705078125, 0.3474273681640625, 0.41845703125, 0.4894866943359375, 0.560516357421875, 0.6315460205078125, 0.70257568359375, 0.7736053466796875, 0.844635009765625, 0.9156646728515625, 0.9866943359375, 1.0577239990234375, 1.128753662109375, 1.1997833251953125, 1.27081298828125, 1.3418426513671875, 1.412872314453125, 1.4839019775390625, 1.554931640625, 1.6259613037109375, 1.696990966796875, 1.7680206298828125, 1.83905029296875, 1.9100799560546875, 1.981109619140625, 2.0521392822265625, 2.1231689453125, 2.1941986083984375, 2.265228271484375, 2.3362579345703125, 2.40728759765625, 2.4783172607421875, 2.549346923828125, 2.6203765869140625, 2.69140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 14.0, 31.0, 48.0, 80.0, 157.0, 318.0, 1355.0, 1387.0, 341.0, 128.0, 61.0, 44.0, 36.0, 18.0, 15.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4935188293457031, -0.48117828369140625, -0.4688377380371094, -0.4564971923828125, -0.4441566467285156, -0.43181610107421875, -0.4194755554199219, -0.407135009765625, -0.3947944641113281, -0.38245391845703125, -0.3701133728027344, -0.3577728271484375, -0.3454322814941406, -0.33309173583984375, -0.3207511901855469, -0.30841064453125, -0.2960700988769531, -0.28372955322265625, -0.2713890075683594, -0.2590484619140625, -0.24670791625976562, -0.23436737060546875, -0.22202682495117188, -0.209686279296875, -0.19734573364257812, -0.18500518798828125, -0.17266464233398438, -0.1603240966796875, -0.14798355102539062, -0.13564300537109375, -0.12330245971679688, -0.1109619140625, -0.09862136840820312, -0.08628082275390625, -0.07394027709960938, -0.0615997314453125, -0.049259185791015625, -0.03691864013671875, -0.024578094482421875, -0.012237548828125, 0.000102996826171875, 0.01244354248046875, 0.024784088134765625, 0.0371246337890625, 0.049465179443359375, 0.06180572509765625, 0.07414627075195312, 0.08648681640625, 0.09882736206054688, 0.11116790771484375, 0.12350845336914062, 0.1358489990234375, 0.14818954467773438, 0.16053009033203125, 0.17287063598632812, 0.185211181640625, 0.19755172729492188, 0.20989227294921875, 0.22223281860351562, 0.2345733642578125, 0.24691390991210938, 0.25925445556640625, 0.2715950012207031, 0.283935546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 10.0, 12.0, 28.0, 66.0, 171.0, 290.0, 245.0, 101.0, 43.0, 17.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7197020053863525, -3.5946264266967773, -3.4695510864257812, -3.344475507736206, -3.219399929046631, -3.0943245887756348, -2.9692490100860596, -2.8441734313964844, -2.7190980911254883, -2.594022512435913, -2.468947172164917, -2.343871593475342, -2.2187960147857666, -2.0937204360961914, -1.9686450958251953, -1.8435695171356201, -1.718493938446045, -1.5934184789657593, -1.468342900276184, -1.3432674407958984, -1.2181918621063232, -1.0931164026260376, -0.968040943145752, -0.8429654240608215, -0.7178899049758911, -0.5928143858909607, -0.46773889660835266, -0.34266340732574463, -0.2175878882408142, -0.09251236915588379, 0.032563090324401855, 0.15763860940933228, 0.2827138900756836, 0.407789409160614, 0.5328649282455444, 0.6579403877258301, 0.7830159068107605, 0.9080914258956909, 1.0331668853759766, 1.1582424640655518, 1.2833179235458374, 1.408393383026123, 1.5334689617156982, 1.6585444211959839, 1.7836198806762695, 1.9086954593658447, 2.03377103805542, 2.158846378326416, 2.283921957015991, 2.4089975357055664, 2.5340728759765625, 2.6591484546661377, 2.784224033355713, 2.909299373626709, 3.034374952316284, 3.1594505310058594, 3.2845258712768555, 3.4096014499664307, 3.5346767902374268, 3.659752368927002, 3.784827947616577, 3.9099035263061523, 4.034978866577148, 4.1600542068481445, 4.285130023956299]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 11.0, 15.0, 23.0, 42.0, 58.0, 80.0, 89.0, 85.0, 88.0, 106.0, 88.0, 71.0, 64.0, 58.0, 43.0, 24.0, 22.0, 12.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2537894248962402, -2.189366102218628, -2.1249430179595947, -2.0605196952819824, -1.9960963726043701, -1.9316731691360474, -1.8672499656677246, -1.8028266429901123, -1.7384034395217896, -1.6739802360534668, -1.6095569133758545, -1.5451337099075317, -1.480710506439209, -1.4162871837615967, -1.351863980293274, -1.2874407768249512, -1.2230174541473389, -1.1585942506790161, -1.0941709280014038, -1.029747724533081, -0.9653244614601135, -0.900901198387146, -0.8364779949188232, -0.7720547318458557, -0.7076314687728882, -0.6432082056999207, -0.5787849426269531, -0.5143617391586304, -0.44993847608566284, -0.3855152130126953, -0.32109197974205017, -0.25666874647140503, -0.1922457218170166, -0.12782247364521027, -0.06339922547340393, 0.0010240226984024048, 0.06544727087020874, 0.12987053394317627, 0.1942937672138214, 0.25871700048446655, 0.3231402635574341, 0.3875635266304016, 0.45198675990104675, 0.5164099931716919, 0.5808332562446594, 0.645256519317627, 0.7096797227859497, 0.7741029858589172, 0.8385262489318848, 0.9029495120048523, 0.9673727750778198, 1.0317959785461426, 1.0962193012237549, 1.1606425046920776, 1.2250657081604004, 1.2894890308380127, 1.3539122343063354, 1.4183354377746582, 1.4827587604522705, 1.5471819639205933, 1.611605167388916, 1.6760284900665283, 1.740451693534851, 1.8048748970031738, 1.8692982196807861]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 5.0, 6.0, 15.0, 12.0, 30.0, 35.0, 42.0, 66.0, 102.0, 166.0, 350.0, 846.0, 2815.0, 14088.0, 167482.0, 783526.0, 67942.0, 7856.0, 1807.0, 610.0, 263.0, 154.0, 88.0, 47.0, 58.0, 29.0, 25.0, 23.0, 13.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6875, -1.6318817138671875, -1.576263427734375, -1.5206451416015625, -1.46502685546875, -1.4094085693359375, -1.353790283203125, -1.2981719970703125, -1.2425537109375, -1.1869354248046875, -1.131317138671875, -1.0756988525390625, -1.02008056640625, -0.9644622802734375, -0.908843994140625, -0.8532257080078125, -0.797607421875, -0.7419891357421875, -0.686370849609375, -0.6307525634765625, -0.57513427734375, -0.5195159912109375, -0.463897705078125, -0.4082794189453125, -0.3526611328125, -0.2970428466796875, -0.241424560546875, -0.1858062744140625, -0.13018798828125, -0.0745697021484375, -0.018951416015625, 0.0366668701171875, 0.09228515625, 0.1479034423828125, 0.203521728515625, 0.2591400146484375, 0.31475830078125, 0.3703765869140625, 0.425994873046875, 0.4816131591796875, 0.5372314453125, 0.5928497314453125, 0.648468017578125, 0.7040863037109375, 0.75970458984375, 0.8153228759765625, 0.870941162109375, 0.9265594482421875, 0.982177734375, 1.0377960205078125, 1.093414306640625, 1.1490325927734375, 1.20465087890625, 1.2602691650390625, 1.315887451171875, 1.3715057373046875, 1.4271240234375, 1.4827423095703125, 1.538360595703125, 1.5939788818359375, 1.64959716796875, 1.7052154541015625, 1.760833740234375, 1.8164520263671875, 1.8720703125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 21.0, 33.0, 58.0, 80.0, 109.0, 154.0, 133.0, 123.0, 114.0, 77.0, 45.0, 28.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.41300010681152344, -0.4038810729980469, -0.3947620391845703, -0.38564300537109375, -0.3765239715576172, -0.3674049377441406, -0.35828590393066406, -0.3491668701171875, -0.34004783630371094, -0.3309288024902344, -0.3218097686767578, -0.31269073486328125, -0.3035717010498047, -0.2944526672363281, -0.28533363342285156, -0.276214599609375, -0.26709556579589844, -0.2579765319824219, -0.2488574981689453, -0.23973846435546875, -0.2306194305419922, -0.22150039672851562, -0.21238136291503906, -0.2032623291015625, -0.19414329528808594, -0.18502426147460938, -0.1759052276611328, -0.16678619384765625, -0.1576671600341797, -0.14854812622070312, -0.13942909240722656, -0.13031005859375, -0.12119102478027344, -0.11207199096679688, -0.10295295715332031, -0.09383392333984375, -0.08471488952636719, -0.07559585571289062, -0.06647682189941406, -0.0573577880859375, -0.04823875427246094, -0.039119720458984375, -0.030000686645507812, -0.02088165283203125, -0.011762619018554688, -0.002643585205078125, 0.0064754486083984375, 0.015594482421875, 0.024713516235351562, 0.033832550048828125, 0.04295158386230469, 0.05207061767578125, 0.06118965148925781, 0.07030868530273438, 0.07942771911621094, 0.0885467529296875, 0.09766578674316406, 0.10678482055664062, 0.11590385437011719, 0.12502288818359375, 0.1341419219970703, 0.14326095581054688, 0.15237998962402344, 0.1614990234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 3.0, 14.0, 11.0, 31.0, 26.0, 33.0, 54.0, 93.0, 119.0, 223.0, 383.0, 687.0, 1306.0, 2809.0, 6630.0, 18638.0, 63160.0, 282790.0, 496197.0, 124273.0, 32291.0, 10512.0, 4152.0, 1897.0, 901.0, 502.0, 282.0, 174.0, 113.0, 69.0, 53.0, 36.0, 24.0, 17.0, 10.0, 15.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.736053466796875, -0.71087646484375, -0.685699462890625, -0.6605224609375, -0.635345458984375, -0.61016845703125, -0.584991455078125, -0.559814453125, -0.534637451171875, -0.50946044921875, -0.484283447265625, -0.4591064453125, -0.433929443359375, -0.40875244140625, -0.383575439453125, -0.3583984375, -0.333221435546875, -0.30804443359375, -0.282867431640625, -0.2576904296875, -0.232513427734375, -0.20733642578125, -0.182159423828125, -0.156982421875, -0.131805419921875, -0.10662841796875, -0.081451416015625, -0.0562744140625, -0.031097412109375, -0.00592041015625, 0.019256591796875, 0.04443359375, 0.069610595703125, 0.09478759765625, 0.119964599609375, 0.1451416015625, 0.170318603515625, 0.19549560546875, 0.220672607421875, 0.245849609375, 0.271026611328125, 0.29620361328125, 0.321380615234375, 0.3465576171875, 0.371734619140625, 0.39691162109375, 0.422088623046875, 0.447265625, 0.472442626953125, 0.49761962890625, 0.522796630859375, 0.5479736328125, 0.573150634765625, 0.59832763671875, 0.623504638671875, 0.648681640625, 0.673858642578125, 0.69903564453125, 0.724212646484375, 0.7493896484375, 0.774566650390625, 0.79974365234375, 0.824920654296875, 0.85009765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 4.0, 7.0, 11.0, 11.0, 13.0, 19.0, 20.0, 21.0, 23.0, 34.0, 49.0, 43.0, 40.0, 52.0, 44.0, 52.0, 36.0, 53.0, 42.0, 47.0, 39.0, 49.0, 34.0, 29.0, 32.0, 25.0, 27.0, 33.0, 17.0, 11.0, 20.0, 10.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5576171875, -0.5404129028320312, -0.5232086181640625, -0.5060043334960938, -0.488800048828125, -0.47159576416015625, -0.4543914794921875, -0.43718719482421875, -0.41998291015625, -0.40277862548828125, -0.3855743408203125, -0.36837005615234375, -0.351165771484375, -0.33396148681640625, -0.3167572021484375, -0.29955291748046875, -0.2823486328125, -0.26514434814453125, -0.2479400634765625, -0.23073577880859375, -0.213531494140625, -0.19632720947265625, -0.1791229248046875, -0.16191864013671875, -0.14471435546875, -0.12751007080078125, -0.1103057861328125, -0.09310150146484375, -0.075897216796875, -0.05869293212890625, -0.0414886474609375, -0.02428436279296875, -0.007080078125, 0.01012420654296875, 0.0273284912109375, 0.04453277587890625, 0.061737060546875, 0.07894134521484375, 0.0961456298828125, 0.11334991455078125, 0.13055419921875, 0.14775848388671875, 0.1649627685546875, 0.18216705322265625, 0.199371337890625, 0.21657562255859375, 0.2337799072265625, 0.25098419189453125, 0.2681884765625, 0.28539276123046875, 0.3025970458984375, 0.31980133056640625, 0.337005615234375, 0.35420989990234375, 0.3714141845703125, 0.38861846923828125, 0.40582275390625, 0.42302703857421875, 0.4402313232421875, 0.45743560791015625, 0.474639892578125, 0.49184417724609375, 0.5090484619140625, 0.5262527465820312, 0.54345703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 15.0, 15.0, 20.0, 51.0, 84.0, 140.0, 262.0, 485.0, 1007.0, 2429.0, 8195.0, 67860.0, 872101.0, 81818.0, 9387.0, 2614.0, 996.0, 458.0, 215.0, 135.0, 77.0, 50.0, 32.0, 20.0, 23.0, 14.0, 8.0, 5.0, 10.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.95849609375, -0.9271011352539062, -0.8957061767578125, -0.8643112182617188, -0.832916259765625, -0.8015213012695312, -0.7701263427734375, -0.7387313842773438, -0.70733642578125, -0.6759414672851562, -0.6445465087890625, -0.6131515502929688, -0.581756591796875, -0.5503616333007812, -0.5189666748046875, -0.48757171630859375, -0.4561767578125, -0.42478179931640625, -0.3933868408203125, -0.36199188232421875, -0.330596923828125, -0.29920196533203125, -0.2678070068359375, -0.23641204833984375, -0.20501708984375, -0.17362213134765625, -0.1422271728515625, -0.11083221435546875, -0.079437255859375, -0.04804229736328125, -0.0166473388671875, 0.01474761962890625, 0.046142578125, 0.07753753662109375, 0.1089324951171875, 0.14032745361328125, 0.171722412109375, 0.20311737060546875, 0.2345123291015625, 0.26590728759765625, 0.29730224609375, 0.32869720458984375, 0.3600921630859375, 0.39148712158203125, 0.422882080078125, 0.45427703857421875, 0.4856719970703125, 0.5170669555664062, 0.5484619140625, 0.5798568725585938, 0.6112518310546875, 0.6426467895507812, 0.674041748046875, 0.7054367065429688, 0.7368316650390625, 0.7682266235351562, 0.79962158203125, 0.8310165405273438, 0.8624114990234375, 0.8938064575195312, 0.925201416015625, 0.9565963745117188, 0.9879913330078125, 1.0193862915039062, 1.05078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 6.0, 9.0, 11.0, 16.0, 15.0, 27.0, 38.0, 76.0, 125.0, 201.0, 186.0, 111.0, 73.0, 32.0, 21.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016689300537109375, -0.00016224384307861328, -0.0001575946807861328, -0.00015294551849365234, -0.00014829635620117188, -0.0001436471939086914, -0.00013899803161621094, -0.00013434886932373047, -0.00012969970703125, -0.00012505054473876953, -0.00012040138244628906, -0.0001157522201538086, -0.00011110305786132812, -0.00010645389556884766, -0.00010180473327636719, -9.715557098388672e-05, -9.250640869140625e-05, -8.785724639892578e-05, -8.320808410644531e-05, -7.855892181396484e-05, -7.390975952148438e-05, -6.92605972290039e-05, -6.461143493652344e-05, -5.996227264404297e-05, -5.53131103515625e-05, -5.066394805908203e-05, -4.601478576660156e-05, -4.1365623474121094e-05, -3.6716461181640625e-05, -3.2067298889160156e-05, -2.7418136596679688e-05, -2.276897430419922e-05, -1.811981201171875e-05, -1.3470649719238281e-05, -8.821487426757812e-06, -4.172325134277344e-06, 4.76837158203125e-07, 5.125999450683594e-06, 9.775161743164062e-06, 1.4424324035644531e-05, 1.9073486328125e-05, 2.372264862060547e-05, 2.8371810913085938e-05, 3.3020973205566406e-05, 3.7670135498046875e-05, 4.2319297790527344e-05, 4.696846008300781e-05, 5.161762237548828e-05, 5.626678466796875e-05, 6.091594696044922e-05, 6.556510925292969e-05, 7.021427154541016e-05, 7.486343383789062e-05, 7.95125961303711e-05, 8.416175842285156e-05, 8.881092071533203e-05, 9.34600830078125e-05, 9.810924530029297e-05, 0.00010275840759277344, 0.0001074075698852539, 0.00011205673217773438, 0.00011670589447021484, 0.00012135505676269531, 0.00012600421905517578, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 26.0, 30.0, 48.0, 61.0, 117.0, 196.0, 297.0, 638.0, 1168.0, 2605.0, 7464.0, 57696.0, 904222.0, 61162.0, 7619.0, 2639.0, 1193.0, 542.0, 322.0, 172.0, 108.0, 62.0, 45.0, 24.0, 14.0, 20.0, 6.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2158203125, -1.1731719970703125, -1.130523681640625, -1.0878753662109375, -1.04522705078125, -1.0025787353515625, -0.959930419921875, -0.9172821044921875, -0.8746337890625, -0.8319854736328125, -0.789337158203125, -0.7466888427734375, -0.70404052734375, -0.6613922119140625, -0.618743896484375, -0.5760955810546875, -0.533447265625, -0.4907989501953125, -0.448150634765625, -0.4055023193359375, -0.36285400390625, -0.3202056884765625, -0.277557373046875, -0.2349090576171875, -0.1922607421875, -0.1496124267578125, -0.106964111328125, -0.0643157958984375, -0.02166748046875, 0.0209808349609375, 0.063629150390625, 0.1062774658203125, 0.14892578125, 0.1915740966796875, 0.234222412109375, 0.2768707275390625, 0.31951904296875, 0.3621673583984375, 0.404815673828125, 0.4474639892578125, 0.4901123046875, 0.5327606201171875, 0.575408935546875, 0.6180572509765625, 0.66070556640625, 0.7033538818359375, 0.746002197265625, 0.7886505126953125, 0.831298828125, 0.8739471435546875, 0.916595458984375, 0.9592437744140625, 1.00189208984375, 1.0445404052734375, 1.087188720703125, 1.1298370361328125, 1.1724853515625, 1.2151336669921875, 1.257781982421875, 1.3004302978515625, 1.34307861328125, 1.3857269287109375, 1.428375244140625, 1.4710235595703125, 1.513671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 20.0, 27.0, 53.0, 92.0, 176.0, 194.0, 153.0, 95.0, 66.0, 40.0, 18.0, 14.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.740234375, -0.7210884094238281, -0.7019424438476562, -0.6827964782714844, -0.6636505126953125, -0.6445045471191406, -0.6253585815429688, -0.6062126159667969, -0.587066650390625, -0.5679206848144531, -0.5487747192382812, -0.5296287536621094, -0.5104827880859375, -0.4913368225097656, -0.47219085693359375, -0.4530448913574219, -0.43389892578125, -0.4147529602050781, -0.39560699462890625, -0.3764610290527344, -0.3573150634765625, -0.3381690979003906, -0.31902313232421875, -0.2998771667480469, -0.280731201171875, -0.2615852355957031, -0.24243927001953125, -0.22329330444335938, -0.2041473388671875, -0.18500137329101562, -0.16585540771484375, -0.14670944213867188, -0.1275634765625, -0.10841751098632812, -0.08927154541015625, -0.07012557983398438, -0.0509796142578125, -0.031833648681640625, -0.01268768310546875, 0.006458282470703125, 0.025604248046875, 0.044750213623046875, 0.06389617919921875, 0.08304214477539062, 0.1021881103515625, 0.12133407592773438, 0.14048004150390625, 0.15962600708007812, 0.17877197265625, 0.19791793823242188, 0.21706390380859375, 0.23620986938476562, 0.2553558349609375, 0.2745018005371094, 0.29364776611328125, 0.3127937316894531, 0.331939697265625, 0.3510856628417969, 0.37023162841796875, 0.3893775939941406, 0.4085235595703125, 0.4276695251464844, 0.44681549072265625, 0.4659614562988281, 0.485107421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 9.0, 44.0, 119.0, 286.0, 321.0, 129.0, 48.0, 17.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.310275554656982, -4.956239700317383, -4.602204322814941, -4.2481689453125, -3.8941330909729004, -3.54009747505188, -3.1860618591308594, -2.832026243209839, -2.4779906272888184, -2.123955011367798, -1.7699193954467773, -1.4158837795257568, -1.0618481636047363, -0.7078125476837158, -0.3537769317626953, 0.0002586841583251953, 0.3542943000793457, 0.7083299160003662, 1.0623655319213867, 1.4164011478424072, 1.7704367637634277, 2.1244723796844482, 2.4785079956054688, 2.8325436115264893, 3.1865792274475098, 3.5406148433685303, 3.894650459289551, 4.248685836791992, 4.602721691131592, 4.956757545471191, 5.310792922973633, 5.664828300476074, 6.018863677978516, 6.372899055480957, 6.726934909820557, 7.080970764160156, 7.435006141662598, 7.789041519165039, 8.143077850341797, 8.497113227844238, 8.85114860534668, 9.205183982849121, 9.559219360351562, 9.91325569152832, 10.267291069030762, 10.621326446533203, 10.975362777709961, 11.329398155212402, 11.683433532714844, 12.037468910217285, 12.391504287719727, 12.745540618896484, 13.099575996398926, 13.453611373901367, 13.807647705078125, 14.161683082580566, 14.515718460083008, 14.86975383758545, 15.22378921508789, 15.577825546264648, 15.93186092376709, 16.28589630126953, 16.63993263244629, 16.993967056274414, 17.348003387451172]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 5.0, 3.0, 8.0, 9.0, 15.0, 14.0, 21.0, 20.0, 30.0, 34.0, 35.0, 45.0, 50.0, 41.0, 40.0, 53.0, 64.0, 37.0, 49.0, 56.0, 56.0, 45.0, 55.0, 40.0, 24.0, 28.0, 17.0, 24.0, 10.0, 11.0, 9.0, 9.0, 12.0, 2.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.445357322692871, -3.3283238410949707, -3.2112903594970703, -3.094256639480591, -2.9772231578826904, -2.86018967628479, -2.7431559562683105, -2.62612247467041, -2.5090889930725098, -2.3920555114746094, -2.275022029876709, -2.1579883098602295, -2.040954828262329, -1.9239213466644287, -1.8068877458572388, -1.6898541450500488, -1.5728206634521484, -1.455787181854248, -1.338753581047058, -1.2217199802398682, -1.1046864986419678, -0.9876529574394226, -0.8706194162368774, -0.7535858750343323, -0.6365523338317871, -0.5195187926292419, -0.4024852514266968, -0.2854517102241516, -0.16841816902160645, -0.05138462781906128, 0.06564891338348389, 0.18268245458602905, 0.2997159957885742, 0.4167495369911194, 0.5337830781936646, 0.6508166193962097, 0.7678501605987549, 0.8848837018013, 1.0019172430038452, 1.1189508438110352, 1.2359843254089355, 1.353017807006836, 1.4700514078140259, 1.5870850086212158, 1.7041184902191162, 1.8211519718170166, 1.9381855726242065, 2.0552191734313965, 2.172252655029297, 2.2892861366271973, 2.4063196182250977, 2.523353338241577, 2.6403868198394775, 2.757420301437378, 2.8744540214538574, 2.991487503051758, 3.108520984649658, 3.2255544662475586, 3.342587947845459, 3.4596216678619385, 3.576655149459839, 3.6936886310577393, 3.8107223510742188, 3.927755832672119, 4.0447893142700195]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 11.0, 14.0, 29.0, 20.0, 32.0, 56.0, 57.0, 108.0, 141.0, 170.0, 337.0, 848.0, 2155.0, 7698.0, 44170.0, 3970659.0, 147342.0, 14489.0, 3608.0, 1225.0, 496.0, 261.0, 121.0, 69.0, 37.0, 23.0, 14.0, 14.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.232666015625, -3.15869140625, -3.084716796875, -3.0107421875, -2.936767578125, -2.86279296875, -2.788818359375, -2.71484375, -2.640869140625, -2.56689453125, -2.492919921875, -2.4189453125, -2.344970703125, -2.27099609375, -2.197021484375, -2.123046875, -2.049072265625, -1.97509765625, -1.901123046875, -1.8271484375, -1.753173828125, -1.67919921875, -1.605224609375, -1.53125, -1.457275390625, -1.38330078125, -1.309326171875, -1.2353515625, -1.161376953125, -1.08740234375, -1.013427734375, -0.939453125, -0.865478515625, -0.79150390625, -0.717529296875, -0.6435546875, -0.569580078125, -0.49560546875, -0.421630859375, -0.34765625, -0.273681640625, -0.19970703125, -0.125732421875, -0.0517578125, 0.022216796875, 0.09619140625, 0.170166015625, 0.244140625, 0.318115234375, 0.39208984375, 0.466064453125, 0.5400390625, 0.614013671875, 0.68798828125, 0.761962890625, 0.8359375, 0.909912109375, 0.98388671875, 1.057861328125, 1.1318359375, 1.205810546875, 1.27978515625, 1.353759765625, 1.427734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 20.0, 31.0, 60.0, 82.0, 126.0, 133.0, 152.0, 118.0, 117.0, 63.0, 37.0, 21.0, 17.0, 7.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.454345703125, -0.44472503662109375, -0.4351043701171875, -0.42548370361328125, -0.415863037109375, -0.40624237060546875, -0.3966217041015625, -0.38700103759765625, -0.37738037109375, -0.36775970458984375, -0.3581390380859375, -0.34851837158203125, -0.338897705078125, -0.32927703857421875, -0.3196563720703125, -0.31003570556640625, -0.3004150390625, -0.29079437255859375, -0.2811737060546875, -0.27155303955078125, -0.261932373046875, -0.25231170654296875, -0.2426910400390625, -0.23307037353515625, -0.22344970703125, -0.21382904052734375, -0.2042083740234375, -0.19458770751953125, -0.184967041015625, -0.17534637451171875, -0.1657257080078125, -0.15610504150390625, -0.146484375, -0.13686370849609375, -0.1272430419921875, -0.11762237548828125, -0.108001708984375, -0.09838104248046875, -0.0887603759765625, -0.07913970947265625, -0.06951904296875, -0.05989837646484375, -0.0502777099609375, -0.04065704345703125, -0.031036376953125, -0.02141571044921875, -0.0117950439453125, -0.00217437744140625, 0.0074462890625, 0.01706695556640625, 0.0266876220703125, 0.03630828857421875, 0.045928955078125, 0.05554962158203125, 0.0651702880859375, 0.07479095458984375, 0.08441162109375, 0.09403228759765625, 0.1036529541015625, 0.11327362060546875, 0.122894287109375, 0.13251495361328125, 0.1421356201171875, 0.15175628662109375, 0.161376953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 7.0, 19.0, 18.0, 29.0, 41.0, 69.0, 66.0, 115.0, 160.0, 274.0, 496.0, 942.0, 2405.0, 6932.0, 26970.0, 336917.0, 3738463.0, 61306.0, 12078.0, 3523.0, 1490.0, 704.0, 421.0, 266.0, 175.0, 126.0, 72.0, 57.0, 47.0, 20.0, 17.0, 15.0, 6.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.548828125, -2.482147216796875, -2.41546630859375, -2.348785400390625, -2.2821044921875, -2.215423583984375, -2.14874267578125, -2.082061767578125, -2.015380859375, -1.948699951171875, -1.88201904296875, -1.815338134765625, -1.7486572265625, -1.681976318359375, -1.61529541015625, -1.548614501953125, -1.48193359375, -1.415252685546875, -1.34857177734375, -1.281890869140625, -1.2152099609375, -1.148529052734375, -1.08184814453125, -1.015167236328125, -0.948486328125, -0.881805419921875, -0.81512451171875, -0.748443603515625, -0.6817626953125, -0.615081787109375, -0.54840087890625, -0.481719970703125, -0.4150390625, -0.348358154296875, -0.28167724609375, -0.214996337890625, -0.1483154296875, -0.081634521484375, -0.01495361328125, 0.051727294921875, 0.118408203125, 0.185089111328125, 0.25177001953125, 0.318450927734375, 0.3851318359375, 0.451812744140625, 0.51849365234375, 0.585174560546875, 0.65185546875, 0.718536376953125, 0.78521728515625, 0.851898193359375, 0.9185791015625, 0.985260009765625, 1.05194091796875, 1.118621826171875, 1.185302734375, 1.251983642578125, 1.31866455078125, 1.385345458984375, 1.4520263671875, 1.518707275390625, 1.58538818359375, 1.652069091796875, 1.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 6.0, 8.0, 12.0, 18.0, 39.0, 50.0, 90.0, 222.0, 865.0, 2026.0, 400.0, 127.0, 60.0, 47.0, 25.0, 16.0, 18.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4677734375, -0.4532661437988281, -0.43875885009765625, -0.4242515563964844, -0.4097442626953125, -0.3952369689941406, -0.38072967529296875, -0.3662223815917969, -0.351715087890625, -0.3372077941894531, -0.32270050048828125, -0.3081932067871094, -0.2936859130859375, -0.2791786193847656, -0.26467132568359375, -0.2501640319824219, -0.23565673828125, -0.22114944458007812, -0.20664215087890625, -0.19213485717773438, -0.1776275634765625, -0.16312026977539062, -0.14861297607421875, -0.13410568237304688, -0.119598388671875, -0.10509109497070312, -0.09058380126953125, -0.07607650756835938, -0.0615692138671875, -0.047061920166015625, -0.03255462646484375, -0.018047332763671875, -0.0035400390625, 0.010967254638671875, 0.02547454833984375, 0.039981842041015625, 0.0544891357421875, 0.06899642944335938, 0.08350372314453125, 0.09801101684570312, 0.112518310546875, 0.12702560424804688, 0.14153289794921875, 0.15604019165039062, 0.1705474853515625, 0.18505477905273438, 0.19956207275390625, 0.21406936645507812, 0.22857666015625, 0.24308395385742188, 0.25759124755859375, 0.2720985412597656, 0.2866058349609375, 0.3011131286621094, 0.31562042236328125, 0.3301277160644531, 0.344635009765625, 0.3591423034667969, 0.37364959716796875, 0.3881568908691406, 0.4026641845703125, 0.4171714782714844, 0.43167877197265625, 0.4461860656738281, 0.460693359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 15.0, 24.0, 31.0, 61.0, 84.0, 87.0, 126.0, 142.0, 125.0, 90.0, 67.0, 48.0, 34.0, 10.0, 15.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994015455245972, -1.8349367380142212, -1.7704719305038452, -1.7060070037841797, -1.6415421962738037, -1.5770773887634277, -1.5126125812530518, -1.4481477737426758, -1.3836829662322998, -1.3192181587219238, -1.2547533512115479, -1.1902885437011719, -1.1258236169815063, -1.0613588094711304, -0.9968940019607544, -0.9324291944503784, -0.8679642677307129, -0.8034994602203369, -0.7390345931053162, -0.6745697855949402, -0.6101049184799194, -0.5456401109695435, -0.4811753034591675, -0.4167104661464691, -0.35224562883377075, -0.2877807915210724, -0.22331596910953522, -0.15885114669799805, -0.09438630938529968, -0.02992147207260132, 0.03454333543777466, 0.09900817275047302, 0.16347289085388184, 0.2279377281665802, 0.29240256547927856, 0.35686737298965454, 0.4213322103023529, 0.48579704761505127, 0.5502618551254272, 0.6147266626358032, 0.679191529750824, 0.7436563372612, 0.8081212043762207, 0.8725860118865967, 0.9370508193969727, 1.0015156269073486, 1.0659804344177246, 1.1304453611373901, 1.1949101686477661, 1.259374976158142, 1.323839783668518, 1.3883047103881836, 1.4527695178985596, 1.5172343254089355, 1.5816991329193115, 1.6461639404296875, 1.7106287479400635, 1.7750935554504395, 1.8395583629608154, 1.9040231704711914, 1.968488097190857, 2.0329527854919434, 2.0974178314208984, 2.1618826389312744, 2.2263474464416504]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 14.0, 27.0, 20.0, 27.0, 33.0, 21.0, 37.0, 29.0, 59.0, 46.0, 45.0, 54.0, 48.0, 49.0, 52.0, 53.0, 34.0, 40.0, 54.0, 36.0, 23.0, 35.0, 30.0, 27.0, 19.0, 13.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.325851559638977, -1.289284110069275, -1.2527167797088623, -1.2161493301391602, -1.1795819997787476, -1.1430145502090454, -1.1064472198486328, -1.0698797702789307, -1.0333123207092285, -0.9967449307441711, -0.9601775407791138, -0.9236101508140564, -0.887042760848999, -0.8504753112792969, -0.8139079213142395, -0.7773405313491821, -0.7407732009887695, -0.7042058110237122, -0.6676384210586548, -0.6310710310935974, -0.59450364112854, -0.5579361915588379, -0.5213688015937805, -0.48480141162872314, -0.44823402166366577, -0.4116666316986084, -0.375099241733551, -0.33853182196617126, -0.3019644320011139, -0.2653970420360565, -0.22882963716983795, -0.19226223230361938, -0.15569496154785156, -0.11912756413221359, -0.08256016671657562, -0.04599276930093765, -0.009425371885299683, 0.02714201807975769, 0.06370942294597626, 0.10027682781219482, 0.1368442177772522, 0.17341160774230957, 0.20997901260852814, 0.2465464174747467, 0.2831138074398041, 0.31968119740486145, 0.3562486171722412, 0.3928160071372986, 0.42938339710235596, 0.46595078706741333, 0.5025181770324707, 0.5390855669975281, 0.5756529569625854, 0.6122204065322876, 0.648787796497345, 0.6853551864624023, 0.7219225764274597, 0.7584899663925171, 0.7950573563575745, 0.8316247463226318, 0.868192195892334, 0.9047595262527466, 0.9413269758224487, 0.9778943657875061, 1.0144617557525635]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 11.0, 12.0, 11.0, 16.0, 21.0, 27.0, 26.0, 56.0, 86.0, 111.0, 185.0, 371.0, 753.0, 2040.0, 6712.0, 30572.0, 236052.0, 662803.0, 87210.0, 15211.0, 3783.0, 1223.0, 502.0, 271.0, 138.0, 89.0, 51.0, 41.0, 33.0, 32.0, 8.0, 19.0, 13.0, 5.0, 8.0, 6.0, 5.0, 6.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0], "bins": [-1.623046875, -1.57830810546875, -1.5335693359375, -1.48883056640625, -1.444091796875, -1.39935302734375, -1.3546142578125, -1.30987548828125, -1.26513671875, -1.22039794921875, -1.1756591796875, -1.13092041015625, -1.086181640625, -1.04144287109375, -0.9967041015625, -0.95196533203125, -0.9072265625, -0.86248779296875, -0.8177490234375, -0.77301025390625, -0.728271484375, -0.68353271484375, -0.6387939453125, -0.59405517578125, -0.54931640625, -0.50457763671875, -0.4598388671875, -0.41510009765625, -0.370361328125, -0.32562255859375, -0.2808837890625, -0.23614501953125, -0.19140625, -0.14666748046875, -0.1019287109375, -0.05718994140625, -0.012451171875, 0.03228759765625, 0.0770263671875, 0.12176513671875, 0.16650390625, 0.21124267578125, 0.2559814453125, 0.30072021484375, 0.345458984375, 0.39019775390625, 0.4349365234375, 0.47967529296875, 0.5244140625, 0.56915283203125, 0.6138916015625, 0.65863037109375, 0.703369140625, 0.74810791015625, 0.7928466796875, 0.83758544921875, 0.88232421875, 0.92706298828125, 0.9718017578125, 1.01654052734375, 1.061279296875, 1.10601806640625, 1.1507568359375, 1.19549560546875, 1.240234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 16.0, 20.0, 42.0, 69.0, 90.0, 119.0, 147.0, 120.0, 118.0, 92.0, 50.0, 42.0, 32.0, 14.0, 12.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.463623046875, -0.45354461669921875, -0.4434661865234375, -0.43338775634765625, -0.423309326171875, -0.41323089599609375, -0.4031524658203125, -0.39307403564453125, -0.38299560546875, -0.37291717529296875, -0.3628387451171875, -0.35276031494140625, -0.342681884765625, -0.33260345458984375, -0.3225250244140625, -0.31244659423828125, -0.3023681640625, -0.29228973388671875, -0.2822113037109375, -0.27213287353515625, -0.262054443359375, -0.25197601318359375, -0.2418975830078125, -0.23181915283203125, -0.22174072265625, -0.21166229248046875, -0.2015838623046875, -0.19150543212890625, -0.181427001953125, -0.17134857177734375, -0.1612701416015625, -0.15119171142578125, -0.14111328125, -0.13103485107421875, -0.1209564208984375, -0.11087799072265625, -0.100799560546875, -0.09072113037109375, -0.0806427001953125, -0.07056427001953125, -0.06048583984375, -0.05040740966796875, -0.0403289794921875, -0.03025054931640625, -0.020172119140625, -0.01009368896484375, -1.52587890625e-05, 0.01006317138671875, 0.0201416015625, 0.03022003173828125, 0.0402984619140625, 0.05037689208984375, 0.060455322265625, 0.07053375244140625, 0.0806121826171875, 0.09069061279296875, 0.10076904296875, 0.11084747314453125, 0.1209259033203125, 0.13100433349609375, 0.141082763671875, 0.15116119384765625, 0.1612396240234375, 0.17131805419921875, 0.181396484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 11.0, 23.0, 32.0, 52.0, 63.0, 96.0, 163.0, 312.0, 530.0, 963.0, 2073.0, 4773.0, 13472.0, 45806.0, 226686.0, 574669.0, 131366.0, 30521.0, 9683.0, 3648.0, 1675.0, 785.0, 446.0, 261.0, 145.0, 93.0, 53.0, 49.0, 27.0, 20.0, 9.0, 3.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1025390625, -1.07220458984375, -1.0418701171875, -1.01153564453125, -0.981201171875, -0.95086669921875, -0.9205322265625, -0.89019775390625, -0.85986328125, -0.82952880859375, -0.7991943359375, -0.76885986328125, -0.738525390625, -0.70819091796875, -0.6778564453125, -0.64752197265625, -0.6171875, -0.58685302734375, -0.5565185546875, -0.52618408203125, -0.495849609375, -0.46551513671875, -0.4351806640625, -0.40484619140625, -0.37451171875, -0.34417724609375, -0.3138427734375, -0.28350830078125, -0.253173828125, -0.22283935546875, -0.1925048828125, -0.16217041015625, -0.1318359375, -0.10150146484375, -0.0711669921875, -0.04083251953125, -0.010498046875, 0.01983642578125, 0.0501708984375, 0.08050537109375, 0.11083984375, 0.14117431640625, 0.1715087890625, 0.20184326171875, 0.232177734375, 0.26251220703125, 0.2928466796875, 0.32318115234375, 0.353515625, 0.38385009765625, 0.4141845703125, 0.44451904296875, 0.474853515625, 0.50518798828125, 0.5355224609375, 0.56585693359375, 0.59619140625, 0.62652587890625, 0.6568603515625, 0.68719482421875, 0.717529296875, 0.74786376953125, 0.7781982421875, 0.80853271484375, 0.8388671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 7.0, 14.0, 22.0, 26.0, 22.0, 35.0, 48.0, 51.0, 63.0, 80.0, 57.0, 75.0, 70.0, 60.0, 62.0, 60.0, 58.0, 39.0, 28.0, 35.0, 19.0, 15.0, 8.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1252517700195312, -1.0962066650390625, -1.0671615600585938, -1.038116455078125, -1.0090713500976562, -0.9800262451171875, -0.9509811401367188, -0.92193603515625, -0.8928909301757812, -0.8638458251953125, -0.8348007202148438, -0.805755615234375, -0.7767105102539062, -0.7476654052734375, -0.7186203002929688, -0.6895751953125, -0.6605300903320312, -0.6314849853515625, -0.6024398803710938, -0.573394775390625, -0.5443496704101562, -0.5153045654296875, -0.48625946044921875, -0.45721435546875, -0.42816925048828125, -0.3991241455078125, -0.37007904052734375, -0.341033935546875, -0.31198883056640625, -0.2829437255859375, -0.25389862060546875, -0.224853515625, -0.19580841064453125, -0.1667633056640625, -0.13771820068359375, -0.108673095703125, -0.07962799072265625, -0.0505828857421875, -0.02153778076171875, 0.00750732421875, 0.03655242919921875, 0.0655975341796875, 0.09464263916015625, 0.123687744140625, 0.15273284912109375, 0.1817779541015625, 0.21082305908203125, 0.2398681640625, 0.26891326904296875, 0.2979583740234375, 0.32700347900390625, 0.356048583984375, 0.38509368896484375, 0.4141387939453125, 0.44318389892578125, 0.47222900390625, 0.5012741088867188, 0.5303192138671875, 0.5593643188476562, 0.588409423828125, 0.6174545288085938, 0.6464996337890625, 0.6755447387695312, 0.70458984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 10.0, 12.0, 20.0, 26.0, 40.0, 60.0, 72.0, 121.0, 212.0, 352.0, 588.0, 1104.0, 2234.0, 5428.0, 17745.0, 105174.0, 696754.0, 180767.0, 25097.0, 6992.0, 2663.0, 1323.0, 668.0, 404.0, 230.0, 149.0, 99.0, 54.0, 34.0, 22.0, 20.0, 15.0, 9.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6258316040039062, -0.6066436767578125, -0.5874557495117188, -0.568267822265625, -0.5490798950195312, -0.5298919677734375, -0.5107040405273438, -0.49151611328125, -0.47232818603515625, -0.4531402587890625, -0.43395233154296875, -0.414764404296875, -0.39557647705078125, -0.3763885498046875, -0.35720062255859375, -0.3380126953125, -0.31882476806640625, -0.2996368408203125, -0.28044891357421875, -0.261260986328125, -0.24207305908203125, -0.2228851318359375, -0.20369720458984375, -0.18450927734375, -0.16532135009765625, -0.1461334228515625, -0.12694549560546875, -0.107757568359375, -0.08856964111328125, -0.0693817138671875, -0.05019378662109375, -0.031005859375, -0.01181793212890625, 0.0073699951171875, 0.02655792236328125, 0.045745849609375, 0.06493377685546875, 0.0841217041015625, 0.10330963134765625, 0.12249755859375, 0.14168548583984375, 0.1608734130859375, 0.18006134033203125, 0.199249267578125, 0.21843719482421875, 0.2376251220703125, 0.25681304931640625, 0.2760009765625, 0.29518890380859375, 0.3143768310546875, 0.33356475830078125, 0.352752685546875, 0.37194061279296875, 0.3911285400390625, 0.41031646728515625, 0.42950439453125, 0.44869232177734375, 0.4678802490234375, 0.48706817626953125, 0.506256103515625, 0.5254440307617188, 0.5446319580078125, 0.5638198852539062, 0.5830078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 7.0, 9.0, 22.0, 33.0, 54.0, 71.0, 141.0, 190.0, 159.0, 123.0, 68.0, 42.0, 24.0, 10.0, 14.0, 11.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016057491302490234, -0.0001559574156999588, -0.00015133991837501526, -0.00014672242105007172, -0.00014210492372512817, -0.00013748742640018463, -0.0001328699290752411, -0.00012825243175029755, -0.000123634934425354, -0.00011901743710041046, -0.00011439993977546692, -0.00010978244245052338, -0.00010516494512557983, -0.00010054744780063629, -9.592995047569275e-05, -9.13124531507492e-05, -8.669495582580566e-05, -8.207745850086212e-05, -7.745996117591858e-05, -7.284246385097504e-05, -6.82249665260315e-05, -6.360746920108795e-05, -5.898997187614441e-05, -5.437247455120087e-05, -4.9754977226257324e-05, -4.513747990131378e-05, -4.051998257637024e-05, -3.59024852514267e-05, -3.1284987926483154e-05, -2.6667490601539612e-05, -2.204999327659607e-05, -1.7432495951652527e-05, -1.2814998626708984e-05, -8.197501301765442e-06, -3.5800039768218994e-06, 1.037493348121643e-06, 5.6549906730651855e-06, 1.0272487998008728e-05, 1.488998532295227e-05, 1.9507482647895813e-05, 2.4124979972839355e-05, 2.8742477297782898e-05, 3.335997462272644e-05, 3.797747194766998e-05, 4.2594969272613525e-05, 4.721246659755707e-05, 5.182996392250061e-05, 5.644746124744415e-05, 6.10649585723877e-05, 6.568245589733124e-05, 7.029995322227478e-05, 7.491745054721832e-05, 7.953494787216187e-05, 8.415244519710541e-05, 8.876994252204895e-05, 9.338743984699249e-05, 9.800493717193604e-05, 0.00010262243449687958, 0.00010723993182182312, 0.00011185742914676666, 0.0001164749264717102, 0.00012109242379665375, 0.0001257099211215973, 0.00013032741844654083, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 17.0, 17.0, 17.0, 17.0, 42.0, 45.0, 68.0, 83.0, 146.0, 206.0, 332.0, 555.0, 1044.0, 1927.0, 4128.0, 10042.0, 31976.0, 197884.0, 649514.0, 112787.0, 22721.0, 7743.0, 3327.0, 1665.0, 865.0, 450.0, 309.0, 173.0, 128.0, 102.0, 64.0, 33.0, 33.0, 18.0, 15.0, 11.0, 11.0, 7.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.572265625, -0.5534210205078125, -0.534576416015625, -0.5157318115234375, -0.49688720703125, -0.4780426025390625, -0.459197998046875, -0.4403533935546875, -0.4215087890625, -0.4026641845703125, -0.383819580078125, -0.3649749755859375, -0.34613037109375, -0.3272857666015625, -0.308441162109375, -0.2895965576171875, -0.270751953125, -0.2519073486328125, -0.233062744140625, -0.2142181396484375, -0.19537353515625, -0.1765289306640625, -0.157684326171875, -0.1388397216796875, -0.1199951171875, -0.1011505126953125, -0.082305908203125, -0.0634613037109375, -0.04461669921875, -0.0257720947265625, -0.006927490234375, 0.0119171142578125, 0.03076171875, 0.0496063232421875, 0.068450927734375, 0.0872955322265625, 0.10614013671875, 0.1249847412109375, 0.143829345703125, 0.1626739501953125, 0.1815185546875, 0.2003631591796875, 0.219207763671875, 0.2380523681640625, 0.25689697265625, 0.2757415771484375, 0.294586181640625, 0.3134307861328125, 0.332275390625, 0.3511199951171875, 0.369964599609375, 0.3888092041015625, 0.40765380859375, 0.4264984130859375, 0.445343017578125, 0.4641876220703125, 0.4830322265625, 0.5018768310546875, 0.520721435546875, 0.5395660400390625, 0.55841064453125, 0.5772552490234375, 0.596099853515625, 0.6149444580078125, 0.6337890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 10.0, 13.0, 12.0, 24.0, 31.0, 54.0, 69.0, 103.0, 116.0, 121.0, 117.0, 83.0, 59.0, 41.0, 31.0, 28.0, 14.0, 18.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.447265625, -0.4346122741699219, -0.42195892333984375, -0.4093055725097656, -0.3966522216796875, -0.3839988708496094, -0.37134552001953125, -0.3586921691894531, -0.346038818359375, -0.3333854675292969, -0.32073211669921875, -0.3080787658691406, -0.2954254150390625, -0.2827720642089844, -0.27011871337890625, -0.2574653625488281, -0.24481201171875, -0.23215866088867188, -0.21950531005859375, -0.20685195922851562, -0.1941986083984375, -0.18154525756835938, -0.16889190673828125, -0.15623855590820312, -0.143585205078125, -0.13093185424804688, -0.11827850341796875, -0.10562515258789062, -0.0929718017578125, -0.08031845092773438, -0.06766510009765625, -0.055011749267578125, -0.0423583984375, -0.029705047607421875, -0.01705169677734375, -0.004398345947265625, 0.0082550048828125, 0.020908355712890625, 0.03356170654296875, 0.046215057373046875, 0.058868408203125, 0.07152175903320312, 0.08417510986328125, 0.09682846069335938, 0.1094818115234375, 0.12213516235351562, 0.13478851318359375, 0.14744186401367188, 0.16009521484375, 0.17274856567382812, 0.18540191650390625, 0.19805526733398438, 0.2107086181640625, 0.22336196899414062, 0.23601531982421875, 0.24866867065429688, 0.261322021484375, 0.2739753723144531, 0.28662872314453125, 0.2992820739746094, 0.3119354248046875, 0.3245887756347656, 0.33724212646484375, 0.3498954772949219, 0.362548828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 20.0, 18.0, 25.0, 62.0, 114.0, 222.0, 245.0, 141.0, 60.0, 41.0, 22.0, 15.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.541660308837891, -4.260741233825684, -3.9798223972320557, -3.6989035606384277, -3.4179844856262207, -3.1370654106140137, -2.8561465740203857, -2.575227737426758, -2.294308662414551, -2.0133895874023438, -1.7324707508087158, -1.4515517950057983, -1.1706328392028809, -0.8897138833999634, -0.6087949275970459, -0.3278759717941284, -0.04695701599121094, 0.23396193981170654, 0.514880895614624, 0.7957998514175415, 1.076718807220459, 1.3576377630233765, 1.638556718826294, 1.9194756746292114, 2.200394630432129, 2.481313705444336, 2.762232542037964, 3.043151378631592, 3.324070453643799, 3.604989528656006, 3.885908365249634, 4.166827201843262, 4.447747230529785, 4.728666305541992, 5.009585380554199, 5.290503978729248, 5.571423053741455, 5.852342128753662, 6.133260726928711, 6.414179801940918, 6.695098876953125, 6.976017951965332, 7.256937026977539, 7.537855625152588, 7.818774700164795, 8.099693298339844, 8.38061237335205, 8.661531448364258, 8.942450523376465, 9.223369598388672, 9.504288673400879, 9.785207748413086, 10.066125869750977, 10.347044944763184, 10.62796401977539, 10.908883094787598, 11.189802169799805, 11.470721244812012, 11.751640319824219, 12.032559394836426, 12.313478469848633, 12.594396591186523, 12.87531566619873, 13.156234741210938, 13.437153816223145]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 8.0, 16.0, 17.0, 10.0, 29.0, 34.0, 25.0, 36.0, 25.0, 37.0, 41.0, 63.0, 51.0, 80.0, 61.0, 68.0, 58.0, 59.0, 45.0, 36.0, 44.0, 33.0, 27.0, 19.0, 15.0, 14.0, 10.0, 7.0, 8.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.831258773803711, -5.677872180938721, -5.5244855880737305, -5.371099472045898, -5.217712879180908, -5.064326286315918, -4.910939693450928, -4.7575531005859375, -4.6041669845581055, -4.450780391693115, -4.297393798828125, -4.144007682800293, -3.9906210899353027, -3.8372344970703125, -3.6838479042053223, -3.530461311340332, -3.377074718475342, -3.2236881256103516, -3.0703017711639404, -2.91691517829895, -2.763528823852539, -2.610142230987549, -2.4567556381225586, -2.3033690452575684, -2.1499826908111572, -1.9965962171554565, -1.8432097434997559, -1.6898231506347656, -1.536436676979065, -1.3830502033233643, -1.229663610458374, -1.0762771368026733, -0.9228904247283936, -0.7695039510726929, -0.6161174178123474, -0.46273091435432434, -0.30934441089630127, -0.15595793724060059, -0.002571403980255127, 0.15081512928009033, 0.304201602935791, 0.4575881063938141, 0.6109746098518372, 0.7643611431121826, 0.9177476167678833, 1.071134090423584, 1.2245206832885742, 1.377907156944275, 1.5312936305999756, 1.6846801042556763, 1.838066577911377, 1.9914531707763672, 2.1448397636413574, 2.2982261180877686, 2.451612710952759, 2.60499906539917, 2.75838565826416, 2.9117722511291504, 3.0651586055755615, 3.2185451984405518, 3.371931552886963, 3.525318145751953, 3.6787047386169434, 3.8320913314819336, 3.9854776859283447]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 5.0, 6.0, 8.0, 14.0, 25.0, 21.0, 32.0, 38.0, 57.0, 80.0, 115.0, 209.0, 429.0, 1034.0, 3710.0, 19981.0, 1239259.0, 2899306.0, 23521.0, 4350.0, 1236.0, 461.0, 182.0, 88.0, 50.0, 24.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0], "bins": [-4.80078125, -4.702850341796875, -4.60491943359375, -4.506988525390625, -4.4090576171875, -4.311126708984375, -4.21319580078125, -4.115264892578125, -4.017333984375, -3.919403076171875, -3.82147216796875, -3.723541259765625, -3.6256103515625, -3.527679443359375, -3.42974853515625, -3.331817626953125, -3.23388671875, -3.135955810546875, -3.03802490234375, -2.940093994140625, -2.8421630859375, -2.744232177734375, -2.64630126953125, -2.548370361328125, -2.450439453125, -2.352508544921875, -2.25457763671875, -2.156646728515625, -2.0587158203125, -1.960784912109375, -1.86285400390625, -1.764923095703125, -1.6669921875, -1.569061279296875, -1.47113037109375, -1.373199462890625, -1.2752685546875, -1.177337646484375, -1.07940673828125, -0.981475830078125, -0.883544921875, -0.785614013671875, -0.68768310546875, -0.589752197265625, -0.4918212890625, -0.393890380859375, -0.29595947265625, -0.198028564453125, -0.10009765625, -0.002166748046875, 0.09576416015625, 0.193695068359375, 0.2916259765625, 0.389556884765625, 0.48748779296875, 0.585418701171875, 0.683349609375, 0.781280517578125, 0.87921142578125, 0.977142333984375, 1.0750732421875, 1.173004150390625, 1.27093505859375, 1.368865966796875, 1.466796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 9.0, 15.0, 26.0, 44.0, 64.0, 95.0, 103.0, 110.0, 131.0, 129.0, 85.0, 57.0, 47.0, 26.0, 19.0, 11.0, 13.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0], "bins": [-0.47607421875, -0.46637916564941406, -0.4566841125488281, -0.4469890594482422, -0.43729400634765625, -0.4275989532470703, -0.4179039001464844, -0.40820884704589844, -0.3985137939453125, -0.38881874084472656, -0.3791236877441406, -0.3694286346435547, -0.35973358154296875, -0.3500385284423828, -0.3403434753417969, -0.33064842224121094, -0.320953369140625, -0.31125831604003906, -0.3015632629394531, -0.2918682098388672, -0.28217315673828125, -0.2724781036376953, -0.2627830505371094, -0.25308799743652344, -0.2433929443359375, -0.23369789123535156, -0.22400283813476562, -0.2143077850341797, -0.20461273193359375, -0.1949176788330078, -0.18522262573242188, -0.17552757263183594, -0.16583251953125, -0.15613746643066406, -0.14644241333007812, -0.1367473602294922, -0.12705230712890625, -0.11735725402832031, -0.10766220092773438, -0.09796714782714844, -0.0882720947265625, -0.07857704162597656, -0.06888198852539062, -0.05918693542480469, -0.04949188232421875, -0.03979682922363281, -0.030101776123046875, -0.020406723022460938, -0.010711669921875, -0.0010166168212890625, 0.008678436279296875, 0.018373489379882812, 0.02806854248046875, 0.03776359558105469, 0.047458648681640625, 0.05715370178222656, 0.0668487548828125, 0.07654380798339844, 0.08623886108398438, 0.09593391418457031, 0.10562896728515625, 0.11532402038574219, 0.12501907348632812, 0.13471412658691406, 0.1444091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 10.0, 13.0, 13.0, 28.0, 40.0, 96.0, 149.0, 396.0, 1080.0, 4751.0, 79962.0, 4087992.0, 16522.0, 2119.0, 559.0, 229.0, 119.0, 75.0, 38.0, 39.0, 11.0, 15.0, 7.0, 11.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.03125, -8.8177490234375, -8.604248046875, -8.3907470703125, -8.17724609375, -7.9637451171875, -7.750244140625, -7.5367431640625, -7.3232421875, -7.1097412109375, -6.896240234375, -6.6827392578125, -6.46923828125, -6.2557373046875, -6.042236328125, -5.8287353515625, -5.615234375, -5.4017333984375, -5.188232421875, -4.9747314453125, -4.76123046875, -4.5477294921875, -4.334228515625, -4.1207275390625, -3.9072265625, -3.6937255859375, -3.480224609375, -3.2667236328125, -3.05322265625, -2.8397216796875, -2.626220703125, -2.4127197265625, -2.19921875, -1.9857177734375, -1.772216796875, -1.5587158203125, -1.34521484375, -1.1317138671875, -0.918212890625, -0.7047119140625, -0.4912109375, -0.2777099609375, -0.064208984375, 0.1492919921875, 0.36279296875, 0.5762939453125, 0.789794921875, 1.0032958984375, 1.216796875, 1.4302978515625, 1.643798828125, 1.8572998046875, 2.07080078125, 2.2843017578125, 2.497802734375, 2.7113037109375, 2.9248046875, 3.1383056640625, 3.351806640625, 3.5653076171875, 3.77880859375, 3.9923095703125, 4.205810546875, 4.4193115234375, 4.6328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 12.0, 18.0, 39.0, 58.0, 103.0, 275.0, 1692.0, 1343.0, 294.0, 100.0, 46.0, 26.0, 21.0, 11.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9540023803710938, -0.9221649169921875, -0.8903274536132812, -0.858489990234375, -0.8266525268554688, -0.7948150634765625, -0.7629776000976562, -0.73114013671875, -0.6993026733398438, -0.6674652099609375, -0.6356277465820312, -0.603790283203125, -0.5719528198242188, -0.5401153564453125, -0.5082778930664062, -0.4764404296875, -0.44460296630859375, -0.4127655029296875, -0.38092803955078125, -0.349090576171875, -0.31725311279296875, -0.2854156494140625, -0.25357818603515625, -0.22174072265625, -0.18990325927734375, -0.1580657958984375, -0.12622833251953125, -0.094390869140625, -0.06255340576171875, -0.0307159423828125, 0.00112152099609375, 0.032958984375, 0.06479644775390625, 0.0966339111328125, 0.12847137451171875, 0.160308837890625, 0.19214630126953125, 0.2239837646484375, 0.25582122802734375, 0.28765869140625, 0.31949615478515625, 0.3513336181640625, 0.38317108154296875, 0.415008544921875, 0.44684600830078125, 0.4786834716796875, 0.5105209350585938, 0.5423583984375, 0.5741958618164062, 0.6060333251953125, 0.6378707885742188, 0.669708251953125, 0.7015457153320312, 0.7333831787109375, 0.7652206420898438, 0.79705810546875, 0.8288955688476562, 0.8607330322265625, 0.8925704956054688, 0.924407958984375, 0.9562454223632812, 0.9880828857421875, 1.0199203491210938, 1.0517578125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 21.0, 107.0, 653.0, 192.0, 26.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.709108352661133, -16.95880889892578, -16.208507537841797, -15.458208084106445, -14.707908630371094, -13.957608222961426, -13.207307815551758, -12.457008361816406, -11.706707954406738, -10.95640754699707, -10.206108093261719, -9.45580768585205, -8.705507278442383, -7.955207824707031, -7.204907417297363, -6.4546074867248535, -5.704307556152344, -4.954007625579834, -4.203707695007324, -3.4534072875976562, -2.7031073570251465, -1.9528074264526367, -1.2025070190429688, -0.452207088470459, 0.2980928421020508, 1.04839289188385, 1.7986929416656494, 2.5489931106567383, 3.299293041229248, 4.049592971801758, 4.799893379211426, 5.5501933097839355, 6.3004913330078125, 7.050791263580322, 7.801091194152832, 8.5513916015625, 9.301691055297852, 10.05199146270752, 10.802291870117188, 11.552591323852539, 12.302891731262207, 13.053192138671875, 13.803491592407227, 14.553791999816895, 15.304092407226562, 16.054391860961914, 16.804691314697266, 17.55499267578125, 18.3052921295166, 19.055591583251953, 19.805892944335938, 20.55619239807129, 21.30649185180664, 22.056793212890625, 22.807092666625977, 23.557392120361328, 24.307693481445312, 25.057992935180664, 25.80829429626465, 26.55859375, 27.30889320373535, 28.059192657470703, 28.809494018554688, 29.55979347229004, 30.31009292602539]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 13.0, 15.0, 37.0, 54.0, 65.0, 78.0, 100.0, 107.0, 124.0, 117.0, 94.0, 57.0, 58.0, 35.0, 16.0, 12.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.502362251281738, -4.349108695983887, -4.195854663848877, -4.042601108551025, -3.889347553253174, -3.736093759536743, -3.5828399658203125, -3.429586410522461, -3.2763326168060303, -3.1230788230895996, -2.969825267791748, -2.8165714740753174, -2.6633176803588867, -2.510064125061035, -2.3568103313446045, -2.203556537628174, -2.0503029823303223, -1.8970493078231812, -1.74379563331604, -1.5905418395996094, -1.4372881650924683, -1.2840344905853271, -1.1307806968688965, -0.9775270223617554, -0.8242733478546143, -0.6710196733474731, -0.5177659392356873, -0.36451223492622375, -0.21125853061676025, -0.05800485610961914, 0.09524887800216675, 0.24850261211395264, 0.40175580978393555, 0.5550094842910767, 0.7082632184028625, 0.8615169525146484, 1.0147706270217896, 1.1680243015289307, 1.3212780952453613, 1.4745317697525024, 1.6277854442596436, 1.7810391187667847, 1.9342927932739258, 2.0875465869903564, 2.240800380706787, 2.3940539360046387, 2.5473077297210693, 2.7005615234375, 2.8538150787353516, 3.0070688724517822, 3.160322427749634, 3.3135762214660645, 3.466829776763916, 3.6200835704803467, 3.7733373641967773, 3.926590919494629, 4.0798444747924805, 4.233098030090332, 4.386352062225342, 4.539605617523193, 4.692859172821045, 4.846113204956055, 4.999366760253906, 5.152620315551758, 5.305874347686768]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 9.0, 9.0, 15.0, 22.0, 24.0, 37.0, 41.0, 67.0, 114.0, 164.0, 233.0, 409.0, 669.0, 1240.0, 2370.0, 5496.0, 15633.0, 62301.0, 423833.0, 443037.0, 65335.0, 16283.0, 5660.0, 2449.0, 1229.0, 660.0, 412.0, 236.0, 169.0, 99.0, 77.0, 51.0, 48.0, 28.0, 23.0, 12.0, 14.0, 9.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.283203125, -1.237396240234375, -1.19158935546875, -1.145782470703125, -1.0999755859375, -1.054168701171875, -1.00836181640625, -0.962554931640625, -0.916748046875, -0.870941162109375, -0.82513427734375, -0.779327392578125, -0.7335205078125, -0.687713623046875, -0.64190673828125, -0.596099853515625, -0.55029296875, -0.504486083984375, -0.45867919921875, -0.412872314453125, -0.3670654296875, -0.321258544921875, -0.27545166015625, -0.229644775390625, -0.183837890625, -0.138031005859375, -0.09222412109375, -0.046417236328125, -0.0006103515625, 0.045196533203125, 0.09100341796875, 0.136810302734375, 0.1826171875, 0.228424072265625, 0.27423095703125, 0.320037841796875, 0.3658447265625, 0.411651611328125, 0.45745849609375, 0.503265380859375, 0.549072265625, 0.594879150390625, 0.64068603515625, 0.686492919921875, 0.7322998046875, 0.778106689453125, 0.82391357421875, 0.869720458984375, 0.91552734375, 0.961334228515625, 1.00714111328125, 1.052947998046875, 1.0987548828125, 1.144561767578125, 1.19036865234375, 1.236175537109375, 1.281982421875, 1.327789306640625, 1.37359619140625, 1.419403076171875, 1.4652099609375, 1.511016845703125, 1.55682373046875, 1.602630615234375, 1.6484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 17.0, 33.0, 46.0, 56.0, 73.0, 116.0, 117.0, 111.0, 82.0, 105.0, 79.0, 44.0, 27.0, 25.0, 16.0, 13.0, 6.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30419921875, -0.294158935546875, -0.28411865234375, -0.274078369140625, -0.2640380859375, -0.253997802734375, -0.24395751953125, -0.233917236328125, -0.223876953125, -0.213836669921875, -0.20379638671875, -0.193756103515625, -0.1837158203125, -0.173675537109375, -0.16363525390625, -0.153594970703125, -0.1435546875, -0.133514404296875, -0.12347412109375, -0.113433837890625, -0.1033935546875, -0.093353271484375, -0.08331298828125, -0.073272705078125, -0.063232421875, -0.053192138671875, -0.04315185546875, -0.033111572265625, -0.0230712890625, -0.013031005859375, -0.00299072265625, 0.007049560546875, 0.01708984375, 0.027130126953125, 0.03717041015625, 0.047210693359375, 0.0572509765625, 0.067291259765625, 0.07733154296875, 0.087371826171875, 0.097412109375, 0.107452392578125, 0.11749267578125, 0.127532958984375, 0.1375732421875, 0.147613525390625, 0.15765380859375, 0.167694091796875, 0.177734375, 0.187774658203125, 0.19781494140625, 0.207855224609375, 0.2178955078125, 0.227935791015625, 0.23797607421875, 0.248016357421875, 0.258056640625, 0.268096923828125, 0.27813720703125, 0.288177490234375, 0.2982177734375, 0.308258056640625, 0.31829833984375, 0.328338623046875, 0.33837890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 15.0, 15.0, 20.0, 23.0, 41.0, 75.0, 114.0, 209.0, 308.0, 564.0, 1087.0, 2262.0, 5005.0, 11738.0, 30222.0, 90948.0, 322703.0, 400145.0, 119530.0, 37960.0, 14199.0, 5825.0, 2674.0, 1326.0, 644.0, 345.0, 196.0, 102.0, 77.0, 53.0, 41.0, 21.0, 20.0, 8.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.79541015625, -0.7733840942382812, -0.7513580322265625, -0.7293319702148438, -0.707305908203125, -0.6852798461914062, -0.6632537841796875, -0.6412277221679688, -0.61920166015625, -0.5971755981445312, -0.5751495361328125, -0.5531234741210938, -0.531097412109375, -0.5090713500976562, -0.4870452880859375, -0.46501922607421875, -0.4429931640625, -0.42096710205078125, -0.3989410400390625, -0.37691497802734375, -0.354888916015625, -0.33286285400390625, -0.3108367919921875, -0.28881072998046875, -0.26678466796875, -0.24475860595703125, -0.2227325439453125, -0.20070648193359375, -0.178680419921875, -0.15665435791015625, -0.1346282958984375, -0.11260223388671875, -0.090576171875, -0.06855010986328125, -0.0465240478515625, -0.02449798583984375, -0.002471923828125, 0.01955413818359375, 0.0415802001953125, 0.06360626220703125, 0.08563232421875, 0.10765838623046875, 0.1296844482421875, 0.15171051025390625, 0.173736572265625, 0.19576263427734375, 0.2177886962890625, 0.23981475830078125, 0.2618408203125, 0.28386688232421875, 0.3058929443359375, 0.32791900634765625, 0.349945068359375, 0.37197113037109375, 0.3939971923828125, 0.41602325439453125, 0.43804931640625, 0.46007537841796875, 0.4821014404296875, 0.5041275024414062, 0.526153564453125, 0.5481796264648438, 0.5702056884765625, 0.5922317504882812, 0.6142578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 10.0, 8.0, 15.0, 17.0, 17.0, 27.0, 26.0, 33.0, 32.0, 35.0, 48.0, 34.0, 53.0, 51.0, 44.0, 48.0, 50.0, 48.0, 53.0, 44.0, 38.0, 34.0, 28.0, 27.0, 37.0, 19.0, 21.0, 20.0, 16.0, 10.0, 14.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.72412109375, -0.7038803100585938, -0.6836395263671875, -0.6633987426757812, -0.643157958984375, -0.6229171752929688, -0.6026763916015625, -0.5824356079101562, -0.56219482421875, -0.5419540405273438, -0.5217132568359375, -0.5014724731445312, -0.481231689453125, -0.46099090576171875, -0.4407501220703125, -0.42050933837890625, -0.4002685546875, -0.38002777099609375, -0.3597869873046875, -0.33954620361328125, -0.319305419921875, -0.29906463623046875, -0.2788238525390625, -0.25858306884765625, -0.23834228515625, -0.21810150146484375, -0.1978607177734375, -0.17761993408203125, -0.157379150390625, -0.13713836669921875, -0.1168975830078125, -0.09665679931640625, -0.076416015625, -0.05617523193359375, -0.0359344482421875, -0.01569366455078125, 0.004547119140625, 0.02478790283203125, 0.0450286865234375, 0.06526947021484375, 0.08551025390625, 0.10575103759765625, 0.1259918212890625, 0.14623260498046875, 0.166473388671875, 0.18671417236328125, 0.2069549560546875, 0.22719573974609375, 0.2474365234375, 0.26767730712890625, 0.2879180908203125, 0.30815887451171875, 0.328399658203125, 0.34864044189453125, 0.3688812255859375, 0.38912200927734375, 0.40936279296875, 0.42960357666015625, 0.4498443603515625, 0.47008514404296875, 0.490325927734375, 0.5105667114257812, 0.5308074951171875, 0.5510482788085938, 0.5712890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 5.0, 10.0, 16.0, 18.0, 49.0, 68.0, 94.0, 127.0, 246.0, 361.0, 601.0, 971.0, 1692.0, 3034.0, 5765.0, 12546.0, 31145.0, 95906.0, 338862.0, 381927.0, 111785.0, 35553.0, 13715.0, 6368.0, 3322.0, 1732.0, 992.0, 560.0, 357.0, 219.0, 141.0, 113.0, 71.0, 55.0, 30.0, 25.0, 20.0, 12.0, 14.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26581573486328125, -0.2569732666015625, -0.24813079833984375, -0.239288330078125, -0.23044586181640625, -0.2216033935546875, -0.21276092529296875, -0.20391845703125, -0.19507598876953125, -0.1862335205078125, -0.17739105224609375, -0.168548583984375, -0.15970611572265625, -0.1508636474609375, -0.14202117919921875, -0.1331787109375, -0.12433624267578125, -0.1154937744140625, -0.10665130615234375, -0.097808837890625, -0.08896636962890625, -0.0801239013671875, -0.07128143310546875, -0.06243896484375, -0.05359649658203125, -0.0447540283203125, -0.03591156005859375, -0.027069091796875, -0.01822662353515625, -0.0093841552734375, -0.00054168701171875, 0.00830078125, 0.01714324951171875, 0.0259857177734375, 0.03482818603515625, 0.043670654296875, 0.05251312255859375, 0.0613555908203125, 0.07019805908203125, 0.07904052734375, 0.08788299560546875, 0.0967254638671875, 0.10556793212890625, 0.114410400390625, 0.12325286865234375, 0.1320953369140625, 0.14093780517578125, 0.1497802734375, 0.15862274169921875, 0.1674652099609375, 0.17630767822265625, 0.185150146484375, 0.19399261474609375, 0.2028350830078125, 0.21167755126953125, 0.22052001953125, 0.22936248779296875, 0.2382049560546875, 0.24704742431640625, 0.255889892578125, 0.26473236083984375, 0.2735748291015625, 0.28241729736328125, 0.291259765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 3.0, 10.0, 20.0, 14.0, 32.0, 49.0, 104.0, 166.0, 194.0, 159.0, 89.0, 65.0, 24.0, 20.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014352798461914062, -0.00013868138194084167, -0.00013383477926254272, -0.00012898817658424377, -0.00012414157390594482, -0.00011929497122764587, -0.00011444836854934692, -0.00010960176587104797, -0.00010475516319274902, -9.990856051445007e-05, -9.506195783615112e-05, -9.021535515785217e-05, -8.536875247955322e-05, -8.052214980125427e-05, -7.567554712295532e-05, -7.082894444465637e-05, -6.598234176635742e-05, -6.113573908805847e-05, -5.628913640975952e-05, -5.144253373146057e-05, -4.659593105316162e-05, -4.174932837486267e-05, -3.690272569656372e-05, -3.205612301826477e-05, -2.720952033996582e-05, -2.236291766166687e-05, -1.751631498336792e-05, -1.266971230506897e-05, -7.82310962677002e-06, -2.9765069484710693e-06, 1.8700957298278809e-06, 6.716698408126831e-06, 1.1563301086425781e-05, 1.640990376472473e-05, 2.125650644302368e-05, 2.6103109121322632e-05, 3.094971179962158e-05, 3.579631447792053e-05, 4.064291715621948e-05, 4.548951983451843e-05, 5.033612251281738e-05, 5.518272519111633e-05, 6.002932786941528e-05, 6.487593054771423e-05, 6.972253322601318e-05, 7.456913590431213e-05, 7.941573858261108e-05, 8.426234126091003e-05, 8.910894393920898e-05, 9.395554661750793e-05, 9.880214929580688e-05, 0.00010364875197410583, 0.00010849535465240479, 0.00011334195733070374, 0.00011818856000900269, 0.00012303516268730164, 0.00012788176536560059, 0.00013272836804389954, 0.00013757497072219849, 0.00014242157340049744, 0.0001472681760787964, 0.00015211477875709534, 0.0001569613814353943, 0.00016180798411369324, 0.0001666545867919922]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 11.0, 15.0, 15.0, 38.0, 34.0, 61.0, 86.0, 138.0, 230.0, 369.0, 661.0, 1097.0, 2043.0, 4198.0, 9645.0, 25478.0, 81229.0, 355227.0, 422951.0, 95323.0, 29080.0, 10751.0, 4799.0, 2183.0, 1200.0, 664.0, 361.0, 222.0, 155.0, 96.0, 55.0, 32.0, 36.0, 12.0, 15.0, 5.0, 9.0, 4.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.41357421875, -0.4017791748046875, -0.389984130859375, -0.3781890869140625, -0.36639404296875, -0.3545989990234375, -0.342803955078125, -0.3310089111328125, -0.3192138671875, -0.3074188232421875, -0.295623779296875, -0.2838287353515625, -0.27203369140625, -0.2602386474609375, -0.248443603515625, -0.2366485595703125, -0.224853515625, -0.2130584716796875, -0.201263427734375, -0.1894683837890625, -0.17767333984375, -0.1658782958984375, -0.154083251953125, -0.1422882080078125, -0.1304931640625, -0.1186981201171875, -0.106903076171875, -0.0951080322265625, -0.08331298828125, -0.0715179443359375, -0.059722900390625, -0.0479278564453125, -0.0361328125, -0.0243377685546875, -0.012542724609375, -0.0007476806640625, 0.01104736328125, 0.0228424072265625, 0.034637451171875, 0.0464324951171875, 0.0582275390625, 0.0700225830078125, 0.081817626953125, 0.0936126708984375, 0.10540771484375, 0.1172027587890625, 0.128997802734375, 0.1407928466796875, 0.152587890625, 0.1643829345703125, 0.176177978515625, 0.1879730224609375, 0.19976806640625, 0.2115631103515625, 0.223358154296875, 0.2351531982421875, 0.2469482421875, 0.2587432861328125, 0.270538330078125, 0.2823333740234375, 0.29412841796875, 0.3059234619140625, 0.317718505859375, 0.3295135498046875, 0.34130859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 10.0, 13.0, 20.0, 26.0, 24.0, 33.0, 45.0, 53.0, 69.0, 68.0, 104.0, 81.0, 76.0, 76.0, 57.0, 34.0, 30.0, 38.0, 19.0, 16.0, 21.0, 15.0, 10.0, 7.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.22908973693847656, -0.22124099731445312, -0.2133922576904297, -0.20554351806640625, -0.1976947784423828, -0.18984603881835938, -0.18199729919433594, -0.1741485595703125, -0.16629981994628906, -0.15845108032226562, -0.1506023406982422, -0.14275360107421875, -0.1349048614501953, -0.12705612182617188, -0.11920738220214844, -0.111358642578125, -0.10350990295410156, -0.09566116333007812, -0.08781242370605469, -0.07996368408203125, -0.07211494445800781, -0.06426620483398438, -0.05641746520996094, -0.0485687255859375, -0.04071998596191406, -0.032871246337890625, -0.025022506713867188, -0.01717376708984375, -0.009325027465820312, -0.001476287841796875, 0.0063724517822265625, 0.01422119140625, 0.022069931030273438, 0.029918670654296875, 0.03776741027832031, 0.04561614990234375, 0.05346488952636719, 0.061313629150390625, 0.06916236877441406, 0.0770111083984375, 0.08485984802246094, 0.09270858764648438, 0.10055732727050781, 0.10840606689453125, 0.11625480651855469, 0.12410354614257812, 0.13195228576660156, 0.139801025390625, 0.14764976501464844, 0.15549850463867188, 0.1633472442626953, 0.17119598388671875, 0.1790447235107422, 0.18689346313476562, 0.19474220275878906, 0.2025909423828125, 0.21043968200683594, 0.21828842163085938, 0.2261371612548828, 0.23398590087890625, 0.2418346405029297, 0.24968338012695312, 0.25753211975097656, 0.265380859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 13.0, 18.0, 32.0, 56.0, 111.0, 161.0, 176.0, 172.0, 100.0, 64.0, 36.0, 11.0, 13.0, 12.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4878716468811035, -5.288812160491943, -5.089752197265625, -4.890692710876465, -4.691633224487305, -4.4925737380981445, -4.293514251708984, -4.094454288482666, -3.895394802093506, -3.6963353157043457, -3.4972755908966064, -3.298215866088867, -3.099156379699707, -2.900096893310547, -2.7010371685028076, -2.5019774436950684, -2.302917957305908, -2.103858470916748, -1.9047987461090088, -1.705739140510559, -1.5066795349121094, -1.3076199293136597, -1.10856032371521, -0.9095007181167603, -0.7104411125183105, -0.5113815069198608, -0.31232190132141113, -0.11326229572296143, 0.08579730987548828, 0.284856915473938, 0.4839165210723877, 0.6829761266708374, 0.8820362091064453, 1.081095814704895, 1.2801554203033447, 1.4792150259017944, 1.6782746315002441, 1.8773342370986938, 2.0763938426971436, 2.275453567504883, 2.474513053894043, 2.673572540283203, 2.8726322650909424, 3.0716919898986816, 3.270751476287842, 3.469810962677002, 3.668870687484741, 3.8679304122924805, 4.066989898681641, 4.266049385070801, 4.465108871459961, 4.664168834686279, 4.8632283210754395, 5.0622878074646, 5.261347770690918, 5.460407257080078, 5.659466743469238, 5.858526229858398, 6.057585716247559, 6.256645679473877, 6.455705165863037, 6.654764652252197, 6.853824615478516, 7.052884101867676, 7.251943588256836]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 6.0, 5.0, 10.0, 9.0, 5.0, 9.0, 11.0, 23.0, 15.0, 20.0, 24.0, 37.0, 40.0, 23.0, 40.0, 46.0, 45.0, 34.0, 44.0, 45.0, 57.0, 41.0, 37.0, 41.0, 38.0, 42.0, 43.0, 23.0, 29.0, 23.0, 24.0, 24.0, 13.0, 17.0, 8.0, 6.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5036134719848633, -3.3969221115112305, -3.2902307510375977, -3.183539390563965, -3.076848030090332, -2.970156669616699, -2.8634653091430664, -2.7567739486694336, -2.650082588195801, -2.543391227722168, -2.436699867248535, -2.3300085067749023, -2.2233171463012695, -2.1166257858276367, -2.009934425354004, -1.9032431840896606, -1.7965519428253174, -1.6898605823516846, -1.5831692218780518, -1.476477861404419, -1.3697865009307861, -1.2630951404571533, -1.15640389919281, -1.0497125387191772, -0.9430211782455444, -0.8363298177719116, -0.7296384572982788, -0.6229471564292908, -0.516255795955658, -0.40956443548202515, -0.3028731346130371, -0.1961817741394043, -0.08949017524719238, 0.017201170325279236, 0.12389251589775085, 0.23058384656906128, 0.3372752070426941, 0.4439665675163269, 0.5506578683853149, 0.6573492288589478, 0.7640405893325806, 0.8707319498062134, 0.9774233102798462, 1.0841145515441895, 1.1908059120178223, 1.297497272491455, 1.404188632965088, 1.5108799934387207, 1.6175713539123535, 1.7242627143859863, 1.8309540748596191, 1.937645435333252, 2.0443367958068848, 2.1510281562805176, 2.2577195167541504, 2.364410877227783, 2.471102237701416, 2.577793598175049, 2.6844849586486816, 2.7911763191223145, 2.8978676795959473, 3.00455904006958, 3.111250400543213, 3.2179417610168457, 3.3246328830718994]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 10.0, 11.0, 15.0, 21.0, 25.0, 28.0, 52.0, 51.0, 84.0, 123.0, 147.0, 270.0, 450.0, 839.0, 1881.0, 4809.0, 15530.0, 94514.0, 3973517.0, 79618.0, 14015.0, 4456.0, 1707.0, 830.0, 433.0, 276.0, 160.0, 107.0, 78.0, 54.0, 36.0, 27.0, 24.0, 11.0, 15.0, 13.0, 3.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8291015625, -1.7572784423828125, -1.685455322265625, -1.6136322021484375, -1.54180908203125, -1.4699859619140625, -1.398162841796875, -1.3263397216796875, -1.2545166015625, -1.1826934814453125, -1.110870361328125, -1.0390472412109375, -0.96722412109375, -0.8954010009765625, -0.823577880859375, -0.7517547607421875, -0.679931640625, -0.6081085205078125, -0.536285400390625, -0.4644622802734375, -0.39263916015625, -0.3208160400390625, -0.248992919921875, -0.1771697998046875, -0.1053466796875, -0.0335235595703125, 0.038299560546875, 0.1101226806640625, 0.18194580078125, 0.2537689208984375, 0.325592041015625, 0.3974151611328125, 0.46923828125, 0.5410614013671875, 0.612884521484375, 0.6847076416015625, 0.75653076171875, 0.8283538818359375, 0.900177001953125, 0.9720001220703125, 1.0438232421875, 1.1156463623046875, 1.187469482421875, 1.2592926025390625, 1.33111572265625, 1.4029388427734375, 1.474761962890625, 1.5465850830078125, 1.618408203125, 1.6902313232421875, 1.762054443359375, 1.8338775634765625, 1.90570068359375, 1.9775238037109375, 2.049346923828125, 2.1211700439453125, 2.1929931640625, 2.2648162841796875, 2.336639404296875, 2.4084625244140625, 2.48028564453125, 2.5521087646484375, 2.623931884765625, 2.6957550048828125, 2.767578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 7.0, 14.0, 13.0, 24.0, 36.0, 61.0, 66.0, 61.0, 75.0, 108.0, 98.0, 87.0, 76.0, 74.0, 60.0, 41.0, 23.0, 23.0, 13.0, 6.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.279541015625, -0.27059173583984375, -0.2616424560546875, -0.25269317626953125, -0.243743896484375, -0.23479461669921875, -0.2258453369140625, -0.21689605712890625, -0.20794677734375, -0.19899749755859375, -0.1900482177734375, -0.18109893798828125, -0.172149658203125, -0.16320037841796875, -0.1542510986328125, -0.14530181884765625, -0.1363525390625, -0.12740325927734375, -0.1184539794921875, -0.10950469970703125, -0.100555419921875, -0.09160614013671875, -0.0826568603515625, -0.07370758056640625, -0.06475830078125, -0.05580902099609375, -0.0468597412109375, -0.03791046142578125, -0.028961181640625, -0.02001190185546875, -0.0110626220703125, -0.00211334228515625, 0.0068359375, 0.01578521728515625, 0.0247344970703125, 0.03368377685546875, 0.042633056640625, 0.05158233642578125, 0.0605316162109375, 0.06948089599609375, 0.07843017578125, 0.08737945556640625, 0.0963287353515625, 0.10527801513671875, 0.114227294921875, 0.12317657470703125, 0.1321258544921875, 0.14107513427734375, 0.1500244140625, 0.15897369384765625, 0.1679229736328125, 0.17687225341796875, 0.185821533203125, 0.19477081298828125, 0.2037200927734375, 0.21266937255859375, 0.22161865234375, 0.23056793212890625, 0.2395172119140625, 0.24846649169921875, 0.257415771484375, 0.26636505126953125, 0.2753143310546875, 0.28426361083984375, 0.293212890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 3.0, 6.0, 2.0, 12.0, 18.0, 8.0, 17.0, 23.0, 23.0, 30.0, 42.0, 56.0, 68.0, 154.0, 502.0, 3551.0, 55337.0, 4087101.0, 42987.0, 3246.0, 559.0, 152.0, 86.0, 79.0, 36.0, 26.0, 28.0, 27.0, 16.0, 14.0, 18.0, 13.0, 14.0, 8.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3828125, -5.24639892578125, -5.1099853515625, -4.97357177734375, -4.837158203125, -4.70074462890625, -4.5643310546875, -4.42791748046875, -4.29150390625, -4.15509033203125, -4.0186767578125, -3.88226318359375, -3.745849609375, -3.60943603515625, -3.4730224609375, -3.33660888671875, -3.2001953125, -3.06378173828125, -2.9273681640625, -2.79095458984375, -2.654541015625, -2.51812744140625, -2.3817138671875, -2.24530029296875, -2.10888671875, -1.97247314453125, -1.8360595703125, -1.69964599609375, -1.563232421875, -1.42681884765625, -1.2904052734375, -1.15399169921875, -1.017578125, -0.88116455078125, -0.7447509765625, -0.60833740234375, -0.471923828125, -0.33551025390625, -0.1990966796875, -0.06268310546875, 0.07373046875, 0.21014404296875, 0.3465576171875, 0.48297119140625, 0.619384765625, 0.75579833984375, 0.8922119140625, 1.02862548828125, 1.1650390625, 1.30145263671875, 1.4378662109375, 1.57427978515625, 1.710693359375, 1.84710693359375, 1.9835205078125, 2.11993408203125, 2.25634765625, 2.39276123046875, 2.5291748046875, 2.66558837890625, 2.802001953125, 2.93841552734375, 3.0748291015625, 3.21124267578125, 3.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 22.0, 29.0, 84.0, 206.0, 2243.0, 1127.0, 190.0, 73.0, 31.0, 26.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.30023956298828125, -0.2699127197265625, -0.23958587646484375, -0.209259033203125, -0.17893218994140625, -0.1486053466796875, -0.11827850341796875, -0.08795166015625, -0.05762481689453125, -0.0272979736328125, 0.00302886962890625, 0.033355712890625, 0.06368255615234375, 0.0940093994140625, 0.12433624267578125, 0.1546630859375, 0.18498992919921875, 0.2153167724609375, 0.24564361572265625, 0.275970458984375, 0.30629730224609375, 0.3366241455078125, 0.36695098876953125, 0.39727783203125, 0.42760467529296875, 0.4579315185546875, 0.48825836181640625, 0.518585205078125, 0.5489120483398438, 0.5792388916015625, 0.6095657348632812, 0.639892578125, 0.6702194213867188, 0.7005462646484375, 0.7308731079101562, 0.761199951171875, 0.7915267944335938, 0.8218536376953125, 0.8521804809570312, 0.88250732421875, 0.9128341674804688, 0.9431610107421875, 0.9734878540039062, 1.003814697265625, 1.0341415405273438, 1.0644683837890625, 1.0947952270507812, 1.1251220703125, 1.1554489135742188, 1.1857757568359375, 1.2161026000976562, 1.246429443359375, 1.2767562866210938, 1.3070831298828125, 1.3374099731445312, 1.36773681640625, 1.3980636596679688, 1.4283905029296875, 1.4587173461914062, 1.489044189453125, 1.5193710327148438, 1.5496978759765625, 1.5800247192382812, 1.6103515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 22.0, 71.0, 328.0, 339.0, 149.0, 42.0, 17.0, 10.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.684720993041992, -8.363730430603027, -8.042738914489746, -7.721748352050781, -7.400757789611816, -7.079766750335693, -6.75877571105957, -6.4377851486206055, -6.116794109344482, -5.795803070068359, -5.4748125076293945, -5.1538214683532715, -4.832830429077148, -4.511839866638184, -4.1908488273620605, -3.8698580265045166, -3.5488672256469727, -3.2278764247894287, -2.9068856239318848, -2.5858945846557617, -2.2649037837982178, -1.9439129829406738, -1.6229220628738403, -1.3019311428070068, -0.9809403419494629, -0.6599494814872742, -0.33895862102508545, -0.01796776056289673, 0.303023099899292, 0.6240139007568359, 0.9450048208236694, 1.265995740890503, 1.5869855880737305, 1.9079763889312744, 2.2289671897888184, 2.5499582290649414, 2.8709490299224854, 3.1919398307800293, 3.5129308700561523, 3.8339216709136963, 4.15491247177124, 4.475903511047363, 4.796894073486328, 5.117885112762451, 5.438876152038574, 5.759866714477539, 6.080857753753662, 6.401848793029785, 6.72283935546875, 7.043830394744873, 7.364820957183838, 7.685811996459961, 8.006802558898926, 8.32779312133789, 8.648784637451172, 8.969775199890137, 9.290765762329102, 9.611756324768066, 9.932747840881348, 10.253738403320312, 10.574728965759277, 10.895719528198242, 11.216711044311523, 11.537701606750488, 11.85869312286377]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 11.0, 7.0, 11.0, 15.0, 43.0, 37.0, 52.0, 65.0, 69.0, 84.0, 108.0, 80.0, 71.0, 73.0, 60.0, 69.0, 41.0, 30.0, 23.0, 20.0, 15.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737337589263916, -3.6351592540740967, -3.5329811573028564, -3.430802822113037, -3.3286244869232178, -3.2264461517333984, -3.124268054962158, -3.022089719772339, -2.9199113845825195, -2.8177330493927, -2.71555495262146, -2.6133766174316406, -2.5111982822418213, -2.409019947052002, -2.3068418502807617, -2.2046635150909424, -2.102485418319702, -2.000307083129883, -1.898128867149353, -1.7959506511688232, -1.693772315979004, -1.5915940999984741, -1.4894158840179443, -1.387237548828125, -1.2850593328475952, -1.1828811168670654, -1.080702781677246, -0.9785245656967163, -0.8763462901115417, -0.7741680145263672, -0.6719897985458374, -0.5698115229606628, -0.4676334857940674, -0.3654552102088928, -0.26327696442604065, -0.16109871864318848, -0.058920443058013916, 0.043257832527160645, 0.14543604850769043, 0.247614324092865, 0.34979259967803955, 0.4519708752632141, 0.5541491508483887, 0.6563273668289185, 0.758505642414093, 0.8606839179992676, 0.9628621339797974, 1.0650403499603271, 1.1672186851501465, 1.2693969011306763, 1.3715752363204956, 1.4737534523010254, 1.5759317874908447, 1.6781100034713745, 1.7802882194519043, 1.8824665546417236, 1.9846447706222534, 2.086822986602783, 2.1890013217926025, 2.291179656982422, 2.393357753753662, 2.4955360889434814, 2.597714424133301, 2.699892520904541, 2.8020708560943604]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 15.0, 21.0, 29.0, 48.0, 51.0, 58.0, 99.0, 171.0, 232.0, 353.0, 579.0, 1068.0, 2067.0, 4396.0, 10738.0, 31640.0, 128881.0, 543421.0, 245692.0, 51229.0, 15640.0, 6056.0, 2722.0, 1338.0, 753.0, 425.0, 260.0, 158.0, 113.0, 91.0, 55.0, 46.0, 28.0, 19.0, 8.0, 12.0, 7.0, 9.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.236663818359375, -1.19500732421875, -1.153350830078125, -1.1116943359375, -1.070037841796875, -1.02838134765625, -0.986724853515625, -0.945068359375, -0.903411865234375, -0.86175537109375, -0.820098876953125, -0.7784423828125, -0.736785888671875, -0.69512939453125, -0.653472900390625, -0.61181640625, -0.570159912109375, -0.52850341796875, -0.486846923828125, -0.4451904296875, -0.403533935546875, -0.36187744140625, -0.320220947265625, -0.278564453125, -0.236907958984375, -0.19525146484375, -0.153594970703125, -0.1119384765625, -0.070281982421875, -0.02862548828125, 0.013031005859375, 0.0546875, 0.096343994140625, 0.13800048828125, 0.179656982421875, 0.2213134765625, 0.262969970703125, 0.30462646484375, 0.346282958984375, 0.387939453125, 0.429595947265625, 0.47125244140625, 0.512908935546875, 0.5545654296875, 0.596221923828125, 0.63787841796875, 0.679534912109375, 0.72119140625, 0.762847900390625, 0.80450439453125, 0.846160888671875, 0.8878173828125, 0.929473876953125, 0.97113037109375, 1.012786865234375, 1.054443359375, 1.096099853515625, 1.13775634765625, 1.179412841796875, 1.2210693359375, 1.262725830078125, 1.30438232421875, 1.346038818359375, 1.3876953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 18.0, 15.0, 22.0, 23.0, 45.0, 55.0, 60.0, 82.0, 89.0, 72.0, 70.0, 76.0, 73.0, 62.0, 49.0, 46.0, 34.0, 22.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29833984375, -0.2893104553222656, -0.28028106689453125, -0.2712516784667969, -0.2622222900390625, -0.2531929016113281, -0.24416351318359375, -0.23513412475585938, -0.226104736328125, -0.21707534790039062, -0.20804595947265625, -0.19901657104492188, -0.1899871826171875, -0.18095779418945312, -0.17192840576171875, -0.16289901733398438, -0.15386962890625, -0.14484024047851562, -0.13581085205078125, -0.12678146362304688, -0.1177520751953125, -0.10872268676757812, -0.09969329833984375, -0.09066390991210938, -0.081634521484375, -0.07260513305664062, -0.06357574462890625, -0.054546356201171875, -0.0455169677734375, -0.036487579345703125, -0.02745819091796875, -0.018428802490234375, -0.0093994140625, -0.000370025634765625, 0.00865936279296875, 0.017688751220703125, 0.0267181396484375, 0.035747528076171875, 0.04477691650390625, 0.053806304931640625, 0.062835693359375, 0.07186508178710938, 0.08089447021484375, 0.08992385864257812, 0.0989532470703125, 0.10798263549804688, 0.11701202392578125, 0.12604141235351562, 0.13507080078125, 0.14410018920898438, 0.15312957763671875, 0.16215896606445312, 0.1711883544921875, 0.18021774291992188, 0.18924713134765625, 0.19827651977539062, 0.207305908203125, 0.21633529663085938, 0.22536468505859375, 0.23439407348632812, 0.2434234619140625, 0.2524528503417969, 0.26148223876953125, 0.2705116271972656, 0.279541015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 12.0, 23.0, 23.0, 21.0, 31.0, 39.0, 84.0, 110.0, 190.0, 291.0, 436.0, 878.0, 1561.0, 3219.0, 6466.0, 14477.0, 35249.0, 99908.0, 324528.0, 371646.0, 117406.0, 40691.0, 16292.0, 7258.0, 3509.0, 1879.0, 990.0, 493.0, 318.0, 173.0, 107.0, 77.0, 53.0, 38.0, 26.0, 16.0, 9.0, 7.0, 1.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.73583984375, -0.712158203125, -0.6884765625, -0.664794921875, -0.64111328125, -0.617431640625, -0.59375, -0.570068359375, -0.54638671875, -0.522705078125, -0.4990234375, -0.475341796875, -0.45166015625, -0.427978515625, -0.404296875, -0.380615234375, -0.35693359375, -0.333251953125, -0.3095703125, -0.285888671875, -0.26220703125, -0.238525390625, -0.21484375, -0.191162109375, -0.16748046875, -0.143798828125, -0.1201171875, -0.096435546875, -0.07275390625, -0.049072265625, -0.025390625, -0.001708984375, 0.02197265625, 0.045654296875, 0.0693359375, 0.093017578125, 0.11669921875, 0.140380859375, 0.1640625, 0.187744140625, 0.21142578125, 0.235107421875, 0.2587890625, 0.282470703125, 0.30615234375, 0.329833984375, 0.353515625, 0.377197265625, 0.40087890625, 0.424560546875, 0.4482421875, 0.471923828125, 0.49560546875, 0.519287109375, 0.54296875, 0.566650390625, 0.59033203125, 0.614013671875, 0.6376953125, 0.661376953125, 0.68505859375, 0.708740234375, 0.732421875, 0.756103515625, 0.77978515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 8.0, 8.0, 14.0, 15.0, 17.0, 22.0, 20.0, 26.0, 28.0, 41.0, 45.0, 36.0, 42.0, 47.0, 38.0, 39.0, 41.0, 47.0, 40.0, 61.0, 41.0, 32.0, 35.0, 44.0, 29.0, 31.0, 19.0, 19.0, 14.0, 11.0, 17.0, 9.0, 5.0, 9.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70703125, -0.6821975708007812, -0.6573638916015625, -0.6325302124023438, -0.607696533203125, -0.5828628540039062, -0.5580291748046875, -0.5331954956054688, -0.50836181640625, -0.48352813720703125, -0.4586944580078125, -0.43386077880859375, -0.409027099609375, -0.38419342041015625, -0.3593597412109375, -0.33452606201171875, -0.3096923828125, -0.28485870361328125, -0.2600250244140625, -0.23519134521484375, -0.210357666015625, -0.18552398681640625, -0.1606903076171875, -0.13585662841796875, -0.11102294921875, -0.08618927001953125, -0.0613555908203125, -0.03652191162109375, -0.011688232421875, 0.01314544677734375, 0.0379791259765625, 0.06281280517578125, 0.087646484375, 0.11248016357421875, 0.1373138427734375, 0.16214752197265625, 0.186981201171875, 0.21181488037109375, 0.2366485595703125, 0.26148223876953125, 0.28631591796875, 0.31114959716796875, 0.3359832763671875, 0.36081695556640625, 0.385650634765625, 0.41048431396484375, 0.4353179931640625, 0.46015167236328125, 0.4849853515625, 0.5098190307617188, 0.5346527099609375, 0.5594863891601562, 0.584320068359375, 0.6091537475585938, 0.6339874267578125, 0.6588211059570312, 0.68365478515625, 0.7084884643554688, 0.7333221435546875, 0.7581558227539062, 0.782989501953125, 0.8078231811523438, 0.8326568603515625, 0.8574905395507812, 0.88232421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 21.0, 21.0, 34.0, 60.0, 72.0, 139.0, 194.0, 318.0, 617.0, 1369.0, 2914.0, 7404.0, 24592.0, 122049.0, 602637.0, 228915.0, 38926.0, 10801.0, 3850.0, 1685.0, 819.0, 440.0, 232.0, 135.0, 97.0, 50.0, 44.0, 31.0, 17.0, 12.0, 9.0, 11.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.607421875, -0.5903892517089844, -0.5733566284179688, -0.5563240051269531, -0.5392913818359375, -0.5222587585449219, -0.5052261352539062, -0.4881935119628906, -0.471160888671875, -0.4541282653808594, -0.43709564208984375, -0.4200630187988281, -0.4030303955078125, -0.3859977722167969, -0.36896514892578125, -0.3519325256347656, -0.33489990234375, -0.3178672790527344, -0.30083465576171875, -0.2838020324707031, -0.2667694091796875, -0.24973678588867188, -0.23270416259765625, -0.21567153930664062, -0.198638916015625, -0.18160629272460938, -0.16457366943359375, -0.14754104614257812, -0.1305084228515625, -0.11347579956054688, -0.09644317626953125, -0.07941055297851562, -0.0623779296875, -0.045345306396484375, -0.02831268310546875, -0.011280059814453125, 0.0057525634765625, 0.022785186767578125, 0.03981781005859375, 0.056850433349609375, 0.073883056640625, 0.09091567993164062, 0.10794830322265625, 0.12498092651367188, 0.1420135498046875, 0.15904617309570312, 0.17607879638671875, 0.19311141967773438, 0.21014404296875, 0.22717666625976562, 0.24420928955078125, 0.2612419128417969, 0.2782745361328125, 0.2953071594238281, 0.31233978271484375, 0.3293724060058594, 0.346405029296875, 0.3634376525878906, 0.38047027587890625, 0.3975028991699219, 0.4145355224609375, 0.4315681457519531, 0.44860076904296875, 0.4656333923339844, 0.482666015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 8.0, 12.0, 20.0, 21.0, 27.0, 61.0, 73.0, 99.0, 117.0, 142.0, 111.0, 102.0, 49.0, 40.0, 29.0, 15.0, 13.0, 15.0, 7.0, 3.0, 2.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012373924255371094, -0.00012001954019069672, -0.0001162998378276825, -0.00011258013546466827, -0.00010886043310165405, -0.00010514073073863983, -0.00010142102837562561, -9.770132601261139e-05, -9.398162364959717e-05, -9.026192128658295e-05, -8.654221892356873e-05, -8.28225165605545e-05, -7.910281419754028e-05, -7.538311183452606e-05, -7.166340947151184e-05, -6.794370710849762e-05, -6.42240047454834e-05, -6.050430238246918e-05, -5.6784600019454956e-05, -5.3064897656440735e-05, -4.9345195293426514e-05, -4.562549293041229e-05, -4.190579056739807e-05, -3.818608820438385e-05, -3.446638584136963e-05, -3.074668347835541e-05, -2.7026981115341187e-05, -2.3307278752326965e-05, -1.9587576389312744e-05, -1.5867874026298523e-05, -1.2148171663284302e-05, -8.42846930027008e-06, -4.708766937255859e-06, -9.890645742416382e-07, 2.730637788772583e-06, 6.450340151786804e-06, 1.0170042514801025e-05, 1.3889744877815247e-05, 1.7609447240829468e-05, 2.132914960384369e-05, 2.504885196685791e-05, 2.876855432987213e-05, 3.248825669288635e-05, 3.6207959055900574e-05, 3.9927661418914795e-05, 4.3647363781929016e-05, 4.736706614494324e-05, 5.108676850795746e-05, 5.480647087097168e-05, 5.85261732339859e-05, 6.224587559700012e-05, 6.596557796001434e-05, 6.968528032302856e-05, 7.340498268604279e-05, 7.712468504905701e-05, 8.084438741207123e-05, 8.456408977508545e-05, 8.828379213809967e-05, 9.200349450111389e-05, 9.572319686412811e-05, 9.944289922714233e-05, 0.00010316260159015656, 0.00010688230395317078, 0.000110602006316185, 0.00011432170867919922]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 11.0, 21.0, 17.0, 30.0, 37.0, 57.0, 86.0, 113.0, 176.0, 299.0, 538.0, 864.0, 1514.0, 2984.0, 6654.0, 16576.0, 51159.0, 246474.0, 545048.0, 123198.0, 31469.0, 11220.0, 4742.0, 2288.0, 1198.0, 644.0, 367.0, 251.0, 139.0, 101.0, 79.0, 50.0, 30.0, 27.0, 20.0, 10.0, 19.0, 8.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55615234375, -0.5383834838867188, -0.5206146240234375, -0.5028457641601562, -0.485076904296875, -0.46730804443359375, -0.4495391845703125, -0.43177032470703125, -0.41400146484375, -0.39623260498046875, -0.3784637451171875, -0.36069488525390625, -0.342926025390625, -0.32515716552734375, -0.3073883056640625, -0.28961944580078125, -0.2718505859375, -0.25408172607421875, -0.2363128662109375, -0.21854400634765625, -0.200775146484375, -0.18300628662109375, -0.1652374267578125, -0.14746856689453125, -0.12969970703125, -0.11193084716796875, -0.0941619873046875, -0.07639312744140625, -0.058624267578125, -0.04085540771484375, -0.0230865478515625, -0.00531768798828125, 0.012451171875, 0.03022003173828125, 0.0479888916015625, 0.06575775146484375, 0.083526611328125, 0.10129547119140625, 0.1190643310546875, 0.13683319091796875, 0.15460205078125, 0.17237091064453125, 0.1901397705078125, 0.20790863037109375, 0.225677490234375, 0.24344635009765625, 0.2612152099609375, 0.27898406982421875, 0.2967529296875, 0.31452178955078125, 0.3322906494140625, 0.35005950927734375, 0.367828369140625, 0.38559722900390625, 0.4033660888671875, 0.42113494873046875, 0.43890380859375, 0.45667266845703125, 0.4744415283203125, 0.49221038818359375, 0.509979248046875, 0.5277481079101562, 0.5455169677734375, 0.5632858276367188, 0.5810546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 0.0, 5.0, 9.0, 7.0, 4.0, 7.0, 7.0, 9.0, 19.0, 18.0, 31.0, 28.0, 37.0, 57.0, 57.0, 76.0, 100.0, 70.0, 75.0, 74.0, 48.0, 55.0, 42.0, 34.0, 26.0, 21.0, 20.0, 10.0, 11.0, 12.0, 5.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.38720703125, -0.37526702880859375, -0.3633270263671875, -0.35138702392578125, -0.339447021484375, -0.32750701904296875, -0.3155670166015625, -0.30362701416015625, -0.29168701171875, -0.27974700927734375, -0.2678070068359375, -0.25586700439453125, -0.243927001953125, -0.23198699951171875, -0.2200469970703125, -0.20810699462890625, -0.1961669921875, -0.18422698974609375, -0.1722869873046875, -0.16034698486328125, -0.148406982421875, -0.13646697998046875, -0.1245269775390625, -0.11258697509765625, -0.10064697265625, -0.08870697021484375, -0.0767669677734375, -0.06482696533203125, -0.052886962890625, -0.04094696044921875, -0.0290069580078125, -0.01706695556640625, -0.005126953125, 0.00681304931640625, 0.0187530517578125, 0.03069305419921875, 0.042633056640625, 0.05457305908203125, 0.0665130615234375, 0.07845306396484375, 0.09039306640625, 0.10233306884765625, 0.1142730712890625, 0.12621307373046875, 0.138153076171875, 0.15009307861328125, 0.1620330810546875, 0.17397308349609375, 0.1859130859375, 0.19785308837890625, 0.2097930908203125, 0.22173309326171875, 0.233673095703125, 0.24561309814453125, 0.2575531005859375, 0.26949310302734375, 0.28143310546875, 0.29337310791015625, 0.3053131103515625, 0.31725311279296875, 0.329193115234375, 0.34113311767578125, 0.3530731201171875, 0.36501312255859375, 0.376953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 8.0, 13.0, 32.0, 73.0, 131.0, 177.0, 209.0, 149.0, 87.0, 41.0, 30.0, 18.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.909470558166504, -7.619542121887207, -7.32961368560791, -7.039685249328613, -6.749756813049316, -6.4598283767700195, -6.169900417327881, -5.879971981048584, -5.590043544769287, -5.30011510848999, -5.010186672210693, -4.7202582359313965, -4.430330276489258, -4.140401840209961, -3.850473403930664, -3.560544967651367, -3.2706165313720703, -2.9806880950927734, -2.6907596588134766, -2.400831460952759, -2.110903024673462, -1.820974588394165, -1.5310462713241577, -1.2411179542541504, -0.9511895179748535, -0.6612611413002014, -0.3713327646255493, -0.08140438795089722, 0.20852398872375488, 0.49845242500305176, 0.7883807420730591, 1.0783090591430664, 1.3682374954223633, 1.6581659317016602, 1.9480942487716675, 2.238022565841675, 2.5279510021209717, 2.8178794384002686, 3.1078076362609863, 3.397736072540283, 3.68766450881958, 3.977592945098877, 4.267521381378174, 4.557449817657471, 4.847377777099609, 5.137306213378906, 5.427234649658203, 5.7171630859375, 6.007091522216797, 6.297019958496094, 6.586948394775391, 6.8768768310546875, 7.166805267333984, 7.456733703613281, 7.74666166305542, 8.036590576171875, 8.326519012451172, 8.616447448730469, 8.906375885009766, 9.196304321289062, 9.48623275756836, 9.776161193847656, 10.066089630126953, 10.35601806640625, 10.64594554901123]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 7.0, 1.0, 8.0, 9.0, 9.0, 12.0, 14.0, 18.0, 16.0, 30.0, 20.0, 29.0, 38.0, 39.0, 32.0, 44.0, 50.0, 49.0, 54.0, 51.0, 35.0, 44.0, 47.0, 37.0, 43.0, 36.0, 39.0, 30.0, 32.0, 18.0, 22.0, 14.0, 15.0, 17.0, 8.0, 13.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.7762956619262695, -4.626414775848389, -4.47653341293335, -4.326652526855469, -4.176771640777588, -4.026890754699707, -3.877009391784668, -3.727128505706787, -3.577247381210327, -3.427366256713867, -3.2774853706359863, -3.1276042461395264, -2.9777231216430664, -2.8278422355651855, -2.6779611110687256, -2.5280799865722656, -2.3781991004943848, -2.228317975997925, -2.078437089920044, -1.928555965423584, -1.7786749601364136, -1.6287939548492432, -1.4789128303527832, -1.3290318250656128, -1.1791508197784424, -1.029269814491272, -0.8793887495994568, -0.7295076847076416, -0.5796266794204712, -0.4297456741333008, -0.2798646092414856, -0.1299835443496704, 0.019897937774658203, 0.169778972864151, 0.3196600079536438, 0.4695410430431366, 0.6194220781326294, 0.7693030834197998, 0.919184148311615, 1.0690652132034302, 1.2189462184906006, 1.368827223777771, 1.5187082290649414, 1.6685893535614014, 1.8184703588485718, 1.9683513641357422, 2.118232488632202, 2.268113613128662, 2.417994499206543, 2.567875623703003, 2.717756509780884, 2.8676376342773438, 3.0175185203552246, 3.1673996448516846, 3.3172807693481445, 3.4671616554260254, 3.6170427799224854, 3.7669239044189453, 3.916804790496826, 4.066685676574707, 4.216567039489746, 4.366447925567627, 4.516328811645508, 4.666210174560547, 4.816091060638428]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 13.0, 29.0, 31.0, 41.0, 54.0, 87.0, 124.0, 254.0, 501.0, 1154.0, 3387.0, 14885.0, 369971.0, 3773888.0, 22053.0, 4730.0, 1603.0, 686.0, 325.0, 171.0, 100.0, 59.0, 36.0, 27.0, 16.0, 5.0, 10.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84765625, -3.7410888671875, -3.634521484375, -3.5279541015625, -3.42138671875, -3.3148193359375, -3.208251953125, -3.1016845703125, -2.9951171875, -2.8885498046875, -2.781982421875, -2.6754150390625, -2.56884765625, -2.4622802734375, -2.355712890625, -2.2491455078125, -2.142578125, -2.0360107421875, -1.929443359375, -1.8228759765625, -1.71630859375, -1.6097412109375, -1.503173828125, -1.3966064453125, -1.2900390625, -1.1834716796875, -1.076904296875, -0.9703369140625, -0.86376953125, -0.7572021484375, -0.650634765625, -0.5440673828125, -0.4375, -0.3309326171875, -0.224365234375, -0.1177978515625, -0.01123046875, 0.0953369140625, 0.201904296875, 0.3084716796875, 0.4150390625, 0.5216064453125, 0.628173828125, 0.7347412109375, 0.84130859375, 0.9478759765625, 1.054443359375, 1.1610107421875, 1.267578125, 1.3741455078125, 1.480712890625, 1.5872802734375, 1.69384765625, 1.8004150390625, 1.906982421875, 2.0135498046875, 2.1201171875, 2.2266845703125, 2.333251953125, 2.4398193359375, 2.54638671875, 2.6529541015625, 2.759521484375, 2.8660888671875, 2.97265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 12.0, 12.0, 23.0, 48.0, 52.0, 66.0, 76.0, 106.0, 116.0, 103.0, 91.0, 70.0, 62.0, 64.0, 36.0, 21.0, 16.0, 5.0, 10.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.529296875, -0.5163497924804688, -0.5034027099609375, -0.49045562744140625, -0.477508544921875, -0.46456146240234375, -0.4516143798828125, -0.43866729736328125, -0.42572021484375, -0.41277313232421875, -0.3998260498046875, -0.38687896728515625, -0.373931884765625, -0.36098480224609375, -0.3480377197265625, -0.33509063720703125, -0.3221435546875, -0.30919647216796875, -0.2962493896484375, -0.28330230712890625, -0.270355224609375, -0.25740814208984375, -0.2444610595703125, -0.23151397705078125, -0.21856689453125, -0.20561981201171875, -0.1926727294921875, -0.17972564697265625, -0.166778564453125, -0.15383148193359375, -0.1408843994140625, -0.12793731689453125, -0.114990234375, -0.10204315185546875, -0.0890960693359375, -0.07614898681640625, -0.063201904296875, -0.05025482177734375, -0.0373077392578125, -0.02436065673828125, -0.01141357421875, 0.00153350830078125, 0.0144805908203125, 0.02742767333984375, 0.040374755859375, 0.05332183837890625, 0.0662689208984375, 0.07921600341796875, 0.0921630859375, 0.10511016845703125, 0.1180572509765625, 0.13100433349609375, 0.143951416015625, 0.15689849853515625, 0.1698455810546875, 0.18279266357421875, 0.19573974609375, 0.20868682861328125, 0.2216339111328125, 0.23458099365234375, 0.247528076171875, 0.26047515869140625, 0.2734222412109375, 0.28636932373046875, 0.29931640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 12.0, 8.0, 14.0, 19.0, 27.0, 55.0, 78.0, 115.0, 162.0, 281.0, 498.0, 843.0, 1574.0, 2971.0, 6171.0, 13978.0, 38797.0, 182271.0, 3564695.0, 301398.0, 49155.0, 16896.0, 7132.0, 3258.0, 1669.0, 887.0, 541.0, 265.0, 170.0, 107.0, 65.0, 42.0, 36.0, 30.0, 18.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1822967529296875, -1.140960693359375, -1.0996246337890625, -1.05828857421875, -1.0169525146484375, -0.975616455078125, -0.9342803955078125, -0.8929443359375, -0.8516082763671875, -0.810272216796875, -0.7689361572265625, -0.72760009765625, -0.6862640380859375, -0.644927978515625, -0.6035919189453125, -0.562255859375, -0.5209197998046875, -0.479583740234375, -0.4382476806640625, -0.39691162109375, -0.3555755615234375, -0.314239501953125, -0.2729034423828125, -0.2315673828125, -0.1902313232421875, -0.148895263671875, -0.1075592041015625, -0.06622314453125, -0.0248870849609375, 0.016448974609375, 0.0577850341796875, 0.09912109375, 0.1404571533203125, 0.181793212890625, 0.2231292724609375, 0.26446533203125, 0.3058013916015625, 0.347137451171875, 0.3884735107421875, 0.4298095703125, 0.4711456298828125, 0.512481689453125, 0.5538177490234375, 0.59515380859375, 0.6364898681640625, 0.677825927734375, 0.7191619873046875, 0.760498046875, 0.8018341064453125, 0.843170166015625, 0.8845062255859375, 0.92584228515625, 0.9671783447265625, 1.008514404296875, 1.0498504638671875, 1.0911865234375, 1.1325225830078125, 1.173858642578125, 1.2151947021484375, 1.25653076171875, 1.2978668212890625, 1.339202880859375, 1.3805389404296875, 1.421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 12.0, 12.0, 11.0, 10.0, 25.0, 50.0, 50.0, 75.0, 141.0, 341.0, 1360.0, 1309.0, 280.0, 138.0, 81.0, 42.0, 25.0, 24.0, 19.0, 13.0, 6.0, 6.0, 7.0, 1.0, 7.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.79443359375, -0.7755126953125, -0.756591796875, -0.7376708984375, -0.71875, -0.6998291015625, -0.680908203125, -0.6619873046875, -0.64306640625, -0.6241455078125, -0.605224609375, -0.5863037109375, -0.5673828125, -0.5484619140625, -0.529541015625, -0.5106201171875, -0.49169921875, -0.4727783203125, -0.453857421875, -0.4349365234375, -0.416015625, -0.3970947265625, -0.378173828125, -0.3592529296875, -0.34033203125, -0.3214111328125, -0.302490234375, -0.2835693359375, -0.2646484375, -0.2457275390625, -0.226806640625, -0.2078857421875, -0.18896484375, -0.1700439453125, -0.151123046875, -0.1322021484375, -0.11328125, -0.0943603515625, -0.075439453125, -0.0565185546875, -0.03759765625, -0.0186767578125, 0.000244140625, 0.0191650390625, 0.0380859375, 0.0570068359375, 0.075927734375, 0.0948486328125, 0.11376953125, 0.1326904296875, 0.151611328125, 0.1705322265625, 0.189453125, 0.2083740234375, 0.227294921875, 0.2462158203125, 0.26513671875, 0.2840576171875, 0.302978515625, 0.3218994140625, 0.3408203125, 0.3597412109375, 0.378662109375, 0.3975830078125, 0.41650390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 17.0, 15.0, 32.0, 54.0, 92.0, 129.0, 190.0, 195.0, 129.0, 71.0, 23.0, 18.0, 10.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.834409713745117, -6.671724319458008, -6.509038925170898, -6.346353530883789, -6.18366813659668, -6.02098274230957, -5.858297348022461, -5.695611953735352, -5.532926559448242, -5.370241165161133, -5.207555770874023, -5.044870376586914, -4.882184982299805, -4.719499588012695, -4.556814193725586, -4.394128799438477, -4.231443405151367, -4.068758010864258, -3.9060726165771484, -3.743387222290039, -3.5807018280029297, -3.4180164337158203, -3.255331039428711, -3.0926456451416016, -2.9299607276916504, -2.767275333404541, -2.6045899391174316, -2.4419045448303223, -2.279219150543213, -2.1165337562561035, -1.9538484811782837, -1.7911630868911743, -1.6284778118133545, -1.4657924175262451, -1.3031070232391357, -1.1404216289520264, -0.9777362942695618, -0.8150508999824524, -0.6523655652999878, -0.4896801710128784, -0.32699477672576904, -0.16430939733982086, -0.0016240179538726807, 0.1610613465309143, 0.3237467408180237, 0.48643213510513306, 0.6491174697875977, 0.811802864074707, 0.9744882583618164, 1.1371736526489258, 1.2998590469360352, 1.4625444412231445, 1.625229835510254, 1.7879152297973633, 1.950600504875183, 2.113286018371582, 2.2759714126586914, 2.438656806945801, 2.60134220123291, 2.7640275955200195, 2.926712989807129, 3.0893983840942383, 3.2520837783813477, 3.414769172668457, 3.5774543285369873]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 11.0, 18.0, 10.0, 19.0, 21.0, 21.0, 20.0, 25.0, 29.0, 35.0, 37.0, 42.0, 41.0, 34.0, 37.0, 35.0, 40.0, 55.0, 34.0, 48.0, 43.0, 38.0, 35.0, 29.0, 32.0, 29.0, 17.0, 21.0, 25.0, 14.0, 12.0, 17.0, 10.0, 6.0, 8.0, 10.0, 6.0, 2.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6138734817504883, -1.5613279342651367, -1.5087823867797852, -1.4562368392944336, -1.403691291809082, -1.3511457443237305, -1.2986003160476685, -1.246054768562317, -1.1935092210769653, -1.1409636735916138, -1.0884181261062622, -1.0358725786209106, -0.9833270907402039, -0.9307815432548523, -0.8782360553741455, -0.825690507888794, -0.7731449604034424, -0.7205994129180908, -0.6680538654327393, -0.6155083775520325, -0.5629628300666809, -0.5104172825813293, -0.45787176489830017, -0.405326247215271, -0.35278069972991943, -0.30023515224456787, -0.2476896345615387, -0.19514410197734833, -0.14259856939315796, -0.0900530219078064, -0.03750750422477722, 0.015038013458251953, 0.06758356094360352, 0.12012909352779388, 0.17267462611198425, 0.22522015869617462, 0.277765691280365, 0.33031123876571655, 0.3828567564487457, 0.4354022741317749, 0.48794782161712646, 0.540493369102478, 0.5930389165878296, 0.6455844044685364, 0.6981299519538879, 0.7506754994392395, 0.8032209873199463, 0.8557665348052979, 0.9083120822906494, 0.960857629776001, 1.0134031772613525, 1.065948724746704, 1.1184942722320557, 1.1710398197174072, 1.2235852479934692, 1.2761307954788208, 1.3286763429641724, 1.381221890449524, 1.4337674379348755, 1.486312985420227, 1.538858413696289, 1.5914039611816406, 1.6439495086669922, 1.6964950561523438, 1.7490406036376953]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 14.0, 13.0, 14.0, 18.0, 24.0, 36.0, 60.0, 70.0, 114.0, 178.0, 303.0, 501.0, 1133.0, 2586.0, 6623.0, 22238.0, 106828.0, 651131.0, 206376.0, 34316.0, 9505.0, 3330.0, 1439.0, 659.0, 412.0, 200.0, 146.0, 74.0, 61.0, 39.0, 27.0, 27.0, 9.0, 8.0, 7.0, 5.0, 1.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3720703125, -1.3224639892578125, -1.272857666015625, -1.2232513427734375, -1.17364501953125, -1.1240386962890625, -1.074432373046875, -1.0248260498046875, -0.9752197265625, -0.9256134033203125, -0.876007080078125, -0.8264007568359375, -0.77679443359375, -0.7271881103515625, -0.677581787109375, -0.6279754638671875, -0.578369140625, -0.5287628173828125, -0.479156494140625, -0.4295501708984375, -0.37994384765625, -0.3303375244140625, -0.280731201171875, -0.2311248779296875, -0.1815185546875, -0.1319122314453125, -0.082305908203125, -0.0326995849609375, 0.01690673828125, 0.0665130615234375, 0.116119384765625, 0.1657257080078125, 0.21533203125, 0.2649383544921875, 0.314544677734375, 0.3641510009765625, 0.41375732421875, 0.4633636474609375, 0.512969970703125, 0.5625762939453125, 0.6121826171875, 0.6617889404296875, 0.711395263671875, 0.7610015869140625, 0.81060791015625, 0.8602142333984375, 0.909820556640625, 0.9594268798828125, 1.009033203125, 1.0586395263671875, 1.108245849609375, 1.1578521728515625, 1.20745849609375, 1.2570648193359375, 1.306671142578125, 1.3562774658203125, 1.4058837890625, 1.4554901123046875, 1.505096435546875, 1.5547027587890625, 1.60430908203125, 1.6539154052734375, 1.703521728515625, 1.7531280517578125, 1.802734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 13.0, 22.0, 42.0, 36.0, 55.0, 68.0, 80.0, 102.0, 112.0, 102.0, 86.0, 73.0, 60.0, 52.0, 28.0, 16.0, 12.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.53173828125, -0.5192337036132812, -0.5067291259765625, -0.49422454833984375, -0.481719970703125, -0.46921539306640625, -0.4567108154296875, -0.44420623779296875, -0.43170166015625, -0.41919708251953125, -0.4066925048828125, -0.39418792724609375, -0.381683349609375, -0.36917877197265625, -0.3566741943359375, -0.34416961669921875, -0.3316650390625, -0.31916046142578125, -0.3066558837890625, -0.29415130615234375, -0.281646728515625, -0.26914215087890625, -0.2566375732421875, -0.24413299560546875, -0.23162841796875, -0.21912384033203125, -0.2066192626953125, -0.19411468505859375, -0.181610107421875, -0.16910552978515625, -0.1566009521484375, -0.14409637451171875, -0.131591796875, -0.11908721923828125, -0.1065826416015625, -0.09407806396484375, -0.081573486328125, -0.06906890869140625, -0.0565643310546875, -0.04405975341796875, -0.03155517578125, -0.01905059814453125, -0.0065460205078125, 0.00595855712890625, 0.018463134765625, 0.03096771240234375, 0.0434722900390625, 0.05597686767578125, 0.0684814453125, 0.08098602294921875, 0.0934906005859375, 0.10599517822265625, 0.118499755859375, 0.13100433349609375, 0.1435089111328125, 0.15601348876953125, 0.16851806640625, 0.18102264404296875, 0.1935272216796875, 0.20603179931640625, 0.218536376953125, 0.23104095458984375, 0.2435455322265625, 0.25605010986328125, 0.2685546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 19.0, 19.0, 26.0, 29.0, 46.0, 85.0, 109.0, 136.0, 275.0, 368.0, 644.0, 997.0, 1795.0, 3251.0, 6266.0, 12715.0, 28106.0, 69883.0, 211245.0, 442868.0, 165246.0, 57067.0, 23793.0, 11017.0, 5579.0, 2887.0, 1569.0, 880.0, 546.0, 382.0, 230.0, 157.0, 91.0, 55.0, 44.0, 30.0, 18.0, 12.0, 14.0, 12.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66845703125, -0.6464691162109375, -0.624481201171875, -0.6024932861328125, -0.58050537109375, -0.5585174560546875, -0.536529541015625, -0.5145416259765625, -0.4925537109375, -0.4705657958984375, -0.448577880859375, -0.4265899658203125, -0.40460205078125, -0.3826141357421875, -0.360626220703125, -0.3386383056640625, -0.316650390625, -0.2946624755859375, -0.272674560546875, -0.2506866455078125, -0.22869873046875, -0.2067108154296875, -0.184722900390625, -0.1627349853515625, -0.1407470703125, -0.1187591552734375, -0.096771240234375, -0.0747833251953125, -0.05279541015625, -0.0308074951171875, -0.008819580078125, 0.0131683349609375, 0.03515625, 0.0571441650390625, 0.079132080078125, 0.1011199951171875, 0.12310791015625, 0.1450958251953125, 0.167083740234375, 0.1890716552734375, 0.2110595703125, 0.2330474853515625, 0.255035400390625, 0.2770233154296875, 0.29901123046875, 0.3209991455078125, 0.342987060546875, 0.3649749755859375, 0.386962890625, 0.4089508056640625, 0.430938720703125, 0.4529266357421875, 0.47491455078125, 0.4969024658203125, 0.518890380859375, 0.5408782958984375, 0.5628662109375, 0.5848541259765625, 0.606842041015625, 0.6288299560546875, 0.65081787109375, 0.6728057861328125, 0.694793701171875, 0.7167816162109375, 0.73876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 11.0, 10.0, 11.0, 15.0, 10.0, 15.0, 14.0, 17.0, 22.0, 30.0, 43.0, 32.0, 41.0, 34.0, 53.0, 40.0, 52.0, 50.0, 52.0, 58.0, 50.0, 27.0, 43.0, 46.0, 30.0, 24.0, 28.0, 23.0, 21.0, 15.0, 17.0, 12.0, 13.0, 11.0, 11.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.896484375, -0.8692474365234375, -0.842010498046875, -0.8147735595703125, -0.78753662109375, -0.7602996826171875, -0.733062744140625, -0.7058258056640625, -0.6785888671875, -0.6513519287109375, -0.624114990234375, -0.5968780517578125, -0.56964111328125, -0.5424041748046875, -0.515167236328125, -0.4879302978515625, -0.460693359375, -0.4334564208984375, -0.406219482421875, -0.3789825439453125, -0.35174560546875, -0.3245086669921875, -0.297271728515625, -0.2700347900390625, -0.2427978515625, -0.2155609130859375, -0.188323974609375, -0.1610870361328125, -0.13385009765625, -0.1066131591796875, -0.079376220703125, -0.0521392822265625, -0.02490234375, 0.0023345947265625, 0.029571533203125, 0.0568084716796875, 0.08404541015625, 0.1112823486328125, 0.138519287109375, 0.1657562255859375, 0.1929931640625, 0.2202301025390625, 0.247467041015625, 0.2747039794921875, 0.30194091796875, 0.3291778564453125, 0.356414794921875, 0.3836517333984375, 0.410888671875, 0.4381256103515625, 0.465362548828125, 0.4925994873046875, 0.51983642578125, 0.5470733642578125, 0.574310302734375, 0.6015472412109375, 0.6287841796875, 0.6560211181640625, 0.683258056640625, 0.7104949951171875, 0.73773193359375, 0.7649688720703125, 0.792205810546875, 0.8194427490234375, 0.8466796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 10.0, 4.0, 3.0, 12.0, 14.0, 13.0, 13.0, 35.0, 35.0, 51.0, 102.0, 159.0, 276.0, 477.0, 1011.0, 2523.0, 8073.0, 36434.0, 373012.0, 562584.0, 48168.0, 10150.0, 2967.0, 1113.0, 511.0, 303.0, 133.0, 92.0, 74.0, 56.0, 35.0, 27.0, 18.0, 15.0, 11.0, 7.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.669921875, -0.6523284912109375, -0.634735107421875, -0.6171417236328125, -0.59954833984375, -0.5819549560546875, -0.564361572265625, -0.5467681884765625, -0.5291748046875, -0.5115814208984375, -0.493988037109375, -0.4763946533203125, -0.45880126953125, -0.4412078857421875, -0.423614501953125, -0.4060211181640625, -0.388427734375, -0.3708343505859375, -0.353240966796875, -0.3356475830078125, -0.31805419921875, -0.3004608154296875, -0.282867431640625, -0.2652740478515625, -0.2476806640625, -0.2300872802734375, -0.212493896484375, -0.1949005126953125, -0.17730712890625, -0.1597137451171875, -0.142120361328125, -0.1245269775390625, -0.10693359375, -0.0893402099609375, -0.071746826171875, -0.0541534423828125, -0.03656005859375, -0.0189666748046875, -0.001373291015625, 0.0162200927734375, 0.0338134765625, 0.0514068603515625, 0.069000244140625, 0.0865936279296875, 0.10418701171875, 0.1217803955078125, 0.139373779296875, 0.1569671630859375, 0.174560546875, 0.1921539306640625, 0.209747314453125, 0.2273406982421875, 0.24493408203125, 0.2625274658203125, 0.280120849609375, 0.2977142333984375, 0.3153076171875, 0.3329010009765625, 0.350494384765625, 0.3680877685546875, 0.38568115234375, 0.4032745361328125, 0.420867919921875, 0.4384613037109375, 0.4560546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 4.0, 9.0, 7.0, 12.0, 10.0, 11.0, 22.0, 37.0, 49.0, 48.0, 56.0, 71.0, 130.0, 115.0, 103.0, 81.0, 51.0, 49.0, 32.0, 15.0, 15.0, 14.0, 9.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.867813110351562e-05, -7.638614624738693e-05, -7.409416139125824e-05, -7.180217653512955e-05, -6.951019167900085e-05, -6.721820682287216e-05, -6.492622196674347e-05, -6.263423711061478e-05, -6.0342252254486084e-05, -5.805026739835739e-05, -5.57582825422287e-05, -5.3466297686100006e-05, -5.1174312829971313e-05, -4.888232797384262e-05, -4.659034311771393e-05, -4.4298358261585236e-05, -4.200637340545654e-05, -3.971438854932785e-05, -3.742240369319916e-05, -3.5130418837070465e-05, -3.283843398094177e-05, -3.054644912481308e-05, -2.8254464268684387e-05, -2.5962479412555695e-05, -2.3670494556427002e-05, -2.137850970029831e-05, -1.9086524844169617e-05, -1.6794539988040924e-05, -1.4502555131912231e-05, -1.2210570275783539e-05, -9.918585419654846e-06, -7.6266005635261536e-06, -5.334615707397461e-06, -3.0426308512687683e-06, -7.506459951400757e-07, 1.541338860988617e-06, 3.8333237171173096e-06, 6.125308573246002e-06, 8.417293429374695e-06, 1.0709278285503387e-05, 1.300126314163208e-05, 1.5293247997760773e-05, 1.7585232853889465e-05, 1.9877217710018158e-05, 2.216920256614685e-05, 2.4461187422275543e-05, 2.6753172278404236e-05, 2.904515713453293e-05, 3.133714199066162e-05, 3.3629126846790314e-05, 3.5921111702919006e-05, 3.82130965590477e-05, 4.050508141517639e-05, 4.2797066271305084e-05, 4.508905112743378e-05, 4.738103598356247e-05, 4.967302083969116e-05, 5.1965005695819855e-05, 5.425699055194855e-05, 5.654897540807724e-05, 5.884096026420593e-05, 6.113294512033463e-05, 6.342492997646332e-05, 6.571691483259201e-05, 6.80088996887207e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 4.0, 8.0, 5.0, 8.0, 20.0, 15.0, 40.0, 44.0, 67.0, 106.0, 162.0, 253.0, 488.0, 1086.0, 2538.0, 8058.0, 40304.0, 741258.0, 223736.0, 21644.0, 5184.0, 1764.0, 803.0, 374.0, 183.0, 116.0, 79.0, 64.0, 41.0, 26.0, 24.0, 8.0, 10.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8203125, -0.7918548583984375, -0.763397216796875, -0.7349395751953125, -0.70648193359375, -0.6780242919921875, -0.649566650390625, -0.6211090087890625, -0.5926513671875, -0.5641937255859375, -0.535736083984375, -0.5072784423828125, -0.47882080078125, -0.4503631591796875, -0.421905517578125, -0.3934478759765625, -0.364990234375, -0.3365325927734375, -0.308074951171875, -0.2796173095703125, -0.25115966796875, -0.2227020263671875, -0.194244384765625, -0.1657867431640625, -0.1373291015625, -0.1088714599609375, -0.080413818359375, -0.0519561767578125, -0.02349853515625, 0.0049591064453125, 0.033416748046875, 0.0618743896484375, 0.09033203125, 0.1187896728515625, 0.147247314453125, 0.1757049560546875, 0.20416259765625, 0.2326202392578125, 0.261077880859375, 0.2895355224609375, 0.3179931640625, 0.3464508056640625, 0.374908447265625, 0.4033660888671875, 0.43182373046875, 0.4602813720703125, 0.488739013671875, 0.5171966552734375, 0.545654296875, 0.5741119384765625, 0.602569580078125, 0.6310272216796875, 0.65948486328125, 0.6879425048828125, 0.716400146484375, 0.7448577880859375, 0.7733154296875, 0.8017730712890625, 0.830230712890625, 0.8586883544921875, 0.88714599609375, 0.9156036376953125, 0.944061279296875, 0.9725189208984375, 1.0009765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 8.0, 10.0, 21.0, 21.0, 41.0, 67.0, 95.0, 178.0, 192.0, 123.0, 54.0, 53.0, 29.0, 21.0, 11.0, 7.0, 7.0, 8.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5383453369140625, -0.522979736328125, -0.5076141357421875, -0.49224853515625, -0.4768829345703125, -0.461517333984375, -0.4461517333984375, -0.4307861328125, -0.4154205322265625, -0.400054931640625, -0.3846893310546875, -0.36932373046875, -0.3539581298828125, -0.338592529296875, -0.3232269287109375, -0.307861328125, -0.2924957275390625, -0.277130126953125, -0.2617645263671875, -0.24639892578125, -0.2310333251953125, -0.215667724609375, -0.2003021240234375, -0.1849365234375, -0.1695709228515625, -0.154205322265625, -0.1388397216796875, -0.12347412109375, -0.1081085205078125, -0.092742919921875, -0.0773773193359375, -0.06201171875, -0.0466461181640625, -0.031280517578125, -0.0159149169921875, -0.00054931640625, 0.0148162841796875, 0.030181884765625, 0.0455474853515625, 0.0609130859375, 0.0762786865234375, 0.091644287109375, 0.1070098876953125, 0.12237548828125, 0.1377410888671875, 0.153106689453125, 0.1684722900390625, 0.183837890625, 0.1992034912109375, 0.214569091796875, 0.2299346923828125, 0.24530029296875, 0.2606658935546875, 0.276031494140625, 0.2913970947265625, 0.3067626953125, 0.3221282958984375, 0.337493896484375, 0.3528594970703125, 0.36822509765625, 0.3835906982421875, 0.398956298828125, 0.4143218994140625, 0.4296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 9.0, 17.0, 23.0, 53.0, 97.0, 127.0, 172.0, 189.0, 110.0, 84.0, 37.0, 25.0, 14.0, 8.0, 17.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.693691730499268, -6.434723854064941, -6.175756454467773, -5.9167890548706055, -5.657821178436279, -5.398853302001953, -5.139885902404785, -4.880918502807617, -4.621950626373291, -4.362982749938965, -4.104015350341797, -3.84504771232605, -3.5860800743103027, -3.3271124362945557, -3.0681447982788086, -2.8091771602630615, -2.5502095222473145, -2.2912418842315674, -2.0322742462158203, -1.7733066082000732, -1.5143389701843262, -1.255371332168579, -0.996403694152832, -0.737436056137085, -0.4784684181213379, -0.21950078010559082, 0.03946685791015625, 0.2984344959259033, 0.5574021339416504, 0.8163697719573975, 1.0753374099731445, 1.3343050479888916, 1.5932722091674805, 1.8522398471832275, 2.1112074851989746, 2.3701751232147217, 2.6291427612304688, 2.888110399246216, 3.147078037261963, 3.40604567527771, 3.665013313293457, 3.923980951309204, 4.182948589324951, 4.441916465759277, 4.700883865356445, 4.959851264953613, 5.2188191413879395, 5.477787017822266, 5.736754417419434, 5.995721817016602, 6.254689693450928, 6.513657569885254, 6.772624969482422, 7.03159236907959, 7.290560245513916, 7.549528121948242, 7.80849552154541, 8.067462921142578, 8.326431274414062, 8.58539867401123, 8.844366073608398, 9.103333473205566, 9.362300872802734, 9.621269226074219, 9.880236625671387]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 10.0, 8.0, 9.0, 15.0, 15.0, 19.0, 29.0, 28.0, 34.0, 33.0, 46.0, 46.0, 33.0, 55.0, 64.0, 42.0, 53.0, 47.0, 51.0, 41.0, 54.0, 40.0, 31.0, 30.0, 38.0, 37.0, 26.0, 13.0, 11.0, 9.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.510470390319824, -5.339556694030762, -5.168642520904541, -4.9977288246154785, -4.826814651489258, -4.655900955200195, -4.484987258911133, -4.314073085784912, -4.143158912658691, -3.97224497795105, -3.801331043243408, -3.6304173469543457, -3.459503173828125, -3.2885894775390625, -3.117675542831421, -2.9467616081237793, -2.775847911834717, -2.604933977127075, -2.4340200424194336, -2.263106346130371, -2.0921921730041504, -1.9212783575057983, -1.7503645420074463, -1.5794506072998047, -1.408536672592163, -1.2376227378845215, -1.0667088031768799, -0.8957949876785278, -0.7248810529708862, -0.5539671182632446, -0.3830533027648926, -0.21213936805725098, -0.041225433349609375, 0.12968847155570984, 0.30060237646102905, 0.4715162515640259, 0.6424301862716675, 0.8133441209793091, 0.9842579364776611, 1.1551718711853027, 1.3260858058929443, 1.496999740600586, 1.6679136753082275, 1.8388274908065796, 2.0097413063049316, 2.1806554794311523, 2.351569175720215, 2.5224831104278564, 2.693397045135498, 2.8643109798431396, 3.0352249145507812, 3.2061386108398438, 3.3770527839660645, 3.547966480255127, 3.7188804149627686, 3.88979434967041, 4.060708045959473, 4.231621742248535, 4.402535915374756, 4.573449611663818, 4.744363784790039, 4.915277481079102, 5.086191177368164, 5.257105350494385, 5.4280195236206055]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 9.0, 20.0, 37.0, 61.0, 101.0, 176.0, 320.0, 952.0, 4085.0, 48647.0, 4115014.0, 20403.0, 2920.0, 837.0, 333.0, 177.0, 75.0, 41.0, 18.0, 13.0, 10.0, 14.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5390625, -5.38677978515625, -5.2344970703125, -5.08221435546875, -4.929931640625, -4.77764892578125, -4.6253662109375, -4.47308349609375, -4.32080078125, -4.16851806640625, -4.0162353515625, -3.86395263671875, -3.711669921875, -3.55938720703125, -3.4071044921875, -3.25482177734375, -3.1025390625, -2.95025634765625, -2.7979736328125, -2.64569091796875, -2.493408203125, -2.34112548828125, -2.1888427734375, -2.03656005859375, -1.88427734375, -1.73199462890625, -1.5797119140625, -1.42742919921875, -1.275146484375, -1.12286376953125, -0.9705810546875, -0.81829833984375, -0.666015625, -0.51373291015625, -0.3614501953125, -0.20916748046875, -0.056884765625, 0.09539794921875, 0.2476806640625, 0.39996337890625, 0.55224609375, 0.70452880859375, 0.8568115234375, 1.00909423828125, 1.161376953125, 1.31365966796875, 1.4659423828125, 1.61822509765625, 1.7705078125, 1.92279052734375, 2.0750732421875, 2.22735595703125, 2.379638671875, 2.53192138671875, 2.6842041015625, 2.83648681640625, 2.98876953125, 3.14105224609375, 3.2933349609375, 3.44561767578125, 3.597900390625, 3.75018310546875, 3.9024658203125, 4.05474853515625, 4.20703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 3.0, 18.0, 30.0, 40.0, 53.0, 80.0, 79.0, 93.0, 115.0, 90.0, 92.0, 90.0, 64.0, 52.0, 29.0, 27.0, 17.0, 7.0, 4.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.57159423828125, -0.5572509765625, -0.54290771484375, -0.528564453125, -0.51422119140625, -0.4998779296875, -0.48553466796875, -0.47119140625, -0.45684814453125, -0.4425048828125, -0.42816162109375, -0.413818359375, -0.39947509765625, -0.3851318359375, -0.37078857421875, -0.3564453125, -0.34210205078125, -0.3277587890625, -0.31341552734375, -0.299072265625, -0.28472900390625, -0.2703857421875, -0.25604248046875, -0.24169921875, -0.22735595703125, -0.2130126953125, -0.19866943359375, -0.184326171875, -0.16998291015625, -0.1556396484375, -0.14129638671875, -0.126953125, -0.11260986328125, -0.0982666015625, -0.08392333984375, -0.069580078125, -0.05523681640625, -0.0408935546875, -0.02655029296875, -0.01220703125, 0.00213623046875, 0.0164794921875, 0.03082275390625, 0.045166015625, 0.05950927734375, 0.0738525390625, 0.08819580078125, 0.1025390625, 0.11688232421875, 0.1312255859375, 0.14556884765625, 0.159912109375, 0.17425537109375, 0.1885986328125, 0.20294189453125, 0.21728515625, 0.23162841796875, 0.2459716796875, 0.26031494140625, 0.274658203125, 0.28900146484375, 0.3033447265625, 0.31768798828125, 0.33203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 17.0, 18.0, 28.0, 22.0, 32.0, 61.0, 71.0, 118.0, 153.0, 214.0, 290.0, 483.0, 803.0, 1417.0, 2873.0, 6160.0, 15468.0, 53217.0, 988679.0, 3030337.0, 62750.0, 17376.0, 6577.0, 2990.0, 1600.0, 830.0, 552.0, 348.0, 216.0, 134.0, 122.0, 65.0, 77.0, 38.0, 40.0, 18.0, 16.0, 10.0, 13.0, 7.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.794921875, -1.73712158203125, -1.6793212890625, -1.62152099609375, -1.563720703125, -1.50592041015625, -1.4481201171875, -1.39031982421875, -1.33251953125, -1.27471923828125, -1.2169189453125, -1.15911865234375, -1.101318359375, -1.04351806640625, -0.9857177734375, -0.92791748046875, -0.8701171875, -0.81231689453125, -0.7545166015625, -0.69671630859375, -0.638916015625, -0.58111572265625, -0.5233154296875, -0.46551513671875, -0.40771484375, -0.34991455078125, -0.2921142578125, -0.23431396484375, -0.176513671875, -0.11871337890625, -0.0609130859375, -0.00311279296875, 0.0546875, 0.11248779296875, 0.1702880859375, 0.22808837890625, 0.285888671875, 0.34368896484375, 0.4014892578125, 0.45928955078125, 0.51708984375, 0.57489013671875, 0.6326904296875, 0.69049072265625, 0.748291015625, 0.80609130859375, 0.8638916015625, 0.92169189453125, 0.9794921875, 1.03729248046875, 1.0950927734375, 1.15289306640625, 1.210693359375, 1.26849365234375, 1.3262939453125, 1.38409423828125, 1.44189453125, 1.49969482421875, 1.5574951171875, 1.61529541015625, 1.673095703125, 1.73089599609375, 1.7886962890625, 1.84649658203125, 1.904296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 6.0, 14.0, 12.0, 23.0, 18.0, 47.0, 49.0, 70.0, 214.0, 776.0, 2219.0, 287.0, 118.0, 63.0, 48.0, 16.0, 13.0, 14.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7021484375, -0.680999755859375, -0.65985107421875, -0.638702392578125, -0.6175537109375, -0.596405029296875, -0.57525634765625, -0.554107666015625, -0.532958984375, -0.511810302734375, -0.49066162109375, -0.469512939453125, -0.4483642578125, -0.427215576171875, -0.40606689453125, -0.384918212890625, -0.36376953125, -0.342620849609375, -0.32147216796875, -0.300323486328125, -0.2791748046875, -0.258026123046875, -0.23687744140625, -0.215728759765625, -0.194580078125, -0.173431396484375, -0.15228271484375, -0.131134033203125, -0.1099853515625, -0.088836669921875, -0.06768798828125, -0.046539306640625, -0.025390625, -0.004241943359375, 0.01690673828125, 0.038055419921875, 0.0592041015625, 0.080352783203125, 0.10150146484375, 0.122650146484375, 0.143798828125, 0.164947509765625, 0.18609619140625, 0.207244873046875, 0.2283935546875, 0.249542236328125, 0.27069091796875, 0.291839599609375, 0.31298828125, 0.334136962890625, 0.35528564453125, 0.376434326171875, 0.3975830078125, 0.418731689453125, 0.43988037109375, 0.461029052734375, 0.482177734375, 0.503326416015625, 0.52447509765625, 0.545623779296875, 0.5667724609375, 0.587921142578125, 0.60906982421875, 0.630218505859375, 0.6513671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 25.0, 27.0, 67.0, 98.0, 191.0, 233.0, 158.0, 93.0, 43.0, 15.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1549787521362305, -4.990641117095947, -4.826303958892822, -4.661966323852539, -4.497629165649414, -4.333291530609131, -4.168954372406006, -4.004616737365723, -3.8402793407440186, -3.6759419441223145, -3.5116045475006104, -3.3472671508789062, -3.182929515838623, -3.018592357635498, -2.854254722595215, -2.6899173259735107, -2.5255799293518066, -2.3612425327301025, -2.1969051361083984, -2.0325677394866943, -1.8682302236557007, -1.7038928270339966, -1.539555311203003, -1.3752179145812988, -1.2108805179595947, -1.0465431213378906, -0.8822056651115417, -0.7178682088851929, -0.5535308122634888, -0.38919341564178467, -0.2248559594154358, -0.060518503189086914, 0.10381937026977539, 0.2681567966938019, 0.43249422311782837, 0.5968316793441772, 0.7611690759658813, 0.9255064725875854, 1.089843988418579, 1.2541813850402832, 1.4185187816619873, 1.5828561782836914, 1.7471935749053955, 1.9115310907363892, 2.075868606567383, 2.240205764770508, 2.404543399810791, 2.568880796432495, 2.733218193054199, 2.8975555896759033, 3.0618929862976074, 3.2262303829193115, 3.3905677795410156, 3.554905414581299, 3.719242811203003, 3.883580207824707, 4.047917366027832, 4.212255001068115, 4.37659215927124, 4.540929794311523, 4.705266952514648, 4.869604587554932, 5.033941745758057, 5.19827938079834, 5.362617015838623]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 8.0, 9.0, 13.0, 17.0, 12.0, 17.0, 25.0, 25.0, 30.0, 30.0, 52.0, 39.0, 46.0, 49.0, 50.0, 45.0, 44.0, 54.0, 52.0, 33.0, 46.0, 45.0, 34.0, 39.0, 25.0, 34.0, 25.0, 23.0, 16.0, 17.0, 10.0, 2.0, 5.0, 10.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9063098430633545, -1.847139835357666, -1.787969946861267, -1.7287999391555786, -1.6696300506591797, -1.6104600429534912, -1.5512900352478027, -1.4921201467514038, -1.4329502582550049, -1.3737802505493164, -1.3146103620529175, -1.255440354347229, -1.19627046585083, -1.1371004581451416, -1.0779304504394531, -1.0187605619430542, -0.9595905542373657, -0.900420606136322, -0.8412506580352783, -0.7820806503295898, -0.7229107618331909, -0.6637407541275024, -0.6045708060264587, -0.545400857925415, -0.48623090982437134, -0.42706096172332764, -0.36789101362228394, -0.30872103571891785, -0.24955108761787415, -0.19038113951683044, -0.13121116161346436, -0.07204121351242065, -0.012871146202087402, 0.046298809349536896, 0.1054687649011612, 0.1646387279033661, 0.2238086760044098, 0.2829786241054535, 0.3421486020088196, 0.4013185501098633, 0.460488498210907, 0.5196584463119507, 0.5788283944129944, 0.6379983425140381, 0.6971683502197266, 0.7563382387161255, 0.815508246421814, 0.8746781945228577, 0.9338481426239014, 0.9930180907249451, 1.0521880388259888, 1.1113580465316772, 1.1705279350280762, 1.2296979427337646, 1.2888679504394531, 1.348037838935852, 1.407207727432251, 1.4663777351379395, 1.5255476236343384, 1.5847176313400269, 1.6438875198364258, 1.7030575275421143, 1.7622275352478027, 1.8213974237442017, 1.8805674314498901]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 5.0, 4.0, 5.0, 23.0, 20.0, 30.0, 47.0, 62.0, 80.0, 165.0, 262.0, 510.0, 1160.0, 3052.0, 10588.0, 50576.0, 430287.0, 479140.0, 55321.0, 11515.0, 3259.0, 1198.0, 521.0, 261.0, 159.0, 89.0, 50.0, 51.0, 35.0, 17.0, 10.0, 12.0, 6.0, 7.0, 1.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6793365478515625, -1.619415283203125, -1.5594940185546875, -1.49957275390625, -1.4396514892578125, -1.379730224609375, -1.3198089599609375, -1.2598876953125, -1.1999664306640625, -1.140045166015625, -1.0801239013671875, -1.02020263671875, -0.9602813720703125, -0.900360107421875, -0.8404388427734375, -0.780517578125, -0.7205963134765625, -0.660675048828125, -0.6007537841796875, -0.54083251953125, -0.4809112548828125, -0.420989990234375, -0.3610687255859375, -0.3011474609375, -0.2412261962890625, -0.181304931640625, -0.1213836669921875, -0.06146240234375, -0.0015411376953125, 0.058380126953125, 0.1183013916015625, 0.17822265625, 0.2381439208984375, 0.298065185546875, 0.3579864501953125, 0.41790771484375, 0.4778289794921875, 0.537750244140625, 0.5976715087890625, 0.6575927734375, 0.7175140380859375, 0.777435302734375, 0.8373565673828125, 0.89727783203125, 0.9571990966796875, 1.017120361328125, 1.0770416259765625, 1.136962890625, 1.1968841552734375, 1.256805419921875, 1.3167266845703125, 1.37664794921875, 1.4365692138671875, 1.496490478515625, 1.5564117431640625, 1.6163330078125, 1.6762542724609375, 1.736175537109375, 1.7960968017578125, 1.85601806640625, 1.9159393310546875, 1.975860595703125, 2.0357818603515625, 2.095703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 10.0, 26.0, 33.0, 60.0, 83.0, 83.0, 91.0, 113.0, 82.0, 91.0, 97.0, 57.0, 54.0, 43.0, 23.0, 17.0, 5.0, 9.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5694465637207031, -0.5544204711914062, -0.5393943786621094, -0.5243682861328125, -0.5093421936035156, -0.49431610107421875, -0.4792900085449219, -0.464263916015625, -0.4492378234863281, -0.43421173095703125, -0.4191856384277344, -0.4041595458984375, -0.3891334533691406, -0.37410736083984375, -0.3590812683105469, -0.34405517578125, -0.3290290832519531, -0.31400299072265625, -0.2989768981933594, -0.2839508056640625, -0.2689247131347656, -0.25389862060546875, -0.23887252807617188, -0.223846435546875, -0.20882034301757812, -0.19379425048828125, -0.17876815795898438, -0.1637420654296875, -0.14871597290039062, -0.13368988037109375, -0.11866378784179688, -0.1036376953125, -0.08861160278320312, -0.07358551025390625, -0.058559417724609375, -0.0435333251953125, -0.028507232666015625, -0.01348114013671875, 0.001544952392578125, 0.016571044921875, 0.031597137451171875, 0.04662322998046875, 0.061649322509765625, 0.0766754150390625, 0.09170150756835938, 0.10672760009765625, 0.12175369262695312, 0.13677978515625, 0.15180587768554688, 0.16683197021484375, 0.18185806274414062, 0.1968841552734375, 0.21191024780273438, 0.22693634033203125, 0.24196243286132812, 0.256988525390625, 0.2720146179199219, 0.28704071044921875, 0.3020668029785156, 0.3170928955078125, 0.3321189880371094, 0.34714508056640625, 0.3621711730957031, 0.377197265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 14.0, 19.0, 21.0, 36.0, 46.0, 91.0, 126.0, 190.0, 327.0, 523.0, 924.0, 1626.0, 2755.0, 5214.0, 9937.0, 19983.0, 44134.0, 107523.0, 305378.0, 337143.0, 119485.0, 47860.0, 21973.0, 10875.0, 5366.0, 2923.0, 1612.0, 982.0, 527.0, 325.0, 188.0, 156.0, 85.0, 53.0, 38.0, 39.0, 17.0, 9.0, 9.0, 5.0, 4.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6133880615234375, -0.591522216796875, -0.5696563720703125, -0.54779052734375, -0.5259246826171875, -0.504058837890625, -0.4821929931640625, -0.4603271484375, -0.4384613037109375, -0.416595458984375, -0.3947296142578125, -0.37286376953125, -0.3509979248046875, -0.329132080078125, -0.3072662353515625, -0.285400390625, -0.2635345458984375, -0.241668701171875, -0.2198028564453125, -0.19793701171875, -0.1760711669921875, -0.154205322265625, -0.1323394775390625, -0.1104736328125, -0.0886077880859375, -0.066741943359375, -0.0448760986328125, -0.02301025390625, -0.0011444091796875, 0.020721435546875, 0.0425872802734375, 0.064453125, 0.0863189697265625, 0.108184814453125, 0.1300506591796875, 0.15191650390625, 0.1737823486328125, 0.195648193359375, 0.2175140380859375, 0.2393798828125, 0.2612457275390625, 0.283111572265625, 0.3049774169921875, 0.32684326171875, 0.3487091064453125, 0.370574951171875, 0.3924407958984375, 0.414306640625, 0.4361724853515625, 0.458038330078125, 0.4799041748046875, 0.50177001953125, 0.5236358642578125, 0.545501708984375, 0.5673675537109375, 0.5892333984375, 0.6110992431640625, 0.632965087890625, 0.6548309326171875, 0.67669677734375, 0.6985626220703125, 0.720428466796875, 0.7422943115234375, 0.76416015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 4.0, 7.0, 17.0, 13.0, 10.0, 14.0, 23.0, 22.0, 28.0, 25.0, 38.0, 50.0, 34.0, 43.0, 46.0, 37.0, 37.0, 39.0, 47.0, 43.0, 68.0, 36.0, 38.0, 34.0, 42.0, 25.0, 22.0, 23.0, 22.0, 15.0, 21.0, 14.0, 14.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1103515625, -1.07989501953125, -1.0494384765625, -1.01898193359375, -0.988525390625, -0.95806884765625, -0.9276123046875, -0.89715576171875, -0.86669921875, -0.83624267578125, -0.8057861328125, -0.77532958984375, -0.744873046875, -0.71441650390625, -0.6839599609375, -0.65350341796875, -0.623046875, -0.59259033203125, -0.5621337890625, -0.53167724609375, -0.501220703125, -0.47076416015625, -0.4403076171875, -0.40985107421875, -0.37939453125, -0.34893798828125, -0.3184814453125, -0.28802490234375, -0.257568359375, -0.22711181640625, -0.1966552734375, -0.16619873046875, -0.1357421875, -0.10528564453125, -0.0748291015625, -0.04437255859375, -0.013916015625, 0.01654052734375, 0.0469970703125, 0.07745361328125, 0.10791015625, 0.13836669921875, 0.1688232421875, 0.19927978515625, 0.229736328125, 0.26019287109375, 0.2906494140625, 0.32110595703125, 0.3515625, 0.38201904296875, 0.4124755859375, 0.44293212890625, 0.473388671875, 0.50384521484375, 0.5343017578125, 0.56475830078125, 0.59521484375, 0.62567138671875, 0.6561279296875, 0.68658447265625, 0.717041015625, 0.74749755859375, 0.7779541015625, 0.80841064453125, 0.8388671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 8.0, 10.0, 11.0, 37.0, 45.0, 96.0, 203.0, 428.0, 943.0, 2475.0, 8432.0, 58783.0, 850072.0, 109781.0, 11968.0, 3119.0, 1113.0, 512.0, 237.0, 122.0, 61.0, 35.0, 20.0, 8.0, 4.0, 10.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86181640625, -0.837615966796875, -0.81341552734375, -0.789215087890625, -0.7650146484375, -0.740814208984375, -0.71661376953125, -0.692413330078125, -0.668212890625, -0.644012451171875, -0.61981201171875, -0.595611572265625, -0.5714111328125, -0.547210693359375, -0.52301025390625, -0.498809814453125, -0.474609375, -0.450408935546875, -0.42620849609375, -0.402008056640625, -0.3778076171875, -0.353607177734375, -0.32940673828125, -0.305206298828125, -0.281005859375, -0.256805419921875, -0.23260498046875, -0.208404541015625, -0.1842041015625, -0.160003662109375, -0.13580322265625, -0.111602783203125, -0.08740234375, -0.063201904296875, -0.03900146484375, -0.014801025390625, 0.0093994140625, 0.033599853515625, 0.05780029296875, 0.082000732421875, 0.106201171875, 0.130401611328125, 0.15460205078125, 0.178802490234375, 0.2030029296875, 0.227203369140625, 0.25140380859375, 0.275604248046875, 0.2998046875, 0.324005126953125, 0.34820556640625, 0.372406005859375, 0.3966064453125, 0.420806884765625, 0.44500732421875, 0.469207763671875, 0.493408203125, 0.517608642578125, 0.54180908203125, 0.566009521484375, 0.5902099609375, 0.614410400390625, 0.63861083984375, 0.662811279296875, 0.68701171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 8.0, 12.0, 7.0, 12.0, 24.0, 19.0, 45.0, 41.0, 77.0, 105.0, 138.0, 130.0, 115.0, 67.0, 53.0, 45.0, 18.0, 21.0, 11.0, 4.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.614229202270508e-05, -9.313132613897324e-05, -9.01203602552414e-05, -8.710939437150955e-05, -8.409842848777771e-05, -8.108746260404587e-05, -7.807649672031403e-05, -7.506553083658218e-05, -7.205456495285034e-05, -6.90435990691185e-05, -6.603263318538666e-05, -6.302166730165482e-05, -6.0010701417922974e-05, -5.699973553419113e-05, -5.398876965045929e-05, -5.097780376672745e-05, -4.7966837882995605e-05, -4.4955871999263763e-05, -4.194490611553192e-05, -3.893394023180008e-05, -3.592297434806824e-05, -3.2912008464336395e-05, -2.9901042580604553e-05, -2.689007669687271e-05, -2.387911081314087e-05, -2.0868144929409027e-05, -1.7857179045677185e-05, -1.4846213161945343e-05, -1.1835247278213501e-05, -8.824281394481659e-06, -5.813315510749817e-06, -2.802349627017975e-06, 2.086162567138672e-07, 3.2195821404457092e-06, 6.230548024177551e-06, 9.241513907909393e-06, 1.2252479791641235e-05, 1.5263445675373077e-05, 1.827441155910492e-05, 2.128537744283676e-05, 2.4296343326568604e-05, 2.7307309210300446e-05, 3.0318275094032288e-05, 3.332924097776413e-05, 3.634020686149597e-05, 3.9351172745227814e-05, 4.2362138628959656e-05, 4.53731045126915e-05, 4.838407039642334e-05, 5.139503628015518e-05, 5.4406002163887024e-05, 5.7416968047618866e-05, 6.042793393135071e-05, 6.343889981508255e-05, 6.644986569881439e-05, 6.946083158254623e-05, 7.247179746627808e-05, 7.548276335000992e-05, 7.849372923374176e-05, 8.15046951174736e-05, 8.451566100120544e-05, 8.752662688493729e-05, 9.053759276866913e-05, 9.354855865240097e-05, 9.655952453613281e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 23.0, 25.0, 46.0, 66.0, 83.0, 152.0, 262.0, 488.0, 943.0, 2408.0, 7985.0, 43881.0, 889968.0, 85280.0, 11299.0, 3111.0, 1175.0, 563.0, 249.0, 181.0, 123.0, 65.0, 50.0, 25.0, 29.0, 12.0, 12.0, 11.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.1598587036132812, -1.1263580322265625, -1.0928573608398438, -1.059356689453125, -1.0258560180664062, -0.9923553466796875, -0.9588546752929688, -0.92535400390625, -0.8918533325195312, -0.8583526611328125, -0.8248519897460938, -0.791351318359375, -0.7578506469726562, -0.7243499755859375, -0.6908493041992188, -0.6573486328125, -0.6238479614257812, -0.5903472900390625, -0.5568466186523438, -0.523345947265625, -0.48984527587890625, -0.4563446044921875, -0.42284393310546875, -0.38934326171875, -0.35584259033203125, -0.3223419189453125, -0.28884124755859375, -0.255340576171875, -0.22183990478515625, -0.1883392333984375, -0.15483856201171875, -0.121337890625, -0.08783721923828125, -0.0543365478515625, -0.02083587646484375, 0.012664794921875, 0.04616546630859375, 0.0796661376953125, 0.11316680908203125, 0.14666748046875, 0.18016815185546875, 0.2136688232421875, 0.24716949462890625, 0.280670166015625, 0.31417083740234375, 0.3476715087890625, 0.38117218017578125, 0.4146728515625, 0.44817352294921875, 0.4816741943359375, 0.5151748657226562, 0.548675537109375, 0.5821762084960938, 0.6156768798828125, 0.6491775512695312, 0.68267822265625, 0.7161788940429688, 0.7496795654296875, 0.7831802368164062, 0.816680908203125, 0.8501815795898438, 0.8836822509765625, 0.9171829223632812, 0.95068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 6.0, 17.0, 22.0, 31.0, 97.0, 257.0, 302.0, 115.0, 55.0, 15.0, 23.0, 16.0, 13.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62353515625, -0.5976333618164062, -0.5717315673828125, -0.5458297729492188, -0.519927978515625, -0.49402618408203125, -0.4681243896484375, -0.44222259521484375, -0.41632080078125, -0.39041900634765625, -0.3645172119140625, -0.33861541748046875, -0.312713623046875, -0.28681182861328125, -0.2609100341796875, -0.23500823974609375, -0.2091064453125, -0.18320465087890625, -0.1573028564453125, -0.13140106201171875, -0.105499267578125, -0.07959747314453125, -0.0536956787109375, -0.02779388427734375, -0.00189208984375, 0.02400970458984375, 0.0499114990234375, 0.07581329345703125, 0.101715087890625, 0.12761688232421875, 0.1535186767578125, 0.17942047119140625, 0.205322265625, 0.23122406005859375, 0.2571258544921875, 0.28302764892578125, 0.308929443359375, 0.33483123779296875, 0.3607330322265625, 0.38663482666015625, 0.41253662109375, 0.43843841552734375, 0.4643402099609375, 0.49024200439453125, 0.516143798828125, 0.5420455932617188, 0.5679473876953125, 0.5938491821289062, 0.6197509765625, 0.6456527709960938, 0.6715545654296875, 0.6974563598632812, 0.723358154296875, 0.7492599487304688, 0.7751617431640625, 0.8010635375976562, 0.82696533203125, 0.8528671264648438, 0.8787689208984375, 0.9046707153320312, 0.930572509765625, 0.9564743041992188, 0.9823760986328125, 1.0082778930664062, 1.0341796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 23.0, 29.0, 78.0, 131.0, 253.0, 240.0, 141.0, 64.0, 23.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.285696983337402, -6.86043643951416, -6.435175895690918, -6.009915351867676, -5.584654808044434, -5.159394264221191, -4.734133720397949, -4.308873176574707, -3.883612632751465, -3.4583520889282227, -3.0330915451049805, -2.6078310012817383, -2.182570457458496, -1.757309913635254, -1.3320493698120117, -0.9067888259887695, -0.48152828216552734, -0.056267738342285156, 0.36899280548095703, 0.7942533493041992, 1.2195138931274414, 1.6447744369506836, 2.070034980773926, 2.495295524597168, 2.92055606842041, 3.3458166122436523, 3.7710771560668945, 4.196337699890137, 4.621598243713379, 5.046858787536621, 5.472119331359863, 5.8973798751831055, 6.322641372680664, 6.747901916503906, 7.173162460327148, 7.598423004150391, 8.023683547973633, 8.448944091796875, 8.874204635620117, 9.29946517944336, 9.724725723266602, 10.149986267089844, 10.575246810913086, 11.000507354736328, 11.42576789855957, 11.851028442382812, 12.276288986206055, 12.701549530029297, 13.126810073852539, 13.552070617675781, 13.977331161499023, 14.402591705322266, 14.827852249145508, 15.25311279296875, 15.678373336791992, 16.103633880615234, 16.528894424438477, 16.95415496826172, 17.37941551208496, 17.804676055908203, 18.229936599731445, 18.655197143554688, 19.08045768737793, 19.505718231201172, 19.930978775024414]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 4.0, 11.0, 6.0, 2.0, 5.0, 9.0, 16.0, 11.0, 16.0, 22.0, 23.0, 27.0, 27.0, 24.0, 25.0, 27.0, 26.0, 37.0, 40.0, 35.0, 39.0, 48.0, 41.0, 24.0, 43.0, 35.0, 37.0, 35.0, 36.0, 33.0, 33.0, 29.0, 28.0, 20.0, 11.0, 15.0, 18.0, 21.0, 13.0, 12.0, 3.0, 9.0, 8.0, 6.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.478695869445801, -4.344449520111084, -4.210202693939209, -4.075956344604492, -3.9417099952697754, -3.8074634075164795, -3.6732168197631836, -3.538970470428467, -3.404723882675171, -3.270477294921875, -3.136230945587158, -3.0019843578338623, -2.8677377700805664, -2.7334914207458496, -2.5992448329925537, -2.464998245239258, -2.330751895904541, -2.196505308151245, -2.0622589588165283, -1.9280123710632324, -1.793765902519226, -1.6595194339752197, -1.5252728462219238, -1.3910263776779175, -1.2567799091339111, -1.1225334405899048, -0.9882869124412537, -0.8540403842926025, -0.7197939157485962, -0.5855474472045898, -0.4513009190559387, -0.3170543909072876, -0.18280792236328125, -0.048561424016952515, 0.08568507432937622, 0.21993157267570496, 0.3541780710220337, 0.48842453956604004, 0.6226710677146912, 0.7569175958633423, 0.8911640644073486, 1.025410532951355, 1.1596570014953613, 1.2939035892486572, 1.4281500577926636, 1.56239652633667, 1.6966431140899658, 1.8308895826339722, 1.9651360511779785, 2.0993826389312744, 2.233628988265991, 2.367875576019287, 2.502121925354004, 2.6363685131073, 2.7706151008605957, 2.9048614501953125, 3.0391080379486084, 3.1733546257019043, 3.307600975036621, 3.441847562789917, 3.576094150543213, 3.7103404998779297, 3.8445870876312256, 3.9788336753845215, 4.113080024719238]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 7.0, 18.0, 24.0, 39.0, 59.0, 84.0, 136.0, 163.0, 321.0, 533.0, 956.0, 2252.0, 8089.0, 68394.0, 4073571.0, 30102.0, 5648.0, 1858.0, 844.0, 456.0, 242.0, 173.0, 105.0, 55.0, 38.0, 28.0, 13.0, 16.0, 8.0, 12.0, 8.0, 4.0, 2.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.8099365234375, -3.670654296875, -3.5313720703125, -3.39208984375, -3.2528076171875, -3.113525390625, -2.9742431640625, -2.8349609375, -2.6956787109375, -2.556396484375, -2.4171142578125, -2.27783203125, -2.1385498046875, -1.999267578125, -1.8599853515625, -1.720703125, -1.5814208984375, -1.442138671875, -1.3028564453125, -1.16357421875, -1.0242919921875, -0.885009765625, -0.7457275390625, -0.6064453125, -0.4671630859375, -0.327880859375, -0.1885986328125, -0.04931640625, 0.0899658203125, 0.229248046875, 0.3685302734375, 0.5078125, 0.6470947265625, 0.786376953125, 0.9256591796875, 1.06494140625, 1.2042236328125, 1.343505859375, 1.4827880859375, 1.6220703125, 1.7613525390625, 1.900634765625, 2.0399169921875, 2.17919921875, 2.3184814453125, 2.457763671875, 2.5970458984375, 2.736328125, 2.8756103515625, 3.014892578125, 3.1541748046875, 3.29345703125, 3.4327392578125, 3.572021484375, 3.7113037109375, 3.8505859375, 3.9898681640625, 4.129150390625, 4.2684326171875, 4.40771484375, 4.5469970703125, 4.686279296875, 4.8255615234375, 4.96484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 12.0, 5.0, 16.0, 15.0, 29.0, 37.0, 33.0, 39.0, 56.0, 67.0, 60.0, 61.0, 71.0, 66.0, 66.0, 64.0, 54.0, 54.0, 46.0, 40.0, 32.0, 18.0, 10.0, 13.0, 8.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2931251525878906, -0.28253936767578125, -0.2719535827636719, -0.2613677978515625, -0.2507820129394531, -0.24019622802734375, -0.22961044311523438, -0.219024658203125, -0.20843887329101562, -0.19785308837890625, -0.18726730346679688, -0.1766815185546875, -0.16609573364257812, -0.15550994873046875, -0.14492416381835938, -0.13433837890625, -0.12375259399414062, -0.11316680908203125, -0.10258102416992188, -0.0919952392578125, -0.08140945434570312, -0.07082366943359375, -0.060237884521484375, -0.049652099609375, -0.039066314697265625, -0.02848052978515625, -0.017894744873046875, -0.0073089599609375, 0.003276824951171875, 0.01386260986328125, 0.024448394775390625, 0.0350341796875, 0.045619964599609375, 0.05620574951171875, 0.06679153442382812, 0.0773773193359375, 0.08796310424804688, 0.09854888916015625, 0.10913467407226562, 0.119720458984375, 0.13030624389648438, 0.14089202880859375, 0.15147781372070312, 0.1620635986328125, 0.17264938354492188, 0.18323516845703125, 0.19382095336914062, 0.20440673828125, 0.21499252319335938, 0.22557830810546875, 0.23616409301757812, 0.2467498779296875, 0.2573356628417969, 0.26792144775390625, 0.2785072326660156, 0.289093017578125, 0.2996788024902344, 0.31026458740234375, 0.3208503723144531, 0.3314361572265625, 0.3420219421386719, 0.35260772705078125, 0.3631935119628906, 0.373779296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 10.0, 9.0, 15.0, 16.0, 29.0, 25.0, 49.0, 51.0, 79.0, 126.0, 146.0, 248.0, 378.0, 685.0, 1241.0, 2722.0, 6769.0, 20779.0, 149677.0, 3916333.0, 70078.0, 14545.0, 5256.0, 2287.0, 1093.0, 610.0, 299.0, 219.0, 143.0, 103.0, 65.0, 61.0, 40.0, 26.0, 18.0, 11.0, 14.0, 8.0, 5.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.01171875, -2.926544189453125, -2.84136962890625, -2.756195068359375, -2.6710205078125, -2.585845947265625, -2.50067138671875, -2.415496826171875, -2.330322265625, -2.245147705078125, -2.15997314453125, -2.074798583984375, -1.9896240234375, -1.904449462890625, -1.81927490234375, -1.734100341796875, -1.64892578125, -1.563751220703125, -1.47857666015625, -1.393402099609375, -1.3082275390625, -1.223052978515625, -1.13787841796875, -1.052703857421875, -0.967529296875, -0.882354736328125, -0.79718017578125, -0.712005615234375, -0.6268310546875, -0.541656494140625, -0.45648193359375, -0.371307373046875, -0.2861328125, -0.200958251953125, -0.11578369140625, -0.030609130859375, 0.0545654296875, 0.139739990234375, 0.22491455078125, 0.310089111328125, 0.395263671875, 0.480438232421875, 0.56561279296875, 0.650787353515625, 0.7359619140625, 0.821136474609375, 0.90631103515625, 0.991485595703125, 1.07666015625, 1.161834716796875, 1.24700927734375, 1.332183837890625, 1.4173583984375, 1.502532958984375, 1.58770751953125, 1.672882080078125, 1.758056640625, 1.843231201171875, 1.92840576171875, 2.013580322265625, 2.0987548828125, 2.183929443359375, 2.26910400390625, 2.354278564453125, 2.439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 9.0, 9.0, 23.0, 28.0, 47.0, 130.0, 334.0, 2936.0, 321.0, 101.0, 35.0, 20.0, 16.0, 11.0, 6.0, 4.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.93182373046875, -0.9022216796875, -0.87261962890625, -0.843017578125, -0.81341552734375, -0.7838134765625, -0.75421142578125, -0.724609375, -0.69500732421875, -0.6654052734375, -0.63580322265625, -0.606201171875, -0.57659912109375, -0.5469970703125, -0.51739501953125, -0.48779296875, -0.45819091796875, -0.4285888671875, -0.39898681640625, -0.369384765625, -0.33978271484375, -0.3101806640625, -0.28057861328125, -0.2509765625, -0.22137451171875, -0.1917724609375, -0.16217041015625, -0.132568359375, -0.10296630859375, -0.0733642578125, -0.04376220703125, -0.01416015625, 0.01544189453125, 0.0450439453125, 0.07464599609375, 0.104248046875, 0.13385009765625, 0.1634521484375, 0.19305419921875, 0.22265625, 0.25225830078125, 0.2818603515625, 0.31146240234375, 0.341064453125, 0.37066650390625, 0.4002685546875, 0.42987060546875, 0.45947265625, 0.48907470703125, 0.5186767578125, 0.54827880859375, 0.577880859375, 0.60748291015625, 0.6370849609375, 0.66668701171875, 0.6962890625, 0.72589111328125, 0.7554931640625, 0.78509521484375, 0.814697265625, 0.84429931640625, 0.8739013671875, 0.90350341796875, 0.93310546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 19.0, 109.0, 405.0, 322.0, 87.0, 33.0, 11.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.819730758666992, -16.460721969604492, -16.101713180541992, -15.742704391479492, -15.383695602416992, -15.024686813354492, -14.665678024291992, -14.306669235229492, -13.947660446166992, -13.588651657104492, -13.229642868041992, -12.870634078979492, -12.511625289916992, -12.152616500854492, -11.793607711791992, -11.434598922729492, -11.075591087341309, -10.716582298278809, -10.357573509216309, -9.998564720153809, -9.639555931091309, -9.280547142028809, -8.921539306640625, -8.562530517578125, -8.203521728515625, -7.844512939453125, -7.485504150390625, -7.126495361328125, -6.767486572265625, -6.408477783203125, -6.049469470977783, -5.690460681915283, -5.331451892852783, -4.972443103790283, -4.613434314727783, -4.254426002502441, -3.8954169750213623, -3.5364081859588623, -3.1773996353149414, -2.8183908462524414, -2.4593820571899414, -2.1003732681274414, -1.741364598274231, -1.3823559284210205, -1.0233471393585205, -0.6643383502960205, -0.3053297996520996, 0.05367898941040039, 0.4126877784729004, 0.7716965079307556, 1.1307052373886108, 1.4897139072418213, 1.8487226963043213, 2.2077314853668213, 2.566740036010742, 2.925748825073242, 3.284757614135742, 3.643766403198242, 4.002775192260742, 4.361783981323242, 4.720792770385742, 5.079801559448242, 5.438809871673584, 5.797818660736084, 6.156827449798584]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 17.0, 20.0, 18.0, 32.0, 43.0, 50.0, 48.0, 66.0, 62.0, 83.0, 64.0, 69.0, 61.0, 71.0, 60.0, 43.0, 37.0, 44.0, 34.0, 23.0, 16.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265709638595581, -2.1792290210723877, -2.0927481651306152, -2.006267547607422, -1.919786810874939, -1.833306074142456, -1.7468254566192627, -1.6603447198867798, -1.5738639831542969, -1.487383246421814, -1.400902509689331, -1.3144218921661377, -1.2279411554336548, -1.1414604187011719, -1.0549798011779785, -0.9684990644454956, -0.8820183277130127, -0.7955375909805298, -0.7090569138526917, -0.6225762367248535, -0.5360954999923706, -0.4496147930622101, -0.36313408613204956, -0.2766534090042114, -0.19017267227172852, -0.103691965341568, -0.01721125841140747, 0.06926944851875305, 0.15575015544891357, 0.2422308623790741, 0.3287115693092346, 0.41519224643707275, 0.5016727447509766, 0.5881534814834595, 0.6746341586112976, 0.7611148357391357, 0.8475955724716187, 0.9340763092041016, 1.020556926727295, 1.1070376634597778, 1.1935184001922607, 1.2799991369247437, 1.3664798736572266, 1.45296049118042, 1.5394412279129028, 1.6259219646453857, 1.712402582168579, 1.798883318901062, 1.885364055633545, 1.9718447923660278, 2.0583255290985107, 2.144806146621704, 2.2312870025634766, 2.31776762008667, 2.4042482376098633, 2.4907288551330566, 2.577209711074829, 2.6636903285980225, 2.750171184539795, 2.8366518020629883, 2.9231324195861816, 3.009613275527954, 3.0960938930511475, 3.18257474899292, 3.2690553665161133]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 12.0, 12.0, 21.0, 32.0, 50.0, 73.0, 163.0, 310.0, 696.0, 1731.0, 6126.0, 32135.0, 406504.0, 548706.0, 41136.0, 7301.0, 2025.0, 783.0, 327.0, 164.0, 68.0, 48.0, 42.0, 20.0, 10.0, 12.0, 11.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.67578125, -2.589630126953125, -2.50347900390625, -2.417327880859375, -2.3311767578125, -2.245025634765625, -2.15887451171875, -2.072723388671875, -1.986572265625, -1.900421142578125, -1.81427001953125, -1.728118896484375, -1.6419677734375, -1.555816650390625, -1.46966552734375, -1.383514404296875, -1.29736328125, -1.211212158203125, -1.12506103515625, -1.038909912109375, -0.9527587890625, -0.866607666015625, -0.78045654296875, -0.694305419921875, -0.608154296875, -0.522003173828125, -0.43585205078125, -0.349700927734375, -0.2635498046875, -0.177398681640625, -0.09124755859375, -0.005096435546875, 0.0810546875, 0.167205810546875, 0.25335693359375, 0.339508056640625, 0.4256591796875, 0.511810302734375, 0.59796142578125, 0.684112548828125, 0.770263671875, 0.856414794921875, 0.94256591796875, 1.028717041015625, 1.1148681640625, 1.201019287109375, 1.28717041015625, 1.373321533203125, 1.45947265625, 1.545623779296875, 1.63177490234375, 1.717926025390625, 1.8040771484375, 1.890228271484375, 1.97637939453125, 2.062530517578125, 2.148681640625, 2.234832763671875, 2.32098388671875, 2.407135009765625, 2.4932861328125, 2.579437255859375, 2.66558837890625, 2.751739501953125, 2.837890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 15.0, 17.0, 24.0, 37.0, 51.0, 73.0, 79.0, 89.0, 91.0, 105.0, 100.0, 76.0, 88.0, 45.0, 46.0, 21.0, 19.0, 14.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.82275390625, -0.8056755065917969, -0.7885971069335938, -0.7715187072753906, -0.7544403076171875, -0.7373619079589844, -0.7202835083007812, -0.7032051086425781, -0.686126708984375, -0.6690483093261719, -0.6519699096679688, -0.6348915100097656, -0.6178131103515625, -0.6007347106933594, -0.5836563110351562, -0.5665779113769531, -0.54949951171875, -0.5324211120605469, -0.5153427124023438, -0.4982643127441406, -0.4811859130859375, -0.4641075134277344, -0.44702911376953125, -0.4299507141113281, -0.412872314453125, -0.3957939147949219, -0.37871551513671875, -0.3616371154785156, -0.3445587158203125, -0.3274803161621094, -0.31040191650390625, -0.2933235168457031, -0.2762451171875, -0.2591667175292969, -0.24208831787109375, -0.22500991821289062, -0.2079315185546875, -0.19085311889648438, -0.17377471923828125, -0.15669631958007812, -0.139617919921875, -0.12253952026367188, -0.10546112060546875, -0.08838272094726562, -0.0713043212890625, -0.054225921630859375, -0.03714752197265625, -0.020069122314453125, -0.00299072265625, 0.014087677001953125, 0.03116607666015625, 0.048244476318359375, 0.0653228759765625, 0.08240127563476562, 0.09947967529296875, 0.11655807495117188, 0.133636474609375, 0.15071487426757812, 0.16779327392578125, 0.18487167358398438, 0.2019500732421875, 0.21902847290039062, 0.23610687255859375, 0.2531852722167969, 0.270263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 8.0, 11.0, 14.0, 16.0, 27.0, 36.0, 55.0, 56.0, 103.0, 155.0, 255.0, 376.0, 741.0, 1231.0, 2439.0, 5183.0, 11766.0, 29646.0, 83236.0, 260651.0, 412154.0, 153994.0, 51547.0, 18989.0, 7972.0, 3561.0, 1840.0, 994.0, 562.0, 281.0, 221.0, 128.0, 84.0, 59.0, 31.0, 36.0, 24.0, 16.0, 13.0, 14.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.91943359375, -0.892608642578125, -0.86578369140625, -0.838958740234375, -0.8121337890625, -0.785308837890625, -0.75848388671875, -0.731658935546875, -0.704833984375, -0.678009033203125, -0.65118408203125, -0.624359130859375, -0.5975341796875, -0.570709228515625, -0.54388427734375, -0.517059326171875, -0.490234375, -0.463409423828125, -0.43658447265625, -0.409759521484375, -0.3829345703125, -0.356109619140625, -0.32928466796875, -0.302459716796875, -0.275634765625, -0.248809814453125, -0.22198486328125, -0.195159912109375, -0.1683349609375, -0.141510009765625, -0.11468505859375, -0.087860107421875, -0.06103515625, -0.034210205078125, -0.00738525390625, 0.019439697265625, 0.0462646484375, 0.073089599609375, 0.09991455078125, 0.126739501953125, 0.153564453125, 0.180389404296875, 0.20721435546875, 0.234039306640625, 0.2608642578125, 0.287689208984375, 0.31451416015625, 0.341339111328125, 0.3681640625, 0.394989013671875, 0.42181396484375, 0.448638916015625, 0.4754638671875, 0.502288818359375, 0.52911376953125, 0.555938720703125, 0.582763671875, 0.609588623046875, 0.63641357421875, 0.663238525390625, 0.6900634765625, 0.716888427734375, 0.74371337890625, 0.770538330078125, 0.79736328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 10.0, 7.0, 17.0, 15.0, 20.0, 24.0, 22.0, 29.0, 36.0, 32.0, 45.0, 33.0, 50.0, 47.0, 42.0, 47.0, 41.0, 54.0, 42.0, 38.0, 41.0, 40.0, 36.0, 28.0, 41.0, 24.0, 20.0, 20.0, 19.0, 21.0, 9.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3212890625, -1.2852249145507812, -1.2491607666015625, -1.2130966186523438, -1.177032470703125, -1.1409683227539062, -1.1049041748046875, -1.0688400268554688, -1.03277587890625, -0.9967117309570312, -0.9606475830078125, -0.9245834350585938, -0.888519287109375, -0.8524551391601562, -0.8163909912109375, -0.7803268432617188, -0.7442626953125, -0.7081985473632812, -0.6721343994140625, -0.6360702514648438, -0.600006103515625, -0.5639419555664062, -0.5278778076171875, -0.49181365966796875, -0.45574951171875, -0.41968536376953125, -0.3836212158203125, -0.34755706787109375, -0.311492919921875, -0.27542877197265625, -0.2393646240234375, -0.20330047607421875, -0.167236328125, -0.13117218017578125, -0.0951080322265625, -0.05904388427734375, -0.022979736328125, 0.01308441162109375, 0.0491485595703125, 0.08521270751953125, 0.12127685546875, 0.15734100341796875, 0.1934051513671875, 0.22946929931640625, 0.265533447265625, 0.30159759521484375, 0.3376617431640625, 0.37372589111328125, 0.4097900390625, 0.44585418701171875, 0.4819183349609375, 0.5179824829101562, 0.554046630859375, 0.5901107788085938, 0.6261749267578125, 0.6622390747070312, 0.69830322265625, 0.7343673706054688, 0.7704315185546875, 0.8064956665039062, 0.842559814453125, 0.8786239624023438, 0.9146881103515625, 0.9507522583007812, 0.98681640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 31.0, 55.0, 135.0, 333.0, 993.0, 3575.0, 21748.0, 423834.0, 566554.0, 25601.0, 4067.0, 1005.0, 334.0, 139.0, 64.0, 32.0, 13.0, 8.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1084136962890625, -1.067413330078125, -1.0264129638671875, -0.98541259765625, -0.9444122314453125, -0.903411865234375, -0.8624114990234375, -0.8214111328125, -0.7804107666015625, -0.739410400390625, -0.6984100341796875, -0.65740966796875, -0.6164093017578125, -0.575408935546875, -0.5344085693359375, -0.493408203125, -0.4524078369140625, -0.411407470703125, -0.3704071044921875, -0.32940673828125, -0.2884063720703125, -0.247406005859375, -0.2064056396484375, -0.1654052734375, -0.1244049072265625, -0.083404541015625, -0.0424041748046875, -0.00140380859375, 0.0395965576171875, 0.080596923828125, 0.1215972900390625, 0.16259765625, 0.2035980224609375, 0.244598388671875, 0.2855987548828125, 0.32659912109375, 0.3675994873046875, 0.408599853515625, 0.4496002197265625, 0.4906005859375, 0.5316009521484375, 0.572601318359375, 0.6136016845703125, 0.65460205078125, 0.6956024169921875, 0.736602783203125, 0.7776031494140625, 0.818603515625, 0.8596038818359375, 0.900604248046875, 0.9416046142578125, 0.98260498046875, 1.0236053466796875, 1.064605712890625, 1.1056060791015625, 1.1466064453125, 1.1876068115234375, 1.228607177734375, 1.2696075439453125, 1.31060791015625, 1.3516082763671875, 1.392608642578125, 1.4336090087890625, 1.474609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 16.0, 17.0, 29.0, 38.0, 68.0, 95.0, 213.0, 185.0, 97.0, 69.0, 46.0, 33.0, 21.0, 10.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0002237558364868164, -0.0002175401896238327, -0.000211324542760849, -0.0002051088958978653, -0.0001988932490348816, -0.0001926776021718979, -0.00018646195530891418, -0.00018024630844593048, -0.00017403066158294678, -0.00016781501471996307, -0.00016159936785697937, -0.00015538372099399567, -0.00014916807413101196, -0.00014295242726802826, -0.00013673678040504456, -0.00013052113354206085, -0.00012430548667907715, -0.00011808983981609344, -0.00011187419295310974, -0.00010565854609012604, -9.944289922714233e-05, -9.322725236415863e-05, -8.701160550117493e-05, -8.079595863819122e-05, -7.458031177520752e-05, -6.836466491222382e-05, -6.214901804924011e-05, -5.593337118625641e-05, -4.9717724323272705e-05, -4.3502077460289e-05, -3.72864305973053e-05, -3.1070783734321594e-05, -2.485513687133789e-05, -1.8639490008354187e-05, -1.2423843145370483e-05, -6.20819628238678e-06, 7.450580596923828e-09, 6.2230974435806274e-06, 1.2438744306564331e-05, 1.8654391169548035e-05, 2.4870038032531738e-05, 3.108568489551544e-05, 3.7301331758499146e-05, 4.351697862148285e-05, 4.973262548446655e-05, 5.5948272347450256e-05, 6.216391921043396e-05, 6.837956607341766e-05, 7.459521293640137e-05, 8.081085979938507e-05, 8.702650666236877e-05, 9.324215352535248e-05, 9.945780038833618e-05, 0.00010567344725131989, 0.00011188909411430359, 0.00011810474097728729, 0.000124320387840271, 0.0001305360347032547, 0.0001367516815662384, 0.0001429673284292221, 0.0001491829752922058, 0.00015539862215518951, 0.00016161426901817322, 0.00016782991588115692, 0.00017404556274414062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 2.0, 6.0, 10.0, 20.0, 49.0, 65.0, 112.0, 163.0, 294.0, 491.0, 1061.0, 2417.0, 6516.0, 23285.0, 123556.0, 706337.0, 145752.0, 26242.0, 7223.0, 2589.0, 1081.0, 539.0, 270.0, 185.0, 85.0, 64.0, 32.0, 25.0, 16.0, 11.0, 13.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.82373046875, -0.7958450317382812, -0.7679595947265625, -0.7400741577148438, -0.712188720703125, -0.6843032836914062, -0.6564178466796875, -0.6285324096679688, -0.60064697265625, -0.5727615356445312, -0.5448760986328125, -0.5169906616210938, -0.489105224609375, -0.46121978759765625, -0.4333343505859375, -0.40544891357421875, -0.3775634765625, -0.34967803955078125, -0.3217926025390625, -0.29390716552734375, -0.266021728515625, -0.23813629150390625, -0.2102508544921875, -0.18236541748046875, -0.15447998046875, -0.12659454345703125, -0.0987091064453125, -0.07082366943359375, -0.042938232421875, -0.01505279541015625, 0.0128326416015625, 0.04071807861328125, 0.068603515625, 0.09648895263671875, 0.1243743896484375, 0.15225982666015625, 0.180145263671875, 0.20803070068359375, 0.2359161376953125, 0.26380157470703125, 0.29168701171875, 0.31957244873046875, 0.3474578857421875, 0.37534332275390625, 0.403228759765625, 0.43111419677734375, 0.4589996337890625, 0.48688507080078125, 0.5147705078125, 0.5426559448242188, 0.5705413818359375, 0.5984268188476562, 0.626312255859375, 0.6541976928710938, 0.6820831298828125, 0.7099685668945312, 0.73785400390625, 0.7657394409179688, 0.7936248779296875, 0.8215103149414062, 0.849395751953125, 0.8772811889648438, 0.9051666259765625, 0.9330520629882812, 0.9609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 4.0, 9.0, 8.0, 11.0, 17.0, 29.0, 39.0, 34.0, 87.0, 116.0, 168.0, 143.0, 101.0, 73.0, 34.0, 25.0, 32.0, 20.0, 13.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5762786865234375, -0.550994873046875, -0.5257110595703125, -0.50042724609375, -0.4751434326171875, -0.449859619140625, -0.4245758056640625, -0.3992919921875, -0.3740081787109375, -0.348724365234375, -0.3234405517578125, -0.29815673828125, -0.2728729248046875, -0.247589111328125, -0.2223052978515625, -0.197021484375, -0.1717376708984375, -0.146453857421875, -0.1211700439453125, -0.09588623046875, -0.0706024169921875, -0.045318603515625, -0.0200347900390625, 0.0052490234375, 0.0305328369140625, 0.055816650390625, 0.0811004638671875, 0.10638427734375, 0.1316680908203125, 0.156951904296875, 0.1822357177734375, 0.20751953125, 0.2328033447265625, 0.258087158203125, 0.2833709716796875, 0.30865478515625, 0.3339385986328125, 0.359222412109375, 0.3845062255859375, 0.4097900390625, 0.4350738525390625, 0.460357666015625, 0.4856414794921875, 0.51092529296875, 0.5362091064453125, 0.561492919921875, 0.5867767333984375, 0.612060546875, 0.6373443603515625, 0.662628173828125, 0.6879119873046875, 0.71319580078125, 0.7384796142578125, 0.763763427734375, 0.7890472412109375, 0.8143310546875, 0.8396148681640625, 0.864898681640625, 0.8901824951171875, 0.91546630859375, 0.9407501220703125, 0.966033935546875, 0.9913177490234375, 1.0166015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 16.0, 45.0, 139.0, 303.0, 301.0, 134.0, 46.0, 17.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.357422828674316, -9.661396980285645, -8.965370178222656, -8.269344329833984, -7.5733184814453125, -6.877292633056641, -6.1812663078308105, -5.4852399826049805, -4.789214134216309, -4.093188285827637, -3.3971619606018066, -2.7011358737945557, -2.0051097869873047, -1.3090837001800537, -0.6130576133728027, 0.08296871185302734, 0.7789945602416992, 1.4750206470489502, 2.171046733856201, 2.867072820663452, 3.563098907470703, 4.259124755859375, 4.955151081085205, 5.651177406311035, 6.347203254699707, 7.043229103088379, 7.739255428314209, 8.435281753540039, 9.131307601928711, 9.827333450317383, 10.523359298706055, 11.219386100769043, 11.915412902832031, 12.611438751220703, 13.307464599609375, 14.003491401672363, 14.699517250061035, 15.395543098449707, 16.091569900512695, 16.787595748901367, 17.48362159729004, 18.17964744567871, 18.875673294067383, 19.571699142456055, 20.26772689819336, 20.96375274658203, 21.659778594970703, 22.355804443359375, 23.051830291748047, 23.74785614013672, 24.44388198852539, 25.139907836914062, 25.835933685302734, 26.53196144104004, 27.22798728942871, 27.924013137817383, 28.620038986206055, 29.316064834594727, 30.0120906829834, 30.70811653137207, 31.404144287109375, 32.10017013549805, 32.79619598388672, 33.49222183227539, 34.18824768066406]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 4.0, 8.0, 8.0, 9.0, 9.0, 14.0, 11.0, 17.0, 13.0, 25.0, 26.0, 29.0, 30.0, 23.0, 25.0, 27.0, 30.0, 33.0, 26.0, 28.0, 41.0, 32.0, 33.0, 33.0, 43.0, 41.0, 38.0, 37.0, 32.0, 21.0, 26.0, 27.0, 33.0, 19.0, 17.0, 24.0, 7.0, 13.0, 11.0, 8.0, 13.0, 6.0, 9.0, 9.0, 4.0, 4.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0], "bins": [-4.9556121826171875, -4.808562755584717, -4.661513328552246, -4.514464378356934, -4.367414951324463, -4.220365524291992, -4.0733160972595215, -3.926266670227051, -3.779217481613159, -3.6321680545806885, -3.485118865966797, -3.338069438934326, -3.1910200119018555, -3.043970823287964, -2.896921396255493, -2.7498722076416016, -2.602822780609131, -2.45577335357666, -2.3087241649627686, -2.161674737930298, -2.0146255493164062, -1.8675761222839355, -1.7205266952514648, -1.5734773874282837, -1.4264280796051025, -1.2793787717819214, -1.1323294639587402, -0.9852800369262695, -0.8382307291030884, -0.6911814212799072, -0.5441320538520813, -0.39708268642425537, -0.2500333786010742, -0.10298404097557068, 0.04406529664993286, 0.1911146342754364, 0.33816397190093994, 0.4852132797241211, 0.632262647151947, 0.779312014579773, 0.9263613224029541, 1.0734106302261353, 1.2204599380493164, 1.367509365081787, 1.5145586729049683, 1.6616079807281494, 1.8086574077606201, 1.9557067155838013, 2.1027560234069824, 2.249805450439453, 2.3968546390533447, 2.5439040660858154, 2.690953254699707, 2.8380026817321777, 2.9850521087646484, 3.132101535797119, 3.2791507244110107, 3.4262001514434814, 3.573249340057373, 3.7202987670898438, 3.8673481941223145, 4.014397621154785, 4.161446571350098, 4.308495998382568, 4.455545425415039]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 11.0, 20.0, 27.0, 30.0, 51.0, 64.0, 119.0, 169.0, 244.0, 486.0, 877.0, 2113.0, 6469.0, 33016.0, 3890135.0, 237338.0, 15803.0, 4101.0, 1547.0, 692.0, 363.0, 191.0, 129.0, 80.0, 58.0, 40.0, 25.0, 16.0, 8.0, 7.0, 6.0, 8.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.537109375, -3.425872802734375, -3.31463623046875, -3.203399658203125, -3.0921630859375, -2.980926513671875, -2.86968994140625, -2.758453369140625, -2.647216796875, -2.535980224609375, -2.42474365234375, -2.313507080078125, -2.2022705078125, -2.091033935546875, -1.97979736328125, -1.868560791015625, -1.75732421875, -1.646087646484375, -1.53485107421875, -1.423614501953125, -1.3123779296875, -1.201141357421875, -1.08990478515625, -0.978668212890625, -0.867431640625, -0.756195068359375, -0.64495849609375, -0.533721923828125, -0.4224853515625, -0.311248779296875, -0.20001220703125, -0.088775634765625, 0.0224609375, 0.133697509765625, 0.24493408203125, 0.356170654296875, 0.4674072265625, 0.578643798828125, 0.68988037109375, 0.801116943359375, 0.912353515625, 1.023590087890625, 1.13482666015625, 1.246063232421875, 1.3572998046875, 1.468536376953125, 1.57977294921875, 1.691009521484375, 1.80224609375, 1.913482666015625, 2.02471923828125, 2.135955810546875, 2.2471923828125, 2.358428955078125, 2.46966552734375, 2.580902099609375, 2.692138671875, 2.803375244140625, 2.91461181640625, 3.025848388671875, 3.1370849609375, 3.248321533203125, 3.35955810546875, 3.470794677734375, 3.58203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 27.0, 32.0, 38.0, 47.0, 67.0, 61.0, 59.0, 70.0, 60.0, 70.0, 64.0, 71.0, 69.0, 50.0, 35.0, 40.0, 27.0, 18.0, 13.0, 15.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.38513946533203125, -0.3720855712890625, -0.35903167724609375, -0.345977783203125, -0.33292388916015625, -0.3198699951171875, -0.30681610107421875, -0.29376220703125, -0.28070831298828125, -0.2676544189453125, -0.25460052490234375, -0.241546630859375, -0.22849273681640625, -0.2154388427734375, -0.20238494873046875, -0.1893310546875, -0.17627716064453125, -0.1632232666015625, -0.15016937255859375, -0.137115478515625, -0.12406158447265625, -0.1110076904296875, -0.09795379638671875, -0.08489990234375, -0.07184600830078125, -0.0587921142578125, -0.04573822021484375, -0.032684326171875, -0.01963043212890625, -0.0065765380859375, 0.00647735595703125, 0.01953125, 0.03258514404296875, 0.0456390380859375, 0.05869293212890625, 0.071746826171875, 0.08480072021484375, 0.0978546142578125, 0.11090850830078125, 0.12396240234375, 0.13701629638671875, 0.1500701904296875, 0.16312408447265625, 0.176177978515625, 0.18923187255859375, 0.2022857666015625, 0.21533966064453125, 0.2283935546875, 0.24144744873046875, 0.2545013427734375, 0.26755523681640625, 0.280609130859375, 0.29366302490234375, 0.3067169189453125, 0.31977081298828125, 0.33282470703125, 0.34587860107421875, 0.3589324951171875, 0.37198638916015625, 0.385040283203125, 0.39809417724609375, 0.4111480712890625, 0.42420196533203125, 0.437255859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 8.0, 4.0, 9.0, 13.0, 17.0, 17.0, 16.0, 32.0, 33.0, 57.0, 46.0, 76.0, 140.0, 198.0, 366.0, 646.0, 1260.0, 2844.0, 7486.0, 24250.0, 146692.0, 3809241.0, 161855.0, 25177.0, 7615.0, 3045.0, 1389.0, 703.0, 379.0, 192.0, 135.0, 88.0, 52.0, 49.0, 37.0, 24.0, 17.0, 16.0, 16.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.159271240234375, -2.08612060546875, -2.012969970703125, -1.9398193359375, -1.866668701171875, -1.79351806640625, -1.720367431640625, -1.647216796875, -1.574066162109375, -1.50091552734375, -1.427764892578125, -1.3546142578125, -1.281463623046875, -1.20831298828125, -1.135162353515625, -1.06201171875, -0.988861083984375, -0.91571044921875, -0.842559814453125, -0.7694091796875, -0.696258544921875, -0.62310791015625, -0.549957275390625, -0.476806640625, -0.403656005859375, -0.33050537109375, -0.257354736328125, -0.1842041015625, -0.111053466796875, -0.03790283203125, 0.035247802734375, 0.1083984375, 0.181549072265625, 0.25469970703125, 0.327850341796875, 0.4010009765625, 0.474151611328125, 0.54730224609375, 0.620452880859375, 0.693603515625, 0.766754150390625, 0.83990478515625, 0.913055419921875, 0.9862060546875, 1.059356689453125, 1.13250732421875, 1.205657958984375, 1.27880859375, 1.351959228515625, 1.42510986328125, 1.498260498046875, 1.5714111328125, 1.644561767578125, 1.71771240234375, 1.790863037109375, 1.864013671875, 1.937164306640625, 2.01031494140625, 2.083465576171875, 2.1566162109375, 2.229766845703125, 2.30291748046875, 2.376068115234375, 2.44921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 11.0, 8.0, 17.0, 23.0, 37.0, 68.0, 171.0, 802.0, 2355.0, 337.0, 112.0, 54.0, 28.0, 19.0, 13.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4609222412109375, -1.416961669921875, -1.3730010986328125, -1.32904052734375, -1.2850799560546875, -1.241119384765625, -1.1971588134765625, -1.1531982421875, -1.1092376708984375, -1.065277099609375, -1.0213165283203125, -0.97735595703125, -0.9333953857421875, -0.889434814453125, -0.8454742431640625, -0.801513671875, -0.7575531005859375, -0.713592529296875, -0.6696319580078125, -0.62567138671875, -0.5817108154296875, -0.537750244140625, -0.4937896728515625, -0.4498291015625, -0.4058685302734375, -0.361907958984375, -0.3179473876953125, -0.27398681640625, -0.2300262451171875, -0.186065673828125, -0.1421051025390625, -0.09814453125, -0.0541839599609375, -0.010223388671875, 0.0337371826171875, 0.07769775390625, 0.1216583251953125, 0.165618896484375, 0.2095794677734375, 0.2535400390625, 0.2975006103515625, 0.341461181640625, 0.3854217529296875, 0.42938232421875, 0.4733428955078125, 0.517303466796875, 0.5612640380859375, 0.605224609375, 0.6491851806640625, 0.693145751953125, 0.7371063232421875, 0.78106689453125, 0.8250274658203125, 0.868988037109375, 0.9129486083984375, 0.9569091796875, 1.0008697509765625, 1.044830322265625, 1.0887908935546875, 1.13275146484375, 1.1767120361328125, 1.220672607421875, 1.2646331787109375, 1.30859375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 23.0, 59.0, 110.0, 225.0, 260.0, 163.0, 85.0, 34.0, 17.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.926462173461914, -13.630342483520508, -13.334223747253418, -13.038104057312012, -12.741984367370605, -12.4458646774292, -12.14974594116211, -11.853626251220703, -11.557506561279297, -11.26138687133789, -10.9652681350708, -10.669148445129395, -10.373028755187988, -10.076909065246582, -9.780790328979492, -9.484670639038086, -9.18855094909668, -8.892431259155273, -8.596312522888184, -8.300192832946777, -8.004073143005371, -7.707953929901123, -7.411834716796875, -7.115715026855469, -6.819596290588379, -6.523477077484131, -6.227357387542725, -5.931238174438477, -5.63511848449707, -5.338999271392822, -5.042880058288574, -4.746760368347168, -4.4506402015686035, -4.1545209884643555, -3.858401298522949, -3.562282085418701, -3.266162395477295, -2.970043182373047, -2.6739237308502197, -2.3778042793273926, -2.0816848278045654, -1.7855653762817383, -1.4894459247589111, -1.1933265924453735, -0.8972071409225464, -0.6010876893997192, -0.30496835708618164, -0.008848905563354492, 0.28727054595947266, 0.5833899974822998, 0.8795093894004822, 1.1756287813186646, 1.4717482328414917, 1.7678676843643188, 2.0639870166778564, 2.3601064682006836, 2.6562259197235107, 2.952345371246338, 3.248464822769165, 3.544584274291992, 3.8407034873962402, 4.1368231773376465, 4.4329423904418945, 4.729062080383301, 5.025181293487549]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 12.0, 21.0, 21.0, 20.0, 28.0, 30.0, 29.0, 43.0, 54.0, 56.0, 51.0, 58.0, 60.0, 64.0, 46.0, 59.0, 58.0, 51.0, 38.0, 45.0, 35.0, 32.0, 20.0, 16.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5452940464019775, -3.439828395843506, -3.334362745285034, -3.2288970947265625, -3.1234312057495117, -3.017965793609619, -2.9124999046325684, -2.8070342540740967, -2.701568603515625, -2.5961029529571533, -2.4906373023986816, -2.38517165184021, -2.2797060012817383, -2.1742401123046875, -2.068774461746216, -1.9633088111877441, -1.8578431606292725, -1.7523775100708008, -1.646911859512329, -1.5414460897445679, -1.4359804391860962, -1.3305147886276245, -1.2250490188598633, -1.1195833683013916, -1.01411771774292, -0.9086520671844482, -0.8031863570213318, -0.6977206468582153, -0.5922549962997437, -0.486789345741272, -0.3813236355781555, -0.27585792541503906, -0.17039251327514648, -0.06492683291435242, 0.04053884744644165, 0.14600452780723572, 0.2514702081680298, 0.35693585872650146, 0.4624015688896179, 0.5678672790527344, 0.673332929611206, 0.7787985801696777, 0.8842642903327942, 0.9897300004959106, 1.0951956510543823, 1.200661301612854, 1.3061270713806152, 1.411592721939087, 1.5170583724975586, 1.6225240230560303, 1.727989673614502, 1.8334554433822632, 1.9389210939407349, 2.044386863708496, 2.1498525142669678, 2.2553181648254395, 2.360783815383911, 2.466249465942383, 2.5717151165008545, 2.677180767059326, 2.782646656036377, 2.8881120681762695, 2.9935779571533203, 3.099043607711792, 3.2045092582702637]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 5.0, 13.0, 11.0, 13.0, 27.0, 58.0, 91.0, 147.0, 243.0, 542.0, 1243.0, 3367.0, 12917.0, 83437.0, 646667.0, 260109.0, 29885.0, 6250.0, 1891.0, 765.0, 380.0, 190.0, 106.0, 63.0, 38.0, 32.0, 14.0, 14.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.662445068359375, -2.57293701171875, -2.483428955078125, -2.3939208984375, -2.304412841796875, -2.21490478515625, -2.125396728515625, -2.035888671875, -1.946380615234375, -1.85687255859375, -1.767364501953125, -1.6778564453125, -1.588348388671875, -1.49884033203125, -1.409332275390625, -1.31982421875, -1.230316162109375, -1.14080810546875, -1.051300048828125, -0.9617919921875, -0.872283935546875, -0.78277587890625, -0.693267822265625, -0.603759765625, -0.514251708984375, -0.42474365234375, -0.335235595703125, -0.2457275390625, -0.156219482421875, -0.06671142578125, 0.022796630859375, 0.1123046875, 0.201812744140625, 0.29132080078125, 0.380828857421875, 0.4703369140625, 0.559844970703125, 0.64935302734375, 0.738861083984375, 0.828369140625, 0.917877197265625, 1.00738525390625, 1.096893310546875, 1.1864013671875, 1.275909423828125, 1.36541748046875, 1.454925537109375, 1.54443359375, 1.633941650390625, 1.72344970703125, 1.812957763671875, 1.9024658203125, 1.991973876953125, 2.08148193359375, 2.170989990234375, 2.260498046875, 2.350006103515625, 2.43951416015625, 2.529022216796875, 2.6185302734375, 2.708038330078125, 2.79754638671875, 2.887054443359375, 2.9765625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 27.0, 25.0, 42.0, 62.0, 53.0, 90.0, 80.0, 88.0, 92.0, 91.0, 78.0, 69.0, 47.0, 33.0, 24.0, 23.0, 17.0, 13.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6199264526367188, -0.6016693115234375, -0.5834121704101562, -0.565155029296875, -0.5468978881835938, -0.5286407470703125, -0.5103836059570312, -0.49212646484375, -0.47386932373046875, -0.4556121826171875, -0.43735504150390625, -0.419097900390625, -0.40084075927734375, -0.3825836181640625, -0.36432647705078125, -0.3460693359375, -0.32781219482421875, -0.3095550537109375, -0.29129791259765625, -0.273040771484375, -0.25478363037109375, -0.2365264892578125, -0.21826934814453125, -0.20001220703125, -0.18175506591796875, -0.1634979248046875, -0.14524078369140625, -0.126983642578125, -0.10872650146484375, -0.0904693603515625, -0.07221221923828125, -0.053955078125, -0.03569793701171875, -0.0174407958984375, 0.00081634521484375, 0.019073486328125, 0.03733062744140625, 0.0555877685546875, 0.07384490966796875, 0.09210205078125, 0.11035919189453125, 0.1286163330078125, 0.14687347412109375, 0.165130615234375, 0.18338775634765625, 0.2016448974609375, 0.21990203857421875, 0.2381591796875, 0.25641632080078125, 0.2746734619140625, 0.29293060302734375, 0.311187744140625, 0.32944488525390625, 0.3477020263671875, 0.36595916748046875, 0.38421630859375, 0.40247344970703125, 0.4207305908203125, 0.43898773193359375, 0.457244873046875, 0.47550201416015625, 0.4937591552734375, 0.5120162963867188, 0.5302734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 9.0, 12.0, 14.0, 10.0, 31.0, 29.0, 52.0, 89.0, 123.0, 184.0, 263.0, 482.0, 867.0, 1751.0, 3553.0, 8215.0, 20729.0, 57746.0, 192856.0, 467853.0, 197738.0, 59014.0, 21018.0, 8409.0, 3639.0, 1698.0, 850.0, 467.0, 293.0, 166.0, 108.0, 79.0, 63.0, 42.0, 22.0, 16.0, 17.0, 14.0, 5.0, 9.0, 6.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0947265625, -1.054931640625, -1.01513671875, -0.975341796875, -0.935546875, -0.895751953125, -0.85595703125, -0.816162109375, -0.7763671875, -0.736572265625, -0.69677734375, -0.656982421875, -0.6171875, -0.577392578125, -0.53759765625, -0.497802734375, -0.4580078125, -0.418212890625, -0.37841796875, -0.338623046875, -0.298828125, -0.259033203125, -0.21923828125, -0.179443359375, -0.1396484375, -0.099853515625, -0.06005859375, -0.020263671875, 0.01953125, 0.059326171875, 0.09912109375, 0.138916015625, 0.1787109375, 0.218505859375, 0.25830078125, 0.298095703125, 0.337890625, 0.377685546875, 0.41748046875, 0.457275390625, 0.4970703125, 0.536865234375, 0.57666015625, 0.616455078125, 0.65625, 0.696044921875, 0.73583984375, 0.775634765625, 0.8154296875, 0.855224609375, 0.89501953125, 0.934814453125, 0.974609375, 1.014404296875, 1.05419921875, 1.093994140625, 1.1337890625, 1.173583984375, 1.21337890625, 1.253173828125, 1.29296875, 1.332763671875, 1.37255859375, 1.412353515625, 1.4521484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 15.0, 12.0, 16.0, 24.0, 24.0, 23.0, 35.0, 28.0, 30.0, 34.0, 33.0, 41.0, 38.0, 45.0, 37.0, 39.0, 48.0, 48.0, 51.0, 45.0, 35.0, 33.0, 28.0, 24.0, 34.0, 28.0, 23.0, 25.0, 11.0, 16.0, 11.0, 12.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.49609375, -1.448974609375, -1.40185546875, -1.354736328125, -1.3076171875, -1.260498046875, -1.21337890625, -1.166259765625, -1.119140625, -1.072021484375, -1.02490234375, -0.977783203125, -0.9306640625, -0.883544921875, -0.83642578125, -0.789306640625, -0.7421875, -0.695068359375, -0.64794921875, -0.600830078125, -0.5537109375, -0.506591796875, -0.45947265625, -0.412353515625, -0.365234375, -0.318115234375, -0.27099609375, -0.223876953125, -0.1767578125, -0.129638671875, -0.08251953125, -0.035400390625, 0.01171875, 0.058837890625, 0.10595703125, 0.153076171875, 0.2001953125, 0.247314453125, 0.29443359375, 0.341552734375, 0.388671875, 0.435791015625, 0.48291015625, 0.530029296875, 0.5771484375, 0.624267578125, 0.67138671875, 0.718505859375, 0.765625, 0.812744140625, 0.85986328125, 0.906982421875, 0.9541015625, 1.001220703125, 1.04833984375, 1.095458984375, 1.142578125, 1.189697265625, 1.23681640625, 1.283935546875, 1.3310546875, 1.378173828125, 1.42529296875, 1.472412109375, 1.51953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 9.0, 11.0, 12.0, 27.0, 41.0, 64.0, 92.0, 165.0, 323.0, 633.0, 1395.0, 3405.0, 9954.0, 39735.0, 241191.0, 580491.0, 134770.0, 24670.0, 6790.0, 2635.0, 1064.0, 480.0, 264.0, 141.0, 79.0, 33.0, 22.0, 17.0, 15.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5481948852539062, -0.5265655517578125, -0.5049362182617188, -0.483306884765625, -0.46167755126953125, -0.4400482177734375, -0.41841888427734375, -0.39678955078125, -0.37516021728515625, -0.3535308837890625, -0.33190155029296875, -0.310272216796875, -0.28864288330078125, -0.2670135498046875, -0.24538421630859375, -0.2237548828125, -0.20212554931640625, -0.1804962158203125, -0.15886688232421875, -0.137237548828125, -0.11560821533203125, -0.0939788818359375, -0.07234954833984375, -0.05072021484375, -0.02909088134765625, -0.0074615478515625, 0.01416778564453125, 0.035797119140625, 0.05742645263671875, 0.0790557861328125, 0.10068511962890625, 0.122314453125, 0.14394378662109375, 0.1655731201171875, 0.18720245361328125, 0.208831787109375, 0.23046112060546875, 0.2520904541015625, 0.27371978759765625, 0.29534912109375, 0.31697845458984375, 0.3386077880859375, 0.36023712158203125, 0.381866455078125, 0.40349578857421875, 0.4251251220703125, 0.44675445556640625, 0.4683837890625, 0.49001312255859375, 0.5116424560546875, 0.5332717895507812, 0.554901123046875, 0.5765304565429688, 0.5981597900390625, 0.6197891235351562, 0.64141845703125, 0.6630477905273438, 0.6846771240234375, 0.7063064575195312, 0.727935791015625, 0.7495651245117188, 0.7711944580078125, 0.7928237915039062, 0.814453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 5.0, 9.0, 14.0, 23.0, 20.0, 23.0, 20.0, 50.0, 67.0, 62.0, 72.0, 74.0, 106.0, 75.0, 76.0, 59.0, 45.0, 29.0, 39.0, 26.0, 15.0, 17.0, 17.0, 9.0, 3.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.00011461973190307617, -0.0001112818717956543, -0.00010794401168823242, -0.00010460615158081055, -0.00010126829147338867, -9.79304313659668e-05, -9.459257125854492e-05, -9.125471115112305e-05, -8.791685104370117e-05, -8.45789909362793e-05, -8.124113082885742e-05, -7.790327072143555e-05, -7.456541061401367e-05, -7.12275505065918e-05, -6.788969039916992e-05, -6.455183029174805e-05, -6.121397018432617e-05, -5.78761100769043e-05, -5.453824996948242e-05, -5.120038986206055e-05, -4.786252975463867e-05, -4.45246696472168e-05, -4.118680953979492e-05, -3.784894943237305e-05, -3.451108932495117e-05, -3.11732292175293e-05, -2.7835369110107422e-05, -2.4497509002685547e-05, -2.1159648895263672e-05, -1.7821788787841797e-05, -1.4483928680419922e-05, -1.1146068572998047e-05, -7.808208465576172e-06, -4.470348358154297e-06, -1.1324882507324219e-06, 2.205371856689453e-06, 5.543231964111328e-06, 8.881092071533203e-06, 1.2218952178955078e-05, 1.5556812286376953e-05, 1.8894672393798828e-05, 2.2232532501220703e-05, 2.5570392608642578e-05, 2.8908252716064453e-05, 3.224611282348633e-05, 3.55839729309082e-05, 3.892183303833008e-05, 4.225969314575195e-05, 4.559755325317383e-05, 4.89354133605957e-05, 5.227327346801758e-05, 5.561113357543945e-05, 5.894899368286133e-05, 6.22868537902832e-05, 6.562471389770508e-05, 6.896257400512695e-05, 7.230043411254883e-05, 7.56382942199707e-05, 7.897615432739258e-05, 8.231401443481445e-05, 8.565187454223633e-05, 8.89897346496582e-05, 9.232759475708008e-05, 9.566545486450195e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 11.0, 12.0, 11.0, 13.0, 32.0, 40.0, 41.0, 67.0, 114.0, 159.0, 263.0, 460.0, 764.0, 1517.0, 2899.0, 6152.0, 15138.0, 43561.0, 147426.0, 407335.0, 290175.0, 86116.0, 26992.0, 9966.0, 4358.0, 2140.0, 1140.0, 604.0, 351.0, 215.0, 159.0, 87.0, 68.0, 45.0, 32.0, 28.0, 18.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.55810546875, -0.5420608520507812, -0.5260162353515625, -0.5099716186523438, -0.493927001953125, -0.47788238525390625, -0.4618377685546875, -0.44579315185546875, -0.42974853515625, -0.41370391845703125, -0.3976593017578125, -0.38161468505859375, -0.365570068359375, -0.34952545166015625, -0.3334808349609375, -0.31743621826171875, -0.3013916015625, -0.28534698486328125, -0.2693023681640625, -0.25325775146484375, -0.237213134765625, -0.22116851806640625, -0.2051239013671875, -0.18907928466796875, -0.17303466796875, -0.15699005126953125, -0.1409454345703125, -0.12490081787109375, -0.108856201171875, -0.09281158447265625, -0.0767669677734375, -0.06072235107421875, -0.044677734375, -0.02863311767578125, -0.0125885009765625, 0.00345611572265625, 0.019500732421875, 0.03554534912109375, 0.0515899658203125, 0.06763458251953125, 0.08367919921875, 0.09972381591796875, 0.1157684326171875, 0.13181304931640625, 0.147857666015625, 0.16390228271484375, 0.1799468994140625, 0.19599151611328125, 0.2120361328125, 0.22808074951171875, 0.2441253662109375, 0.26016998291015625, 0.276214599609375, 0.29225921630859375, 0.3083038330078125, 0.32434844970703125, 0.34039306640625, 0.35643768310546875, 0.3724822998046875, 0.38852691650390625, 0.404571533203125, 0.42061614990234375, 0.4366607666015625, 0.45270538330078125, 0.46875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 19.0, 22.0, 29.0, 30.0, 28.0, 36.0, 48.0, 58.0, 52.0, 62.0, 67.0, 68.0, 64.0, 55.0, 48.0, 50.0, 33.0, 39.0, 35.0, 19.0, 19.0, 11.0, 8.0, 10.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4384765625, -0.42322540283203125, -0.4079742431640625, -0.39272308349609375, -0.377471923828125, -0.36222076416015625, -0.3469696044921875, -0.33171844482421875, -0.31646728515625, -0.30121612548828125, -0.2859649658203125, -0.27071380615234375, -0.255462646484375, -0.24021148681640625, -0.2249603271484375, -0.20970916748046875, -0.1944580078125, -0.17920684814453125, -0.1639556884765625, -0.14870452880859375, -0.133453369140625, -0.11820220947265625, -0.1029510498046875, -0.08769989013671875, -0.07244873046875, -0.05719757080078125, -0.0419464111328125, -0.02669525146484375, -0.011444091796875, 0.00380706787109375, 0.0190582275390625, 0.03430938720703125, 0.049560546875, 0.06481170654296875, 0.0800628662109375, 0.09531402587890625, 0.110565185546875, 0.12581634521484375, 0.1410675048828125, 0.15631866455078125, 0.17156982421875, 0.18682098388671875, 0.2020721435546875, 0.21732330322265625, 0.232574462890625, 0.24782562255859375, 0.2630767822265625, 0.27832794189453125, 0.2935791015625, 0.30883026123046875, 0.3240814208984375, 0.33933258056640625, 0.354583740234375, 0.36983489990234375, 0.3850860595703125, 0.40033721923828125, 0.41558837890625, 0.43083953857421875, 0.4460906982421875, 0.46134185791015625, 0.476593017578125, 0.49184417724609375, 0.5070953369140625, 0.5223464965820312, 0.53759765625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 13.0, 37.0, 57.0, 124.0, 173.0, 216.0, 170.0, 91.0, 45.0, 28.0, 15.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.201919555664062, -17.713300704956055, -17.224681854248047, -16.73606300354004, -16.24744415283203, -15.75882625579834, -15.270207405090332, -14.781588554382324, -14.292969703674316, -13.804350852966309, -13.3157320022583, -12.82711410522461, -12.338495254516602, -11.849876403808594, -11.361257553100586, -10.872638702392578, -10.38401985168457, -9.895401000976562, -9.406782150268555, -8.918163299560547, -8.429545402526855, -7.940926551818848, -7.45230770111084, -6.963688850402832, -6.475070953369141, -5.986452102661133, -5.497833728790283, -5.009214878082275, -4.520596027374268, -4.031977653503418, -3.54335880279541, -3.0547399520874023, -2.5661211013793945, -2.077502489089966, -1.588883638381958, -1.1002650260925293, -0.611646294593811, -0.12302756309509277, 0.36559104919433594, 0.8542098999023438, 1.3428285121917725, 1.8314472436904907, 2.320065975189209, 2.8086845874786377, 3.2973031997680664, 3.785922050476074, 4.274540901184082, 4.76315975189209, 5.2517781257629395, 5.740396976470947, 6.229015350341797, 6.717634201049805, 7.2062530517578125, 7.69487190246582, 8.183490753173828, 8.672109603881836, 9.160727500915527, 9.649346351623535, 10.137965202331543, 10.626583099365234, 11.115201950073242, 11.60382080078125, 12.092439651489258, 12.581058502197266, 13.069677352905273]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 8.0, 6.0, 12.0, 11.0, 22.0, 18.0, 21.0, 19.0, 35.0, 33.0, 28.0, 29.0, 32.0, 29.0, 34.0, 37.0, 44.0, 45.0, 37.0, 39.0, 47.0, 47.0, 41.0, 41.0, 37.0, 24.0, 23.0, 31.0, 22.0, 11.0, 23.0, 10.0, 14.0, 13.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 1.0], "bins": [-7.130097389221191, -6.913196086883545, -6.696294784545898, -6.479393482208252, -6.2624921798706055, -6.045590400695801, -5.828689098358154, -5.611787796020508, -5.394886493682861, -5.177985191345215, -4.961083889007568, -4.744182586669922, -4.527280807495117, -4.310379981994629, -4.093478202819824, -3.8765769004821777, -3.6596755981445312, -3.4427742958068848, -3.2258729934692383, -3.0089714527130127, -2.792070150375366, -2.5751688480377197, -2.358267307281494, -2.1413660049438477, -1.9244647026062012, -1.7075634002685547, -1.4906619787216187, -1.2737605571746826, -1.0568592548370361, -0.8399579524993896, -0.6230565309524536, -0.4061551094055176, -0.1892533302307129, 0.02764803171157837, 0.24454939365386963, 0.4614507555961609, 0.6783521175384521, 0.8952534198760986, 1.1121548414230347, 1.3290562629699707, 1.5459575653076172, 1.7628588676452637, 1.9797602891921997, 2.1966617107391357, 2.4135630130767822, 2.6304643154144287, 2.8473658561706543, 3.064267158508301, 3.2811684608459473, 3.4980697631835938, 3.7149710655212402, 3.931872606277466, 4.148774147033691, 4.36567497253418, 4.582576751708984, 4.799478054046631, 5.016379356384277, 5.233280658721924, 5.45018196105957, 5.667083263397217, 5.883984565734863, 6.100886344909668, 6.3177876472473145, 6.534688949584961, 6.751590251922607]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 16.0, 26.0, 27.0, 52.0, 67.0, 140.0, 241.0, 586.0, 1647.0, 8318.0, 4104591.0, 72613.0, 3931.0, 1074.0, 391.0, 208.0, 131.0, 75.0, 37.0, 24.0, 19.0, 15.0, 5.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.271331787109375, -4.15203857421875, -4.032745361328125, -3.9134521484375, -3.794158935546875, -3.67486572265625, -3.555572509765625, -3.436279296875, -3.316986083984375, -3.19769287109375, -3.078399658203125, -2.9591064453125, -2.839813232421875, -2.72052001953125, -2.601226806640625, -2.48193359375, -2.362640380859375, -2.24334716796875, -2.124053955078125, -2.0047607421875, -1.885467529296875, -1.76617431640625, -1.646881103515625, -1.527587890625, -1.408294677734375, -1.28900146484375, -1.169708251953125, -1.0504150390625, -0.931121826171875, -0.81182861328125, -0.692535400390625, -0.5732421875, -0.453948974609375, -0.33465576171875, -0.215362548828125, -0.0960693359375, 0.023223876953125, 0.14251708984375, 0.261810302734375, 0.381103515625, 0.500396728515625, 0.61968994140625, 0.738983154296875, 0.8582763671875, 0.977569580078125, 1.09686279296875, 1.216156005859375, 1.33544921875, 1.454742431640625, 1.57403564453125, 1.693328857421875, 1.8126220703125, 1.931915283203125, 2.05120849609375, 2.170501708984375, 2.289794921875, 2.409088134765625, 2.52838134765625, 2.647674560546875, 2.7669677734375, 2.886260986328125, 3.00555419921875, 3.124847412109375, 3.244140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 12.0, 17.0, 7.0, 30.0, 24.0, 40.0, 36.0, 54.0, 53.0, 66.0, 68.0, 67.0, 72.0, 55.0, 69.0, 58.0, 41.0, 32.0, 27.0, 24.0, 29.0, 27.0, 21.0, 8.0, 7.0, 8.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5102920532226562, -0.4956817626953125, -0.48107147216796875, -0.466461181640625, -0.45185089111328125, -0.4372406005859375, -0.42263031005859375, -0.40802001953125, -0.39340972900390625, -0.3787994384765625, -0.36418914794921875, -0.349578857421875, -0.33496856689453125, -0.3203582763671875, -0.30574798583984375, -0.2911376953125, -0.27652740478515625, -0.2619171142578125, -0.24730682373046875, -0.232696533203125, -0.21808624267578125, -0.2034759521484375, -0.18886566162109375, -0.17425537109375, -0.15964508056640625, -0.1450347900390625, -0.13042449951171875, -0.115814208984375, -0.10120391845703125, -0.0865936279296875, -0.07198333740234375, -0.057373046875, -0.04276275634765625, -0.0281524658203125, -0.01354217529296875, 0.001068115234375, 0.01567840576171875, 0.0302886962890625, 0.04489898681640625, 0.05950927734375, 0.07411956787109375, 0.0887298583984375, 0.10334014892578125, 0.117950439453125, 0.13256072998046875, 0.1471710205078125, 0.16178131103515625, 0.1763916015625, 0.19100189208984375, 0.2056121826171875, 0.22022247314453125, 0.234832763671875, 0.24944305419921875, 0.2640533447265625, 0.27866363525390625, 0.29327392578125, 0.30788421630859375, 0.3224945068359375, 0.33710479736328125, 0.351715087890625, 0.36632537841796875, 0.3809356689453125, 0.39554595947265625, 0.41015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 16.0, 15.0, 13.0, 26.0, 24.0, 41.0, 41.0, 57.0, 68.0, 105.0, 105.0, 169.0, 262.0, 544.0, 1206.0, 3263.0, 12439.0, 135899.0, 3989635.0, 39826.0, 6603.0, 1938.0, 815.0, 351.0, 225.0, 128.0, 95.0, 76.0, 57.0, 52.0, 38.0, 34.0, 22.0, 20.0, 13.0, 13.0, 5.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.977813720703125, -1.91461181640625, -1.851409912109375, -1.7882080078125, -1.725006103515625, -1.66180419921875, -1.598602294921875, -1.535400390625, -1.472198486328125, -1.40899658203125, -1.345794677734375, -1.2825927734375, -1.219390869140625, -1.15618896484375, -1.092987060546875, -1.02978515625, -0.966583251953125, -0.90338134765625, -0.840179443359375, -0.7769775390625, -0.713775634765625, -0.65057373046875, -0.587371826171875, -0.524169921875, -0.460968017578125, -0.39776611328125, -0.334564208984375, -0.2713623046875, -0.208160400390625, -0.14495849609375, -0.081756591796875, -0.0185546875, 0.044647216796875, 0.10784912109375, 0.171051025390625, 0.2342529296875, 0.297454833984375, 0.36065673828125, 0.423858642578125, 0.487060546875, 0.550262451171875, 0.61346435546875, 0.676666259765625, 0.7398681640625, 0.803070068359375, 0.86627197265625, 0.929473876953125, 0.99267578125, 1.055877685546875, 1.11907958984375, 1.182281494140625, 1.2454833984375, 1.308685302734375, 1.37188720703125, 1.435089111328125, 1.498291015625, 1.561492919921875, 1.62469482421875, 1.687896728515625, 1.7510986328125, 1.814300537109375, 1.87750244140625, 1.940704345703125, 2.00390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 7.0, 10.0, 18.0, 32.0, 71.0, 233.0, 3275.0, 270.0, 77.0, 33.0, 18.0, 9.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.2946014404296875, -0.282073974609375, -0.2695465087890625, -0.25701904296875, -0.2444915771484375, -0.231964111328125, -0.2194366455078125, -0.2069091796875, -0.1943817138671875, -0.181854248046875, -0.1693267822265625, -0.15679931640625, -0.1442718505859375, -0.131744384765625, -0.1192169189453125, -0.106689453125, -0.0941619873046875, -0.081634521484375, -0.0691070556640625, -0.05657958984375, -0.0440521240234375, -0.031524658203125, -0.0189971923828125, -0.0064697265625, 0.0060577392578125, 0.018585205078125, 0.0311126708984375, 0.04364013671875, 0.0561676025390625, 0.068695068359375, 0.0812225341796875, 0.09375, 0.1062774658203125, 0.118804931640625, 0.1313323974609375, 0.14385986328125, 0.1563873291015625, 0.168914794921875, 0.1814422607421875, 0.1939697265625, 0.2064971923828125, 0.219024658203125, 0.2315521240234375, 0.24407958984375, 0.2566070556640625, 0.269134521484375, 0.2816619873046875, 0.294189453125, 0.3067169189453125, 0.319244384765625, 0.3317718505859375, 0.34429931640625, 0.3568267822265625, 0.369354248046875, 0.3818817138671875, 0.3944091796875, 0.4069366455078125, 0.419464111328125, 0.4319915771484375, 0.44451904296875, 0.4570465087890625, 0.469573974609375, 0.4821014404296875, 0.49462890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 8.0, 19.0, 23.0, 27.0, 41.0, 49.0, 76.0, 88.0, 107.0, 80.0, 102.0, 82.0, 79.0, 51.0, 54.0, 26.0, 23.0, 14.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.655744194984436, -0.6270523071289062, -0.5983604788780212, -0.5696685910224915, -0.5409767627716064, -0.5122848749160767, -0.48359301686286926, -0.45490115880966187, -0.4262092709541321, -0.3975174129009247, -0.3688255548477173, -0.3401336669921875, -0.3114418089389801, -0.2827499508857727, -0.2540580928325653, -0.22536621987819672, -0.1966743767261505, -0.16798251867294312, -0.13929064571857452, -0.11059878766536713, -0.08190692216157913, -0.05321505665779114, -0.02452319860458374, 0.004168674349784851, 0.03286053240299225, 0.06155239790678024, 0.09024426341056824, 0.11893612146377563, 0.14762797951698303, 0.17631985247135162, 0.20501171052455902, 0.2337035834789276, 0.262395441532135, 0.2910872995853424, 0.3197791576385498, 0.3484710454940796, 0.377162903547287, 0.4058547616004944, 0.4345466196537018, 0.4632384777069092, 0.49193036556243896, 0.5206222534179688, 0.5493140816688538, 0.5780059695243835, 0.6066977977752686, 0.6353896856307983, 0.6640815734863281, 0.6927734017372131, 0.7214652299880981, 0.7501571178436279, 0.7788489460945129, 0.8075408339500427, 0.8362326622009277, 0.8649245500564575, 0.8936164379119873, 0.9223082661628723, 0.9510001540184021, 0.9796920418739319, 1.008383870124817, 1.0370757579803467, 1.0657676458358765, 1.0944595336914062, 1.1231513023376465, 1.1518431901931763, 1.180535078048706]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 5.0, 14.0, 15.0, 20.0, 17.0, 22.0, 16.0, 24.0, 29.0, 19.0, 33.0, 37.0, 48.0, 31.0, 30.0, 43.0, 39.0, 33.0, 37.0, 54.0, 48.0, 41.0, 25.0, 43.0, 42.0, 36.0, 25.0, 27.0, 24.0, 13.0, 11.0, 10.0, 10.0, 13.0, 8.0, 9.0, 8.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.539333701133728, -0.5228256583213806, -0.506317675113678, -0.48980966210365295, -0.47330164909362793, -0.4567936360836029, -0.4402856230735779, -0.42377758026123047, -0.40726959705352783, -0.3907615840435028, -0.3742535710334778, -0.35774555802345276, -0.34123754501342773, -0.3247295320034027, -0.3082215189933777, -0.2917134761810303, -0.27520546317100525, -0.2586974501609802, -0.2421894371509552, -0.22568142414093018, -0.20917341113090515, -0.19266539812088013, -0.1761573702096939, -0.15964935719966888, -0.14314134418964386, -0.12663333117961884, -0.11012531816959381, -0.09361729770898819, -0.07710928469896317, -0.06060127168893814, -0.04409325122833252, -0.027585238218307495, -0.01107722520828247, 0.005430789664387703, 0.021938804537057877, 0.0384468212723732, 0.054954834282398224, 0.07146284729242325, 0.08797086775302887, 0.1044788807630539, 0.12098689377307892, 0.13749490678310394, 0.15400291979312897, 0.17051094770431519, 0.1870189607143402, 0.20352697372436523, 0.22003498673439026, 0.23654299974441528, 0.2530510127544403, 0.26955902576446533, 0.28606703877449036, 0.3025750517845154, 0.3190830647945404, 0.33559107780456543, 0.35209912061691284, 0.3686071038246155, 0.3851151466369629, 0.4016231596469879, 0.41813117265701294, 0.43463918566703796, 0.451147198677063, 0.467655211687088, 0.48416322469711304, 0.5006712675094604, 0.5171792507171631]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 22.0, 21.0, 31.0, 44.0, 98.0, 168.0, 279.0, 562.0, 1235.0, 3231.0, 10478.0, 49377.0, 413206.0, 491427.0, 60219.0, 11823.0, 3518.0, 1387.0, 634.0, 305.0, 172.0, 103.0, 55.0, 39.0, 19.0, 25.0, 12.0, 12.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.279296875, -2.195037841796875, -2.11077880859375, -2.026519775390625, -1.9422607421875, -1.858001708984375, -1.77374267578125, -1.689483642578125, -1.605224609375, -1.520965576171875, -1.43670654296875, -1.352447509765625, -1.2681884765625, -1.183929443359375, -1.09967041015625, -1.015411376953125, -0.93115234375, -0.846893310546875, -0.76263427734375, -0.678375244140625, -0.5941162109375, -0.509857177734375, -0.42559814453125, -0.341339111328125, -0.257080078125, -0.172821044921875, -0.08856201171875, -0.004302978515625, 0.0799560546875, 0.164215087890625, 0.24847412109375, 0.332733154296875, 0.4169921875, 0.501251220703125, 0.58551025390625, 0.669769287109375, 0.7540283203125, 0.838287353515625, 0.92254638671875, 1.006805419921875, 1.091064453125, 1.175323486328125, 1.25958251953125, 1.343841552734375, 1.4281005859375, 1.512359619140625, 1.59661865234375, 1.680877685546875, 1.76513671875, 1.849395751953125, 1.93365478515625, 2.017913818359375, 2.1021728515625, 2.186431884765625, 2.27069091796875, 2.354949951171875, 2.439208984375, 2.523468017578125, 2.60772705078125, 2.691986083984375, 2.7762451171875, 2.860504150390625, 2.94476318359375, 3.029022216796875, 3.11328125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 9.0, 19.0, 22.0, 29.0, 37.0, 24.0, 38.0, 48.0, 52.0, 75.0, 56.0, 67.0, 75.0, 83.0, 82.0, 51.0, 37.0, 29.0, 42.0, 22.0, 22.0, 21.0, 12.0, 13.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6308135986328125, -0.614166259765625, -0.5975189208984375, -0.58087158203125, -0.5642242431640625, -0.547576904296875, -0.5309295654296875, -0.5142822265625, -0.4976348876953125, -0.480987548828125, -0.4643402099609375, -0.44769287109375, -0.4310455322265625, -0.414398193359375, -0.3977508544921875, -0.381103515625, -0.3644561767578125, -0.347808837890625, -0.3311614990234375, -0.31451416015625, -0.2978668212890625, -0.281219482421875, -0.2645721435546875, -0.2479248046875, -0.2312774658203125, -0.214630126953125, -0.1979827880859375, -0.18133544921875, -0.1646881103515625, -0.148040771484375, -0.1313934326171875, -0.11474609375, -0.0980987548828125, -0.081451416015625, -0.0648040771484375, -0.04815673828125, -0.0315093994140625, -0.014862060546875, 0.0017852783203125, 0.0184326171875, 0.0350799560546875, 0.051727294921875, 0.0683746337890625, 0.08502197265625, 0.1016693115234375, 0.118316650390625, 0.1349639892578125, 0.151611328125, 0.1682586669921875, 0.184906005859375, 0.2015533447265625, 0.21820068359375, 0.2348480224609375, 0.251495361328125, 0.2681427001953125, 0.2847900390625, 0.3014373779296875, 0.318084716796875, 0.3347320556640625, 0.35137939453125, 0.3680267333984375, 0.384674072265625, 0.4013214111328125, 0.41796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 7.0, 19.0, 29.0, 27.0, 39.0, 44.0, 71.0, 95.0, 123.0, 175.0, 289.0, 425.0, 673.0, 1241.0, 2294.0, 4903.0, 10946.0, 27380.0, 77284.0, 249294.0, 433104.0, 155179.0, 50113.0, 18675.0, 7830.0, 3638.0, 1872.0, 979.0, 544.0, 335.0, 247.0, 156.0, 118.0, 87.0, 63.0, 50.0, 45.0, 28.0, 26.0, 18.0, 17.0, 15.0, 12.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9013671875, -0.87060546875, -0.83984375, -0.80908203125, -0.7783203125, -0.74755859375, -0.716796875, -0.68603515625, -0.6552734375, -0.62451171875, -0.59375, -0.56298828125, -0.5322265625, -0.50146484375, -0.470703125, -0.43994140625, -0.4091796875, -0.37841796875, -0.34765625, -0.31689453125, -0.2861328125, -0.25537109375, -0.224609375, -0.19384765625, -0.1630859375, -0.13232421875, -0.1015625, -0.07080078125, -0.0400390625, -0.00927734375, 0.021484375, 0.05224609375, 0.0830078125, 0.11376953125, 0.14453125, 0.17529296875, 0.2060546875, 0.23681640625, 0.267578125, 0.29833984375, 0.3291015625, 0.35986328125, 0.390625, 0.42138671875, 0.4521484375, 0.48291015625, 0.513671875, 0.54443359375, 0.5751953125, 0.60595703125, 0.63671875, 0.66748046875, 0.6982421875, 0.72900390625, 0.759765625, 0.79052734375, 0.8212890625, 0.85205078125, 0.8828125, 0.91357421875, 0.9443359375, 0.97509765625, 1.005859375, 1.03662109375, 1.0673828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 11.0, 11.0, 18.0, 21.0, 21.0, 19.0, 30.0, 21.0, 19.0, 27.0, 35.0, 40.0, 35.0, 56.0, 43.0, 36.0, 35.0, 44.0, 45.0, 52.0, 35.0, 29.0, 33.0, 36.0, 39.0, 16.0, 25.0, 30.0, 22.0, 13.0, 17.0, 17.0, 8.0, 14.0, 11.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.865234375, -1.813995361328125, -1.76275634765625, -1.711517333984375, -1.6602783203125, -1.609039306640625, -1.55780029296875, -1.506561279296875, -1.455322265625, -1.404083251953125, -1.35284423828125, -1.301605224609375, -1.2503662109375, -1.199127197265625, -1.14788818359375, -1.096649169921875, -1.04541015625, -0.994171142578125, -0.94293212890625, -0.891693115234375, -0.8404541015625, -0.789215087890625, -0.73797607421875, -0.686737060546875, -0.635498046875, -0.584259033203125, -0.53302001953125, -0.481781005859375, -0.4305419921875, -0.379302978515625, -0.32806396484375, -0.276824951171875, -0.2255859375, -0.174346923828125, -0.12310791015625, -0.071868896484375, -0.0206298828125, 0.030609130859375, 0.08184814453125, 0.133087158203125, 0.184326171875, 0.235565185546875, 0.28680419921875, 0.338043212890625, 0.3892822265625, 0.440521240234375, 0.49176025390625, 0.542999267578125, 0.59423828125, 0.645477294921875, 0.69671630859375, 0.747955322265625, 0.7991943359375, 0.850433349609375, 0.90167236328125, 0.952911376953125, 1.004150390625, 1.055389404296875, 1.10662841796875, 1.157867431640625, 1.2091064453125, 1.260345458984375, 1.31158447265625, 1.362823486328125, 1.4140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 13.0, 10.0, 19.0, 23.0, 41.0, 77.0, 93.0, 176.0, 227.0, 524.0, 1079.0, 3111.0, 12088.0, 106646.0, 836521.0, 73166.0, 9938.0, 2670.0, 1001.0, 456.0, 238.0, 154.0, 69.0, 59.0, 36.0, 35.0, 21.0, 11.0, 8.0, 5.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2889556884765625, -1.241973876953125, -1.1949920654296875, -1.14801025390625, -1.1010284423828125, -1.054046630859375, -1.0070648193359375, -0.9600830078125, -0.9131011962890625, -0.866119384765625, -0.8191375732421875, -0.77215576171875, -0.7251739501953125, -0.678192138671875, -0.6312103271484375, -0.584228515625, -0.5372467041015625, -0.490264892578125, -0.4432830810546875, -0.39630126953125, -0.3493194580078125, -0.302337646484375, -0.2553558349609375, -0.2083740234375, -0.1613922119140625, -0.114410400390625, -0.0674285888671875, -0.02044677734375, 0.0265350341796875, 0.073516845703125, 0.1204986572265625, 0.16748046875, 0.2144622802734375, 0.261444091796875, 0.3084259033203125, 0.35540771484375, 0.4023895263671875, 0.449371337890625, 0.4963531494140625, 0.5433349609375, 0.5903167724609375, 0.637298583984375, 0.6842803955078125, 0.73126220703125, 0.7782440185546875, 0.825225830078125, 0.8722076416015625, 0.919189453125, 0.9661712646484375, 1.013153076171875, 1.0601348876953125, 1.10711669921875, 1.1540985107421875, 1.201080322265625, 1.2480621337890625, 1.2950439453125, 1.3420257568359375, 1.389007568359375, 1.4359893798828125, 1.48297119140625, 1.5299530029296875, 1.576934814453125, 1.6239166259765625, 1.6708984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 13.0, 18.0, 19.0, 36.0, 46.0, 77.0, 99.0, 120.0, 135.0, 118.0, 77.0, 64.0, 39.0, 25.0, 29.0, 22.0, 11.0, 5.0, 1.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002149343490600586, -0.00020903907716274261, -0.00020314380526542664, -0.00019724853336811066, -0.00019135326147079468, -0.0001854579895734787, -0.00017956271767616272, -0.00017366744577884674, -0.00016777217388153076, -0.00016187690198421478, -0.0001559816300868988, -0.00015008635818958282, -0.00014419108629226685, -0.00013829581439495087, -0.0001324005424976349, -0.0001265052706003189, -0.00012060999870300293, -0.00011471472680568695, -0.00010881945490837097, -0.00010292418301105499, -9.702891111373901e-05, -9.113363921642303e-05, -8.523836731910706e-05, -7.934309542179108e-05, -7.34478235244751e-05, -6.755255162715912e-05, -6.165727972984314e-05, -5.576200783252716e-05, -4.986673593521118e-05, -4.39714640378952e-05, -3.8076192140579224e-05, -3.2180920243263245e-05, -2.6285648345947266e-05, -2.0390376448631287e-05, -1.4495104551315308e-05, -8.599832653999329e-06, -2.7045607566833496e-06, 3.1907111406326294e-06, 9.085983037948608e-06, 1.4981254935264587e-05, 2.0876526832580566e-05, 2.6771798729896545e-05, 3.2667070627212524e-05, 3.8562342524528503e-05, 4.445761442184448e-05, 5.035288631916046e-05, 5.624815821647644e-05, 6.214343011379242e-05, 6.80387020111084e-05, 7.393397390842438e-05, 7.982924580574036e-05, 8.572451770305634e-05, 9.161978960037231e-05, 9.75150614976883e-05, 0.00010341033339500427, 0.00010930560529232025, 0.00011520087718963623, 0.00012109614908695221, 0.0001269914209842682, 0.00013288669288158417, 0.00013878196477890015, 0.00014467723667621613, 0.0001505725085735321, 0.00015646778047084808, 0.00016236305236816406]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 15.0, 14.0, 19.0, 29.0, 43.0, 64.0, 85.0, 130.0, 216.0, 330.0, 624.0, 1202.0, 2558.0, 6033.0, 19218.0, 97896.0, 676768.0, 198562.0, 29611.0, 8409.0, 3259.0, 1514.0, 769.0, 454.0, 234.0, 147.0, 104.0, 54.0, 40.0, 29.0, 18.0, 17.0, 20.0, 12.0, 8.0, 8.0, 6.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1650390625, -1.1314239501953125, -1.097808837890625, -1.0641937255859375, -1.03057861328125, -0.9969635009765625, -0.963348388671875, -0.9297332763671875, -0.8961181640625, -0.8625030517578125, -0.828887939453125, -0.7952728271484375, -0.76165771484375, -0.7280426025390625, -0.694427490234375, -0.6608123779296875, -0.627197265625, -0.5935821533203125, -0.559967041015625, -0.5263519287109375, -0.49273681640625, -0.4591217041015625, -0.425506591796875, -0.3918914794921875, -0.3582763671875, -0.3246612548828125, -0.291046142578125, -0.2574310302734375, -0.22381591796875, -0.1902008056640625, -0.156585693359375, -0.1229705810546875, -0.08935546875, -0.0557403564453125, -0.022125244140625, 0.0114898681640625, 0.04510498046875, 0.0787200927734375, 0.112335205078125, 0.1459503173828125, 0.1795654296875, 0.2131805419921875, 0.246795654296875, 0.2804107666015625, 0.31402587890625, 0.3476409912109375, 0.381256103515625, 0.4148712158203125, 0.448486328125, 0.4821014404296875, 0.515716552734375, 0.5493316650390625, 0.58294677734375, 0.6165618896484375, 0.650177001953125, 0.6837921142578125, 0.7174072265625, 0.7510223388671875, 0.784637451171875, 0.8182525634765625, 0.85186767578125, 0.8854827880859375, 0.919097900390625, 0.9527130126953125, 0.986328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 12.0, 7.0, 14.0, 13.0, 38.0, 40.0, 61.0, 60.0, 78.0, 94.0, 101.0, 87.0, 78.0, 67.0, 44.0, 37.0, 25.0, 28.0, 17.0, 14.0, 14.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.95361328125, -0.92413330078125, -0.8946533203125, -0.86517333984375, -0.835693359375, -0.80621337890625, -0.7767333984375, -0.74725341796875, -0.7177734375, -0.68829345703125, -0.6588134765625, -0.62933349609375, -0.599853515625, -0.57037353515625, -0.5408935546875, -0.51141357421875, -0.48193359375, -0.45245361328125, -0.4229736328125, -0.39349365234375, -0.364013671875, -0.33453369140625, -0.3050537109375, -0.27557373046875, -0.24609375, -0.21661376953125, -0.1871337890625, -0.15765380859375, -0.128173828125, -0.09869384765625, -0.0692138671875, -0.03973388671875, -0.01025390625, 0.01922607421875, 0.0487060546875, 0.07818603515625, 0.107666015625, 0.13714599609375, 0.1666259765625, 0.19610595703125, 0.2255859375, 0.25506591796875, 0.2845458984375, 0.31402587890625, 0.343505859375, 0.37298583984375, 0.4024658203125, 0.43194580078125, 0.46142578125, 0.49090576171875, 0.5203857421875, 0.54986572265625, 0.579345703125, 0.60882568359375, 0.6383056640625, 0.66778564453125, 0.697265625, 0.72674560546875, 0.7562255859375, 0.78570556640625, 0.815185546875, 0.84466552734375, 0.8741455078125, 0.90362548828125, 0.93310546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 16.0, 32.0, 27.0, 51.0, 79.0, 100.0, 103.0, 122.0, 123.0, 98.0, 76.0, 69.0, 41.0, 22.0, 10.0, 5.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.934856414794922, -10.563733100891113, -10.192610740661621, -9.821487426757812, -9.450364112854004, -9.079240798950195, -8.708118438720703, -8.336995124816895, -7.965871810913086, -7.5947489738464355, -7.223625659942627, -6.852502822875977, -6.481379508972168, -6.110256671905518, -5.739133834838867, -5.368010520935059, -4.996887683868408, -4.625764846801758, -4.254641532897949, -3.883518695831299, -3.5123953819274902, -3.14127254486084, -2.7701494693756104, -2.399026393890381, -2.0279033184051514, -1.6567802429199219, -1.2856571674346924, -0.9145342111587524, -0.543411135673523, -0.17228806018829346, 0.19883489608764648, 0.569957971572876, 0.9410810470581055, 1.312204122543335, 1.6833271980285645, 2.054450035095215, 2.4255733489990234, 2.796696186065674, 3.1678192615509033, 3.538942337036133, 3.9100654125213623, 4.281188488006592, 4.652311325073242, 5.023434638977051, 5.394557476043701, 5.76568078994751, 6.13680362701416, 6.507926940917969, 6.879049777984619, 7.2501726150512695, 7.621295928955078, 7.9924187660217285, 8.363541603088379, 8.734664916992188, 9.105788230895996, 9.476911544799805, 9.848033905029297, 10.219157218933105, 10.590279579162598, 10.961402893066406, 11.332526206970215, 11.703649520874023, 12.074771881103516, 12.445895195007324, 12.817018508911133]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 8.0, 11.0, 9.0, 12.0, 15.0, 19.0, 19.0, 25.0, 35.0, 34.0, 43.0, 29.0, 46.0, 53.0, 53.0, 34.0, 44.0, 56.0, 51.0, 56.0, 44.0, 39.0, 42.0, 30.0, 36.0, 16.0, 28.0, 22.0, 15.0, 16.0, 8.0, 17.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.743335723876953, -9.455294609069824, -9.167252540588379, -8.87921142578125, -8.591169357299805, -8.303128242492676, -8.01508617401123, -7.727045059204102, -7.4390034675598145, -7.150961875915527, -6.86292028427124, -6.574878692626953, -6.286837577819824, -5.998795509338379, -5.71075439453125, -5.422712802886963, -5.134671211242676, -4.846629619598389, -4.558588027954102, -4.2705464363098145, -3.9825050830841064, -3.6944634914398193, -3.4064221382141113, -3.118380546569824, -2.830338954925537, -2.54229736328125, -2.254255771636963, -1.9662144184112549, -1.6781728267669678, -1.3901312351226807, -1.102089762687683, -0.8140482902526855, -0.5260066986083984, -0.2379651665687561, 0.05007636547088623, 0.33811789751052856, 0.6261594295501709, 0.914201021194458, 1.2022424936294556, 1.4902839660644531, 1.7783255577087402, 2.0663671493530273, 2.3544087409973145, 2.6424500942230225, 2.9304916858673096, 3.2185332775115967, 3.5065746307373047, 3.794616222381592, 4.082657814025879, 4.370699405670166, 4.658740997314453, 4.94678258895874, 5.234824180603027, 5.522865295410156, 5.810906887054443, 6.0989484786987305, 6.386990070343018, 6.675031661987305, 6.963073253631592, 7.251114845275879, 7.539155960083008, 7.827198028564453, 8.115239143371582, 8.403280258178711, 8.691322326660156]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 14.0, 27.0, 41.0, 74.0, 104.0, 170.0, 327.0, 663.0, 1457.0, 4272.0, 22699.0, 4056233.0, 95594.0, 8132.0, 2345.0, 999.0, 482.0, 259.0, 147.0, 71.0, 63.0, 31.0, 10.0, 18.0, 12.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.330078125, -3.231353759765625, -3.13262939453125, -3.033905029296875, -2.9351806640625, -2.836456298828125, -2.73773193359375, -2.639007568359375, -2.540283203125, -2.441558837890625, -2.34283447265625, -2.244110107421875, -2.1453857421875, -2.046661376953125, -1.94793701171875, -1.849212646484375, -1.75048828125, -1.651763916015625, -1.55303955078125, -1.454315185546875, -1.3555908203125, -1.256866455078125, -1.15814208984375, -1.059417724609375, -0.960693359375, -0.861968994140625, -0.76324462890625, -0.664520263671875, -0.5657958984375, -0.467071533203125, -0.36834716796875, -0.269622802734375, -0.1708984375, -0.072174072265625, 0.02655029296875, 0.125274658203125, 0.2239990234375, 0.322723388671875, 0.42144775390625, 0.520172119140625, 0.618896484375, 0.717620849609375, 0.81634521484375, 0.915069580078125, 1.0137939453125, 1.112518310546875, 1.21124267578125, 1.309967041015625, 1.40869140625, 1.507415771484375, 1.60614013671875, 1.704864501953125, 1.8035888671875, 1.902313232421875, 2.00103759765625, 2.099761962890625, 2.198486328125, 2.297210693359375, 2.39593505859375, 2.494659423828125, 2.5933837890625, 2.692108154296875, 2.79083251953125, 2.889556884765625, 2.98828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 12.0, 10.0, 15.0, 10.0, 19.0, 20.0, 32.0, 35.0, 30.0, 42.0, 57.0, 59.0, 69.0, 65.0, 67.0, 47.0, 62.0, 57.0, 54.0, 41.0, 52.0, 18.0, 19.0, 22.0, 19.0, 23.0, 6.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.529296875, -0.5138778686523438, -0.4984588623046875, -0.48303985595703125, -0.467620849609375, -0.45220184326171875, -0.4367828369140625, -0.42136383056640625, -0.40594482421875, -0.39052581787109375, -0.3751068115234375, -0.35968780517578125, -0.344268798828125, -0.32884979248046875, -0.3134307861328125, -0.29801177978515625, -0.2825927734375, -0.26717376708984375, -0.2517547607421875, -0.23633575439453125, -0.220916748046875, -0.20549774169921875, -0.1900787353515625, -0.17465972900390625, -0.15924072265625, -0.14382171630859375, -0.1284027099609375, -0.11298370361328125, -0.097564697265625, -0.08214569091796875, -0.0667266845703125, -0.05130767822265625, -0.035888671875, -0.02046966552734375, -0.0050506591796875, 0.01036834716796875, 0.025787353515625, 0.04120635986328125, 0.0566253662109375, 0.07204437255859375, 0.08746337890625, 0.10288238525390625, 0.1183013916015625, 0.13372039794921875, 0.149139404296875, 0.16455841064453125, 0.1799774169921875, 0.19539642333984375, 0.2108154296875, 0.22623443603515625, 0.2416534423828125, 0.25707244873046875, 0.272491455078125, 0.28791046142578125, 0.3033294677734375, 0.31874847412109375, 0.33416748046875, 0.34958648681640625, 0.3650054931640625, 0.38042449951171875, 0.395843505859375, 0.41126251220703125, 0.4266815185546875, 0.44210052490234375, 0.45751953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 6.0, 10.0, 10.0, 12.0, 24.0, 40.0, 44.0, 62.0, 75.0, 123.0, 169.0, 279.0, 345.0, 518.0, 810.0, 1289.0, 2243.0, 5131.0, 18946.0, 369307.0, 3750127.0, 30601.0, 6843.0, 2876.0, 1478.0, 924.0, 624.0, 399.0, 273.0, 210.0, 135.0, 82.0, 75.0, 47.0, 30.0, 32.0, 15.0, 23.0, 9.0, 7.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.933135986328125, -3.82720947265625, -3.721282958984375, -3.6153564453125, -3.509429931640625, -3.40350341796875, -3.297576904296875, -3.191650390625, -3.085723876953125, -2.97979736328125, -2.873870849609375, -2.7679443359375, -2.662017822265625, -2.55609130859375, -2.450164794921875, -2.34423828125, -2.238311767578125, -2.13238525390625, -2.026458740234375, -1.9205322265625, -1.814605712890625, -1.70867919921875, -1.602752685546875, -1.496826171875, -1.390899658203125, -1.28497314453125, -1.179046630859375, -1.0731201171875, -0.967193603515625, -0.86126708984375, -0.755340576171875, -0.6494140625, -0.543487548828125, -0.43756103515625, -0.331634521484375, -0.2257080078125, -0.119781494140625, -0.01385498046875, 0.092071533203125, 0.197998046875, 0.303924560546875, 0.40985107421875, 0.515777587890625, 0.6217041015625, 0.727630615234375, 0.83355712890625, 0.939483642578125, 1.04541015625, 1.151336669921875, 1.25726318359375, 1.363189697265625, 1.4691162109375, 1.575042724609375, 1.68096923828125, 1.786895751953125, 1.892822265625, 1.998748779296875, 2.10467529296875, 2.210601806640625, 2.3165283203125, 2.422454833984375, 2.52838134765625, 2.634307861328125, 2.740234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 6.0, 12.0, 19.0, 31.0, 55.0, 144.0, 737.0, 2718.0, 199.0, 60.0, 27.0, 11.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54052734375, -0.5161514282226562, -0.4917755126953125, -0.46739959716796875, -0.443023681640625, -0.41864776611328125, -0.3942718505859375, -0.36989593505859375, -0.34552001953125, -0.32114410400390625, -0.2967681884765625, -0.27239227294921875, -0.248016357421875, -0.22364044189453125, -0.1992645263671875, -0.17488861083984375, -0.1505126953125, -0.12613677978515625, -0.1017608642578125, -0.07738494873046875, -0.053009033203125, -0.02863311767578125, -0.0042572021484375, 0.02011871337890625, 0.04449462890625, 0.06887054443359375, 0.0932464599609375, 0.11762237548828125, 0.141998291015625, 0.16637420654296875, 0.1907501220703125, 0.21512603759765625, 0.239501953125, 0.26387786865234375, 0.2882537841796875, 0.31262969970703125, 0.337005615234375, 0.36138153076171875, 0.3857574462890625, 0.41013336181640625, 0.43450927734375, 0.45888519287109375, 0.4832611083984375, 0.5076370239257812, 0.532012939453125, 0.5563888549804688, 0.5807647705078125, 0.6051406860351562, 0.6295166015625, 0.6538925170898438, 0.6782684326171875, 0.7026443481445312, 0.727020263671875, 0.7513961791992188, 0.7757720947265625, 0.8001480102539062, 0.82452392578125, 0.8488998413085938, 0.8732757568359375, 0.8976516723632812, 0.922027587890625, 0.9464035034179688, 0.9707794189453125, 0.9951553344726562, 1.01953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 12.0, 23.0, 31.0, 53.0, 100.0, 159.0, 184.0, 130.0, 104.0, 57.0, 42.0, 24.0, 19.0, 16.0, 5.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.534883499145508, -4.373327255249023, -4.211770534515381, -4.0502142906188965, -3.888657808303833, -3.7271013259887695, -3.565545082092285, -3.4039885997772217, -3.242432117462158, -3.0808756351470947, -2.9193191528320312, -2.757762908935547, -2.5962064266204834, -2.43464994430542, -2.2730937004089355, -2.111537218093872, -1.9499807357788086, -1.7884242534637451, -1.6268678903579712, -1.4653115272521973, -1.3037550449371338, -1.1421985626220703, -0.9806421995162964, -0.8190858364105225, -0.657529354095459, -0.4959729313850403, -0.3344165086746216, -0.17286008596420288, -0.01130366325378418, 0.15025275945663452, 0.3118091821670532, 0.47336554527282715, 0.6349220275878906, 0.7964784502983093, 0.958034873008728, 1.119591236114502, 1.2811477184295654, 1.442704200744629, 1.6042605638504028, 1.7658169269561768, 1.9273734092712402, 2.0889298915863037, 2.250486373901367, 2.4120426177978516, 2.573599100112915, 2.7351555824279785, 2.896711826324463, 3.0582683086395264, 3.21982479095459, 3.3813812732696533, 3.542937755584717, 3.704493999481201, 3.8660504817962646, 4.027606964111328, 4.1891632080078125, 4.350719451904297, 4.5122761726379395, 4.673832416534424, 4.835389137268066, 4.996945381164551, 5.158501625061035, 5.320058345794678, 5.481614589691162, 5.643171310424805, 5.804727554321289]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 9.0, 14.0, 17.0, 10.0, 15.0, 20.0, 19.0, 16.0, 27.0, 30.0, 27.0, 33.0, 33.0, 41.0, 37.0, 30.0, 32.0, 47.0, 36.0, 44.0, 39.0, 37.0, 32.0, 31.0, 36.0, 35.0, 36.0, 35.0, 21.0, 18.0, 23.0, 12.0, 16.0, 12.0, 14.0, 13.0, 7.0, 9.0, 4.0, 6.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.083937406539917, -2.0216033458709717, -1.959269404411316, -1.8969354629516602, -1.8346015214920044, -1.7722675800323486, -1.7099335193634033, -1.6475995779037476, -1.5852656364440918, -1.522931694984436, -1.4605976343154907, -1.398263692855835, -1.3359297513961792, -1.2735958099365234, -1.2112617492675781, -1.1489278078079224, -1.0865938663482666, -1.0242599248886108, -0.9619259238243103, -0.8995919227600098, -0.837257981300354, -0.7749239802360535, -0.7125899791717529, -0.6502560377120972, -0.5879219770431519, -0.5255879759788513, -0.46325403451919556, -0.400920033454895, -0.33858609199523926, -0.2762520909309387, -0.21391811966896057, -0.15158414840698242, -0.08925020694732666, -0.026916231960058212, 0.035417743027210236, 0.09775172173976898, 0.16008569300174713, 0.22241967916488647, 0.2847536504268646, 0.3470876216888428, 0.4094215929508209, 0.4717555642127991, 0.5340895652770996, 0.5964235067367554, 0.6587575078010559, 0.7210915088653564, 0.7834254503250122, 0.845759391784668, 0.9080933928489685, 0.970427393913269, 1.0327613353729248, 1.0950952768325806, 1.1574293375015259, 1.2197632789611816, 1.2820972204208374, 1.3444311618804932, 1.4067652225494385, 1.4690991640090942, 1.5314332246780396, 1.5937671661376953, 1.656101107597351, 1.7184350490570068, 1.7807691097259521, 1.843103051185608, 1.9054369926452637]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 5.0, 16.0, 15.0, 34.0, 39.0, 56.0, 98.0, 169.0, 379.0, 980.0, 2652.0, 10109.0, 51604.0, 380506.0, 508559.0, 74695.0, 13139.0, 3363.0, 1187.0, 451.0, 207.0, 106.0, 74.0, 34.0, 21.0, 22.0, 9.0, 10.0, 8.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.212890625, -2.146026611328125, -2.07916259765625, -2.012298583984375, -1.9454345703125, -1.878570556640625, -1.81170654296875, -1.744842529296875, -1.677978515625, -1.611114501953125, -1.54425048828125, -1.477386474609375, -1.4105224609375, -1.343658447265625, -1.27679443359375, -1.209930419921875, -1.14306640625, -1.076202392578125, -1.00933837890625, -0.942474365234375, -0.8756103515625, -0.808746337890625, -0.74188232421875, -0.675018310546875, -0.608154296875, -0.541290283203125, -0.47442626953125, -0.407562255859375, -0.3406982421875, -0.273834228515625, -0.20697021484375, -0.140106201171875, -0.0732421875, -0.006378173828125, 0.06048583984375, 0.127349853515625, 0.1942138671875, 0.261077880859375, 0.32794189453125, 0.394805908203125, 0.461669921875, 0.528533935546875, 0.59539794921875, 0.662261962890625, 0.7291259765625, 0.795989990234375, 0.86285400390625, 0.929718017578125, 0.99658203125, 1.063446044921875, 1.13031005859375, 1.197174072265625, 1.2640380859375, 1.330902099609375, 1.39776611328125, 1.464630126953125, 1.531494140625, 1.598358154296875, 1.66522216796875, 1.732086181640625, 1.7989501953125, 1.865814208984375, 1.93267822265625, 1.999542236328125, 2.06640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 17.0, 13.0, 18.0, 18.0, 32.0, 35.0, 40.0, 30.0, 57.0, 50.0, 57.0, 60.0, 54.0, 64.0, 55.0, 43.0, 52.0, 36.0, 41.0, 37.0, 22.0, 38.0, 21.0, 22.0, 11.0, 20.0, 8.0, 8.0, 9.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5492706298828125, -0.529693603515625, -0.5101165771484375, -0.49053955078125, -0.4709625244140625, -0.451385498046875, -0.4318084716796875, -0.4122314453125, -0.3926544189453125, -0.373077392578125, -0.3535003662109375, -0.33392333984375, -0.3143463134765625, -0.294769287109375, -0.2751922607421875, -0.255615234375, -0.2360382080078125, -0.216461181640625, -0.1968841552734375, -0.17730712890625, -0.1577301025390625, -0.138153076171875, -0.1185760498046875, -0.0989990234375, -0.0794219970703125, -0.059844970703125, -0.0402679443359375, -0.02069091796875, -0.0011138916015625, 0.018463134765625, 0.0380401611328125, 0.0576171875, 0.0771942138671875, 0.096771240234375, 0.1163482666015625, 0.13592529296875, 0.1555023193359375, 0.175079345703125, 0.1946563720703125, 0.2142333984375, 0.2338104248046875, 0.253387451171875, 0.2729644775390625, 0.29254150390625, 0.3121185302734375, 0.331695556640625, 0.3512725830078125, 0.370849609375, 0.3904266357421875, 0.410003662109375, 0.4295806884765625, 0.44915771484375, 0.4687347412109375, 0.488311767578125, 0.5078887939453125, 0.5274658203125, 0.5470428466796875, 0.566619873046875, 0.5861968994140625, 0.60577392578125, 0.6253509521484375, 0.644927978515625, 0.6645050048828125, 0.68408203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 13.0, 26.0, 36.0, 53.0, 112.0, 240.0, 476.0, 1457.0, 9876.0, 466220.0, 556375.0, 11175.0, 1547.0, 469.0, 223.0, 111.0, 55.0, 29.0, 24.0, 17.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.761566162109375, -2.59930419921875, -2.437042236328125, -2.2747802734375, -2.112518310546875, -1.95025634765625, -1.787994384765625, -1.625732421875, -1.463470458984375, -1.30120849609375, -1.138946533203125, -0.9766845703125, -0.814422607421875, -0.65216064453125, -0.489898681640625, -0.32763671875, -0.165374755859375, -0.00311279296875, 0.159149169921875, 0.3214111328125, 0.483673095703125, 0.64593505859375, 0.808197021484375, 0.970458984375, 1.132720947265625, 1.29498291015625, 1.457244873046875, 1.6195068359375, 1.781768798828125, 1.94403076171875, 2.106292724609375, 2.2685546875, 2.430816650390625, 2.59307861328125, 2.755340576171875, 2.9176025390625, 3.079864501953125, 3.24212646484375, 3.404388427734375, 3.566650390625, 3.728912353515625, 3.89117431640625, 4.053436279296875, 4.2156982421875, 4.377960205078125, 4.54022216796875, 4.702484130859375, 4.86474609375, 5.027008056640625, 5.18927001953125, 5.351531982421875, 5.5137939453125, 5.676055908203125, 5.83831787109375, 6.000579833984375, 6.162841796875, 6.325103759765625, 6.48736572265625, 6.649627685546875, 6.8118896484375, 6.974151611328125, 7.13641357421875, 7.298675537109375, 7.4609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 8.0, 13.0, 15.0, 20.0, 22.0, 23.0, 30.0, 42.0, 49.0, 43.0, 38.0, 57.0, 44.0, 65.0, 58.0, 50.0, 58.0, 43.0, 42.0, 33.0, 43.0, 32.0, 41.0, 23.0, 19.0, 22.0, 13.0, 8.0, 7.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.969482421875, -2.87255859375, -2.775634765625, -2.6787109375, -2.581787109375, -2.48486328125, -2.387939453125, -2.291015625, -2.194091796875, -2.09716796875, -2.000244140625, -1.9033203125, -1.806396484375, -1.70947265625, -1.612548828125, -1.515625, -1.418701171875, -1.32177734375, -1.224853515625, -1.1279296875, -1.031005859375, -0.93408203125, -0.837158203125, -0.740234375, -0.643310546875, -0.54638671875, -0.449462890625, -0.3525390625, -0.255615234375, -0.15869140625, -0.061767578125, 0.03515625, 0.132080078125, 0.22900390625, 0.325927734375, 0.4228515625, 0.519775390625, 0.61669921875, 0.713623046875, 0.810546875, 0.907470703125, 1.00439453125, 1.101318359375, 1.1982421875, 1.295166015625, 1.39208984375, 1.489013671875, 1.5859375, 1.682861328125, 1.77978515625, 1.876708984375, 1.9736328125, 2.070556640625, 2.16748046875, 2.264404296875, 2.361328125, 2.458251953125, 2.55517578125, 2.652099609375, 2.7490234375, 2.845947265625, 2.94287109375, 3.039794921875, 3.13671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 16.0, 13.0, 30.0, 32.0, 60.0, 92.0, 154.0, 276.0, 651.0, 1552.0, 5613.0, 39073.0, 792539.0, 190972.0, 12812.0, 2780.0, 920.0, 442.0, 197.0, 100.0, 73.0, 52.0, 26.0, 25.0, 13.0, 11.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.033203125, -1.97296142578125, -1.9127197265625, -1.85247802734375, -1.792236328125, -1.73199462890625, -1.6717529296875, -1.61151123046875, -1.55126953125, -1.49102783203125, -1.4307861328125, -1.37054443359375, -1.310302734375, -1.25006103515625, -1.1898193359375, -1.12957763671875, -1.0693359375, -1.00909423828125, -0.9488525390625, -0.88861083984375, -0.828369140625, -0.76812744140625, -0.7078857421875, -0.64764404296875, -0.58740234375, -0.52716064453125, -0.4669189453125, -0.40667724609375, -0.346435546875, -0.28619384765625, -0.2259521484375, -0.16571044921875, -0.10546875, -0.04522705078125, 0.0150146484375, 0.07525634765625, 0.135498046875, 0.19573974609375, 0.2559814453125, 0.31622314453125, 0.37646484375, 0.43670654296875, 0.4969482421875, 0.55718994140625, 0.617431640625, 0.67767333984375, 0.7379150390625, 0.79815673828125, 0.8583984375, 0.91864013671875, 0.9788818359375, 1.03912353515625, 1.099365234375, 1.15960693359375, 1.2198486328125, 1.28009033203125, 1.34033203125, 1.40057373046875, 1.4608154296875, 1.52105712890625, 1.581298828125, 1.64154052734375, 1.7017822265625, 1.76202392578125, 1.822265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 16.0, 13.0, 23.0, 19.0, 34.0, 43.0, 64.0, 71.0, 85.0, 96.0, 104.0, 97.0, 70.0, 49.0, 53.0, 26.0, 21.0, 16.0, 5.0, 10.0, 5.0, 6.0, 8.0, 2.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017321109771728516, -0.00016699917614459991, -0.00016078725457191467, -0.00015457533299922943, -0.0001483634114265442, -0.00014215148985385895, -0.0001359395682811737, -0.00012972764670848846, -0.00012351572513580322, -0.00011730380356311798, -0.00011109188199043274, -0.0001048799604177475, -9.866803884506226e-05, -9.245611727237701e-05, -8.624419569969177e-05, -8.003227412700653e-05, -7.382035255432129e-05, -6.760843098163605e-05, -6.13965094089508e-05, -5.5184587836265564e-05, -4.897266626358032e-05, -4.276074469089508e-05, -3.654882311820984e-05, -3.0336901545524597e-05, -2.4124979972839355e-05, -1.7913058400154114e-05, -1.1701136827468872e-05, -5.48921525478363e-06, 7.227063179016113e-07, 6.934627890586853e-06, 1.3146549463272095e-05, 1.9358471035957336e-05, 2.5570392608642578e-05, 3.178231418132782e-05, 3.799423575401306e-05, 4.42061573266983e-05, 5.0418078899383545e-05, 5.663000047206879e-05, 6.284192204475403e-05, 6.905384361743927e-05, 7.526576519012451e-05, 8.147768676280975e-05, 8.7689608335495e-05, 9.390152990818024e-05, 0.00010011345148086548, 0.00010632537305355072, 0.00011253729462623596, 0.0001187492161989212, 0.00012496113777160645, 0.0001311730593442917, 0.00013738498091697693, 0.00014359690248966217, 0.0001498088240623474, 0.00015602074563503265, 0.0001622326672077179, 0.00016844458878040314, 0.00017465651035308838, 0.00018086843192577362, 0.00018708035349845886, 0.0001932922750711441, 0.00019950419664382935, 0.0002057161182165146, 0.00021192803978919983, 0.00021813996136188507, 0.0002243518829345703]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 13.0, 14.0, 16.0, 43.0, 89.0, 140.0, 260.0, 560.0, 1670.0, 9561.0, 483700.0, 539474.0, 10019.0, 1799.0, 569.0, 278.0, 130.0, 79.0, 35.0, 20.0, 23.0, 14.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.130859375, -2.0421142578125, -1.953369140625, -1.8646240234375, -1.77587890625, -1.6871337890625, -1.598388671875, -1.5096435546875, -1.4208984375, -1.3321533203125, -1.243408203125, -1.1546630859375, -1.06591796875, -0.9771728515625, -0.888427734375, -0.7996826171875, -0.7109375, -0.6221923828125, -0.533447265625, -0.4447021484375, -0.35595703125, -0.2672119140625, -0.178466796875, -0.0897216796875, -0.0009765625, 0.0877685546875, 0.176513671875, 0.2652587890625, 0.35400390625, 0.4427490234375, 0.531494140625, 0.6202392578125, 0.708984375, 0.7977294921875, 0.886474609375, 0.9752197265625, 1.06396484375, 1.1527099609375, 1.241455078125, 1.3302001953125, 1.4189453125, 1.5076904296875, 1.596435546875, 1.6851806640625, 1.77392578125, 1.8626708984375, 1.951416015625, 2.0401611328125, 2.12890625, 2.2176513671875, 2.306396484375, 2.3951416015625, 2.48388671875, 2.5726318359375, 2.661376953125, 2.7501220703125, 2.8388671875, 2.9276123046875, 3.016357421875, 3.1051025390625, 3.19384765625, 3.2825927734375, 3.371337890625, 3.4600830078125, 3.548828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 13.0, 8.0, 19.0, 41.0, 76.0, 127.0, 165.0, 190.0, 151.0, 84.0, 63.0, 26.0, 12.0, 13.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.4765625, -3.4074172973632812, -3.3382720947265625, -3.2691268920898438, -3.199981689453125, -3.1308364868164062, -3.0616912841796875, -2.9925460815429688, -2.92340087890625, -2.8542556762695312, -2.7851104736328125, -2.7159652709960938, -2.646820068359375, -2.5776748657226562, -2.5085296630859375, -2.4393844604492188, -2.3702392578125, -2.3010940551757812, -2.2319488525390625, -2.1628036499023438, -2.093658447265625, -2.0245132446289062, -1.9553680419921875, -1.8862228393554688, -1.81707763671875, -1.7479324340820312, -1.6787872314453125, -1.6096420288085938, -1.540496826171875, -1.4713516235351562, -1.4022064208984375, -1.3330612182617188, -1.263916015625, -1.1947708129882812, -1.1256256103515625, -1.0564804077148438, -0.987335205078125, -0.9181900024414062, -0.8490447998046875, -0.7798995971679688, -0.71075439453125, -0.6416091918945312, -0.5724639892578125, -0.5033187866210938, -0.434173583984375, -0.36502838134765625, -0.2958831787109375, -0.22673797607421875, -0.1575927734375, -0.08844757080078125, -0.0193023681640625, 0.04984283447265625, 0.118988037109375, 0.18813323974609375, 0.2572784423828125, 0.32642364501953125, 0.39556884765625, 0.46471405029296875, 0.5338592529296875, 0.6030044555664062, 0.672149658203125, 0.7412948608398438, 0.8104400634765625, 0.8795852661132812, 0.94873046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 13.0, 34.0, 74.0, 180.0, 286.0, 231.0, 122.0, 36.0, 12.0, 12.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703693389892578, -15.476158142089844, -14.248623847961426, -13.021089553833008, -11.793554306030273, -10.566019058227539, -9.338484764099121, -8.110950469970703, -6.883415222167969, -5.655880451202393, -4.428345680236816, -3.2008109092712402, -1.973276138305664, -0.7457413673400879, 0.4817934036254883, 1.7093276977539062, 2.9368629455566406, 4.164397716522217, 5.391932487487793, 6.619467258453369, 7.847002029418945, 9.07453727722168, 10.302071571350098, 11.529605865478516, 12.75714111328125, 13.984676361083984, 15.212210655212402, 16.43974494934082, 17.667280197143555, 18.89481544494629, 20.12234878540039, 21.349884033203125, 22.577415466308594, 23.804950714111328, 25.032485961914062, 26.260019302368164, 27.4875545501709, 28.715089797973633, 29.942623138427734, 31.17015838623047, 32.3976936340332, 33.62522888183594, 34.85276412963867, 36.080299377441406, 37.307830810546875, 38.53536605834961, 39.762901306152344, 40.99043655395508, 42.21797180175781, 43.44550704956055, 44.67304229736328, 45.900577545166016, 47.12811279296875, 48.35564422607422, 49.58317947387695, 50.81071472167969, 52.03824996948242, 53.265785217285156, 54.49332046508789, 55.720855712890625, 56.948387145996094, 58.17592239379883, 59.40345764160156, 60.6309928894043, 61.85852813720703]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 9.0, 13.0, 22.0, 21.0, 19.0, 21.0, 35.0, 35.0, 29.0, 47.0, 55.0, 71.0, 53.0, 70.0, 53.0, 75.0, 52.0, 47.0, 47.0, 49.0, 32.0, 29.0, 17.0, 15.0, 16.0, 14.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.874217987060547, -18.343677520751953, -17.813138961791992, -17.2825984954834, -16.752058029174805, -16.221519470214844, -15.69097900390625, -15.160439491271973, -14.629899978637695, -14.099360466003418, -13.568819999694824, -13.038280487060547, -12.50774097442627, -11.977201461791992, -11.446660995483398, -10.916121482849121, -10.385581016540527, -9.85504150390625, -9.324501037597656, -8.793961524963379, -8.263422012329102, -7.732882022857666, -7.2023420333862305, -6.671802520751953, -6.141262531280518, -5.610722541809082, -5.080183029174805, -4.549643039703369, -4.019103050231934, -3.4885635375976562, -2.9580235481262207, -2.4274837970733643, -1.8969440460205078, -1.3664042949676514, -0.8358644247055054, -0.3053245544433594, 0.22521519660949707, 0.7557549476623535, 1.286294937133789, 1.8168346881866455, 2.347374439239502, 2.8779141902923584, 3.408453941345215, 3.9389939308166504, 4.469533920288086, 5.000073432922363, 5.530613422393799, 6.061153411865234, 6.591692924499512, 7.122232913970947, 7.652772426605225, 8.18331241607666, 8.713851928710938, 9.244392395019531, 9.774931907653809, 10.305471420288086, 10.83601188659668, 11.366551399230957, 11.89709186553955, 12.427631378173828, 12.958170890808105, 13.488710403442383, 14.019250869750977, 14.549790382385254, 15.080329895019531]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 10.0, 25.0, 36.0, 37.0, 64.0, 76.0, 125.0, 161.0, 311.0, 541.0, 1045.0, 2609.0, 9764.0, 304368.0, 3857752.0, 11778.0, 2905.0, 1116.0, 563.0, 315.0, 220.0, 144.0, 82.0, 58.0, 35.0, 36.0, 27.0, 11.0, 9.0, 5.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.823699951171875, -1.75091552734375, -1.678131103515625, -1.6053466796875, -1.532562255859375, -1.45977783203125, -1.386993408203125, -1.314208984375, -1.241424560546875, -1.16864013671875, -1.095855712890625, -1.0230712890625, -0.950286865234375, -0.87750244140625, -0.804718017578125, -0.73193359375, -0.659149169921875, -0.58636474609375, -0.513580322265625, -0.4407958984375, -0.368011474609375, -0.29522705078125, -0.222442626953125, -0.149658203125, -0.076873779296875, -0.00408935546875, 0.068695068359375, 0.1414794921875, 0.214263916015625, 0.28704833984375, 0.359832763671875, 0.4326171875, 0.505401611328125, 0.57818603515625, 0.650970458984375, 0.7237548828125, 0.796539306640625, 0.86932373046875, 0.942108154296875, 1.014892578125, 1.087677001953125, 1.16046142578125, 1.233245849609375, 1.3060302734375, 1.378814697265625, 1.45159912109375, 1.524383544921875, 1.59716796875, 1.669952392578125, 1.74273681640625, 1.815521240234375, 1.8883056640625, 1.961090087890625, 2.03387451171875, 2.106658935546875, 2.179443359375, 2.252227783203125, 2.32501220703125, 2.397796630859375, 2.4705810546875, 2.543365478515625, 2.61614990234375, 2.688934326171875, 2.76171875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 13.0, 7.0, 19.0, 27.0, 21.0, 29.0, 46.0, 67.0, 65.0, 67.0, 71.0, 62.0, 82.0, 71.0, 61.0, 54.0, 54.0, 40.0, 40.0, 21.0, 13.0, 12.0, 14.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8555984497070312, -0.8274078369140625, -0.7992172241210938, -0.771026611328125, -0.7428359985351562, -0.7146453857421875, -0.6864547729492188, -0.65826416015625, -0.6300735473632812, -0.6018829345703125, -0.5736923217773438, -0.545501708984375, -0.5173110961914062, -0.4891204833984375, -0.46092987060546875, -0.4327392578125, -0.40454864501953125, -0.3763580322265625, -0.34816741943359375, -0.319976806640625, -0.29178619384765625, -0.2635955810546875, -0.23540496826171875, -0.20721435546875, -0.17902374267578125, -0.1508331298828125, -0.12264251708984375, -0.094451904296875, -0.06626129150390625, -0.0380706787109375, -0.00988006591796875, 0.018310546875, 0.04650115966796875, 0.0746917724609375, 0.10288238525390625, 0.131072998046875, 0.15926361083984375, 0.1874542236328125, 0.21564483642578125, 0.24383544921875, 0.27202606201171875, 0.3002166748046875, 0.32840728759765625, 0.356597900390625, 0.38478851318359375, 0.4129791259765625, 0.44116973876953125, 0.4693603515625, 0.49755096435546875, 0.5257415771484375, 0.5539321899414062, 0.582122802734375, 0.6103134155273438, 0.6385040283203125, 0.6666946411132812, 0.69488525390625, 0.7230758666992188, 0.7512664794921875, 0.7794570922851562, 0.807647705078125, 0.8358383178710938, 0.8640289306640625, 0.8922195434570312, 0.92041015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 16.0, 21.0, 22.0, 33.0, 22.0, 34.0, 51.0, 66.0, 103.0, 138.0, 251.0, 483.0, 914.0, 1985.0, 5531.0, 25656.0, 3917987.0, 219870.0, 13881.0, 3851.0, 1481.0, 722.0, 391.0, 211.0, 138.0, 103.0, 55.0, 51.0, 34.0, 29.0, 26.0, 24.0, 15.0, 13.0, 11.0, 9.0, 5.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.845703125, -2.756317138671875, -2.66693115234375, -2.577545166015625, -2.4881591796875, -2.398773193359375, -2.30938720703125, -2.220001220703125, -2.130615234375, -2.041229248046875, -1.95184326171875, -1.862457275390625, -1.7730712890625, -1.683685302734375, -1.59429931640625, -1.504913330078125, -1.41552734375, -1.326141357421875, -1.23675537109375, -1.147369384765625, -1.0579833984375, -0.968597412109375, -0.87921142578125, -0.789825439453125, -0.700439453125, -0.611053466796875, -0.52166748046875, -0.432281494140625, -0.3428955078125, -0.253509521484375, -0.16412353515625, -0.074737548828125, 0.0146484375, 0.104034423828125, 0.19342041015625, 0.282806396484375, 0.3721923828125, 0.461578369140625, 0.55096435546875, 0.640350341796875, 0.729736328125, 0.819122314453125, 0.90850830078125, 0.997894287109375, 1.0872802734375, 1.176666259765625, 1.26605224609375, 1.355438232421875, 1.44482421875, 1.534210205078125, 1.62359619140625, 1.712982177734375, 1.8023681640625, 1.891754150390625, 1.98114013671875, 2.070526123046875, 2.159912109375, 2.249298095703125, 2.33868408203125, 2.428070068359375, 2.5174560546875, 2.606842041015625, 2.69622802734375, 2.785614013671875, 2.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 6.0, 19.0, 26.0, 92.0, 497.0, 3242.0, 112.0, 41.0, 14.0, 15.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8322677612304688, -0.8046722412109375, -0.7770767211914062, -0.749481201171875, -0.7218856811523438, -0.6942901611328125, -0.6666946411132812, -0.63909912109375, -0.6115036010742188, -0.5839080810546875, -0.5563125610351562, -0.528717041015625, -0.5011215209960938, -0.4735260009765625, -0.44593048095703125, -0.4183349609375, -0.39073944091796875, -0.3631439208984375, -0.33554840087890625, -0.307952880859375, -0.28035736083984375, -0.2527618408203125, -0.22516632080078125, -0.19757080078125, -0.16997528076171875, -0.1423797607421875, -0.11478424072265625, -0.087188720703125, -0.05959320068359375, -0.0319976806640625, -0.00440216064453125, 0.023193359375, 0.05078887939453125, 0.0783843994140625, 0.10597991943359375, 0.133575439453125, 0.16117095947265625, 0.1887664794921875, 0.21636199951171875, 0.24395751953125, 0.27155303955078125, 0.2991485595703125, 0.32674407958984375, 0.354339599609375, 0.38193511962890625, 0.4095306396484375, 0.43712615966796875, 0.4647216796875, 0.49231719970703125, 0.5199127197265625, 0.5475082397460938, 0.575103759765625, 0.6026992797851562, 0.6302947998046875, 0.6578903198242188, 0.68548583984375, 0.7130813598632812, 0.7406768798828125, 0.7682723999023438, 0.795867919921875, 0.8234634399414062, 0.8510589599609375, 0.8786544799804688, 0.90625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 13.0, 28.0, 38.0, 57.0, 103.0, 162.0, 177.0, 158.0, 119.0, 56.0, 27.0, 14.0, 14.0, 10.0, 7.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.837955951690674, -2.7528116703033447, -2.6676676273345947, -2.5825233459472656, -2.4973790645599365, -2.4122347831726074, -2.3270907402038574, -2.2419464588165283, -2.156802177429199, -2.07165789604187, -1.9865137338638306, -1.901369571685791, -1.816225290298462, -1.7310811281204224, -1.6459369659423828, -1.5607926845550537, -1.4756485223770142, -1.3905043601989746, -1.3053600788116455, -1.220215916633606, -1.1350716352462769, -1.0499274730682373, -0.964783251285553, -0.8796390295028687, -0.7944948077201843, -0.7093505859375, -0.6242063641548157, -0.5390621423721313, -0.4539179503917694, -0.3687737286090851, -0.28362953662872314, -0.19848531484603882, -0.11334109306335449, -0.028196878731250763, 0.056947335600852966, 0.1420915424823761, 0.22723576426506042, 0.31237998604774475, 0.3975241780281067, 0.482668399810791, 0.5678126215934753, 0.6529568433761597, 0.738101065158844, 0.8232452869415283, 0.9083894491195679, 0.993533730506897, 1.0786778926849365, 1.1638221740722656, 1.2489663362503052, 1.3341104984283447, 1.4192547798156738, 1.5043989419937134, 1.5895432233810425, 1.674687385559082, 1.7598316669464111, 1.8449758291244507, 1.9301199913024902, 2.0152642726898193, 2.1004083156585693, 2.1855525970458984, 2.2706968784332275, 2.3558411598205566, 2.4409852027893066, 2.5261294841766357, 2.611273765563965]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 5.0, 10.0, 3.0, 2.0, 10.0, 11.0, 13.0, 16.0, 19.0, 18.0, 18.0, 13.0, 16.0, 30.0, 36.0, 35.0, 28.0, 43.0, 48.0, 35.0, 52.0, 38.0, 46.0, 44.0, 51.0, 41.0, 44.0, 42.0, 30.0, 27.0, 25.0, 15.0, 25.0, 19.0, 15.0, 16.0, 10.0, 7.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.004260778427124, -0.9713153839111328, -0.9383699893951416, -0.9054246544837952, -0.872479259967804, -0.8395338654518127, -0.8065885305404663, -0.7736431360244751, -0.7406977415084839, -0.7077523469924927, -0.6748069524765015, -0.641861617565155, -0.6089162230491638, -0.5759708285331726, -0.5430254936218262, -0.510080099105835, -0.47713470458984375, -0.44418931007385254, -0.4112439453601837, -0.3782985806465149, -0.3453531861305237, -0.31240779161453247, -0.27946242690086365, -0.24651704728603363, -0.2135716676712036, -0.1806262880563736, -0.14768090844154358, -0.11473552882671356, -0.08179014921188354, -0.04884476959705353, -0.01589938998222351, 0.017045989632606506, 0.04999136924743652, 0.08293674886226654, 0.11588212847709656, 0.14882750809192657, 0.1817728877067566, 0.2147182673215866, 0.24766364693641663, 0.28060901165008545, 0.31355440616607666, 0.34649980068206787, 0.3794451653957367, 0.4123905301094055, 0.44533592462539673, 0.47828131914138794, 0.5112266540527344, 0.5441720485687256, 0.5771174430847168, 0.610062837600708, 0.6430082321166992, 0.6759535670280457, 0.7088989615440369, 0.7418443560600281, 0.7747896909713745, 0.8077350854873657, 0.8406804800033569, 0.8736258745193481, 0.9065712690353394, 0.9395166039466858, 0.972461998462677, 1.0054073333740234, 1.0383527278900146, 1.0712981224060059, 1.104243516921997]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 8.0, 7.0, 6.0, 9.0, 8.0, 20.0, 44.0, 54.0, 99.0, 187.0, 358.0, 706.0, 1509.0, 3615.0, 9928.0, 32428.0, 135364.0, 510995.0, 268633.0, 58627.0, 16090.0, 5502.0, 2235.0, 1005.0, 517.0, 268.0, 133.0, 80.0, 52.0, 25.0, 17.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.67413330078125, -1.6285400390625, -1.58294677734375, -1.537353515625, -1.49176025390625, -1.4461669921875, -1.40057373046875, -1.35498046875, -1.30938720703125, -1.2637939453125, -1.21820068359375, -1.172607421875, -1.12701416015625, -1.0814208984375, -1.03582763671875, -0.990234375, -0.94464111328125, -0.8990478515625, -0.85345458984375, -0.807861328125, -0.76226806640625, -0.7166748046875, -0.67108154296875, -0.62548828125, -0.57989501953125, -0.5343017578125, -0.48870849609375, -0.443115234375, -0.39752197265625, -0.3519287109375, -0.30633544921875, -0.2607421875, -0.21514892578125, -0.1695556640625, -0.12396240234375, -0.078369140625, -0.03277587890625, 0.0128173828125, 0.05841064453125, 0.10400390625, 0.14959716796875, 0.1951904296875, 0.24078369140625, 0.286376953125, 0.33197021484375, 0.3775634765625, 0.42315673828125, 0.46875, 0.51434326171875, 0.5599365234375, 0.60552978515625, 0.651123046875, 0.69671630859375, 0.7423095703125, 0.78790283203125, 0.83349609375, 0.87908935546875, 0.9246826171875, 0.97027587890625, 1.015869140625, 1.06146240234375, 1.1070556640625, 1.15264892578125, 1.1982421875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 13.0, 19.0, 18.0, 25.0, 27.0, 33.0, 30.0, 56.0, 42.0, 54.0, 55.0, 52.0, 56.0, 57.0, 58.0, 49.0, 48.0, 50.0, 48.0, 43.0, 25.0, 26.0, 21.0, 11.0, 14.0, 7.0, 11.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7079238891601562, -0.6829376220703125, -0.6579513549804688, -0.632965087890625, -0.6079788208007812, -0.5829925537109375, -0.5580062866210938, -0.53302001953125, -0.5080337524414062, -0.4830474853515625, -0.45806121826171875, -0.433074951171875, -0.40808868408203125, -0.3831024169921875, -0.35811614990234375, -0.3331298828125, -0.30814361572265625, -0.2831573486328125, -0.25817108154296875, -0.233184814453125, -0.20819854736328125, -0.1832122802734375, -0.15822601318359375, -0.13323974609375, -0.10825347900390625, -0.0832672119140625, -0.05828094482421875, -0.033294677734375, -0.00830841064453125, 0.0166778564453125, 0.04166412353515625, 0.066650390625, 0.09163665771484375, 0.1166229248046875, 0.14160919189453125, 0.166595458984375, 0.19158172607421875, 0.2165679931640625, 0.24155426025390625, 0.26654052734375, 0.29152679443359375, 0.3165130615234375, 0.34149932861328125, 0.366485595703125, 0.39147186279296875, 0.4164581298828125, 0.44144439697265625, 0.4664306640625, 0.49141693115234375, 0.5164031982421875, 0.5413894653320312, 0.566375732421875, 0.5913619995117188, 0.6163482666015625, 0.6413345336914062, 0.66632080078125, 0.6913070678710938, 0.7162933349609375, 0.7412796020507812, 0.766265869140625, 0.7912521362304688, 0.8162384033203125, 0.8412246704101562, 0.8662109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 19.0, 13.0, 37.0, 42.0, 69.0, 109.0, 216.0, 434.0, 911.0, 2455.0, 10777.0, 98940.0, 811096.0, 107570.0, 11226.0, 2640.0, 975.0, 446.0, 203.0, 122.0, 75.0, 50.0, 31.0, 22.0, 15.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.93902587890625, -1.8565673828125, -1.77410888671875, -1.691650390625, -1.60919189453125, -1.5267333984375, -1.44427490234375, -1.36181640625, -1.27935791015625, -1.1968994140625, -1.11444091796875, -1.031982421875, -0.94952392578125, -0.8670654296875, -0.78460693359375, -0.7021484375, -0.61968994140625, -0.5372314453125, -0.45477294921875, -0.372314453125, -0.28985595703125, -0.2073974609375, -0.12493896484375, -0.04248046875, 0.03997802734375, 0.1224365234375, 0.20489501953125, 0.287353515625, 0.36981201171875, 0.4522705078125, 0.53472900390625, 0.6171875, 0.69964599609375, 0.7821044921875, 0.86456298828125, 0.947021484375, 1.02947998046875, 1.1119384765625, 1.19439697265625, 1.27685546875, 1.35931396484375, 1.4417724609375, 1.52423095703125, 1.606689453125, 1.68914794921875, 1.7716064453125, 1.85406494140625, 1.9365234375, 2.01898193359375, 2.1014404296875, 2.18389892578125, 2.266357421875, 2.34881591796875, 2.4312744140625, 2.51373291015625, 2.59619140625, 2.67864990234375, 2.7611083984375, 2.84356689453125, 2.926025390625, 3.00848388671875, 3.0909423828125, 3.17340087890625, 3.255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 14.0, 16.0, 17.0, 20.0, 31.0, 42.0, 36.0, 52.0, 73.0, 67.0, 82.0, 77.0, 58.0, 58.0, 60.0, 67.0, 56.0, 52.0, 29.0, 27.0, 20.0, 14.0, 13.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.291046142578125, -6.14068603515625, -5.990325927734375, -5.8399658203125, -5.689605712890625, -5.53924560546875, -5.388885498046875, -5.238525390625, -5.088165283203125, -4.93780517578125, -4.787445068359375, -4.6370849609375, -4.486724853515625, -4.33636474609375, -4.186004638671875, -4.03564453125, -3.885284423828125, -3.73492431640625, -3.584564208984375, -3.4342041015625, -3.283843994140625, -3.13348388671875, -2.983123779296875, -2.832763671875, -2.682403564453125, -2.53204345703125, -2.381683349609375, -2.2313232421875, -2.080963134765625, -1.93060302734375, -1.780242919921875, -1.6298828125, -1.479522705078125, -1.32916259765625, -1.178802490234375, -1.0284423828125, -0.878082275390625, -0.72772216796875, -0.577362060546875, -0.427001953125, -0.276641845703125, -0.12628173828125, 0.024078369140625, 0.1744384765625, 0.324798583984375, 0.47515869140625, 0.625518798828125, 0.77587890625, 0.926239013671875, 1.07659912109375, 1.226959228515625, 1.3773193359375, 1.527679443359375, 1.67803955078125, 1.828399658203125, 1.978759765625, 2.129119873046875, 2.27947998046875, 2.429840087890625, 2.5802001953125, 2.730560302734375, 2.88092041015625, 3.031280517578125, 3.181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 12.0, 13.0, 28.0, 46.0, 125.0, 325.0, 1548.0, 28577.0, 999236.0, 16801.0, 1319.0, 306.0, 99.0, 42.0, 13.0, 14.0, 15.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8828125, -2.8078155517578125, -2.732818603515625, -2.6578216552734375, -2.58282470703125, -2.5078277587890625, -2.432830810546875, -2.3578338623046875, -2.2828369140625, -2.2078399658203125, -2.132843017578125, -2.0578460693359375, -1.98284912109375, -1.9078521728515625, -1.832855224609375, -1.7578582763671875, -1.682861328125, -1.6078643798828125, -1.532867431640625, -1.4578704833984375, -1.38287353515625, -1.3078765869140625, -1.232879638671875, -1.1578826904296875, -1.0828857421875, -1.0078887939453125, -0.932891845703125, -0.8578948974609375, -0.78289794921875, -0.7079010009765625, -0.632904052734375, -0.5579071044921875, -0.48291015625, -0.4079132080078125, -0.332916259765625, -0.2579193115234375, -0.18292236328125, -0.1079254150390625, -0.032928466796875, 0.0420684814453125, 0.1170654296875, 0.1920623779296875, 0.267059326171875, 0.3420562744140625, 0.41705322265625, 0.4920501708984375, 0.567047119140625, 0.6420440673828125, 0.717041015625, 0.7920379638671875, 0.867034912109375, 0.9420318603515625, 1.01702880859375, 1.0920257568359375, 1.167022705078125, 1.2420196533203125, 1.3170166015625, 1.3920135498046875, 1.467010498046875, 1.5420074462890625, 1.61700439453125, 1.6920013427734375, 1.766998291015625, 1.8419952392578125, 1.9169921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 9.0, 11.0, 14.0, 37.0, 53.0, 100.0, 161.0, 207.0, 172.0, 100.0, 53.0, 40.0, 16.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002536773681640625, -0.00024447590112686157, -0.00023527443408966064, -0.00022607296705245972, -0.0002168715000152588, -0.00020767003297805786, -0.00019846856594085693, -0.000189267098903656, -0.00018006563186645508, -0.00017086416482925415, -0.00016166269779205322, -0.0001524612307548523, -0.00014325976371765137, -0.00013405829668045044, -0.0001248568296432495, -0.00011565536260604858, -0.00010645389556884766, -9.725242853164673e-05, -8.80509614944458e-05, -7.884949445724487e-05, -6.964802742004395e-05, -6.044656038284302e-05, -5.124509334564209e-05, -4.204362630844116e-05, -3.2842159271240234e-05, -2.3640692234039307e-05, -1.4439225196838379e-05, -5.237758159637451e-06, 3.9637088775634766e-06, 1.3165175914764404e-05, 2.2366642951965332e-05, 3.156810998916626e-05, 4.076957702636719e-05, 4.9971044063568115e-05, 5.917251110076904e-05, 6.837397813796997e-05, 7.75754451751709e-05, 8.677691221237183e-05, 9.597837924957275e-05, 0.00010517984628677368, 0.00011438131332397461, 0.00012358278036117554, 0.00013278424739837646, 0.0001419857144355774, 0.00015118718147277832, 0.00016038864850997925, 0.00016959011554718018, 0.0001787915825843811, 0.00018799304962158203, 0.00019719451665878296, 0.0002063959836959839, 0.00021559745073318481, 0.00022479891777038574, 0.00023400038480758667, 0.0002432018518447876, 0.0002524033188819885, 0.00026160478591918945, 0.0002708062529563904, 0.0002800077199935913, 0.00028920918703079224, 0.00029841065406799316, 0.0003076121211051941, 0.000316813588142395, 0.00032601505517959595, 0.0003352165222167969]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 22.0, 37.0, 100.0, 216.0, 569.0, 1768.0, 9956.0, 290515.0, 724286.0, 17338.0, 2447.0, 734.0, 260.0, 124.0, 68.0, 36.0, 14.0, 11.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6318359375, -1.5793914794921875, -1.526947021484375, -1.4745025634765625, -1.42205810546875, -1.3696136474609375, -1.317169189453125, -1.2647247314453125, -1.2122802734375, -1.1598358154296875, -1.107391357421875, -1.0549468994140625, -1.00250244140625, -0.9500579833984375, -0.897613525390625, -0.8451690673828125, -0.792724609375, -0.7402801513671875, -0.687835693359375, -0.6353912353515625, -0.58294677734375, -0.5305023193359375, -0.478057861328125, -0.4256134033203125, -0.3731689453125, -0.3207244873046875, -0.268280029296875, -0.2158355712890625, -0.16339111328125, -0.1109466552734375, -0.058502197265625, -0.0060577392578125, 0.04638671875, 0.0988311767578125, 0.151275634765625, 0.2037200927734375, 0.25616455078125, 0.3086090087890625, 0.361053466796875, 0.4134979248046875, 0.4659423828125, 0.5183868408203125, 0.570831298828125, 0.6232757568359375, 0.67572021484375, 0.7281646728515625, 0.780609130859375, 0.8330535888671875, 0.885498046875, 0.9379425048828125, 0.990386962890625, 1.0428314208984375, 1.09527587890625, 1.1477203369140625, 1.200164794921875, 1.2526092529296875, 1.3050537109375, 1.3574981689453125, 1.409942626953125, 1.4623870849609375, 1.51483154296875, 1.5672760009765625, 1.619720458984375, 1.6721649169921875, 1.724609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 12.0, 8.0, 24.0, 27.0, 48.0, 60.0, 84.0, 133.0, 130.0, 121.0, 112.0, 82.0, 55.0, 37.0, 23.0, 17.0, 6.0, 5.0, 8.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8916091918945312, -0.8569488525390625, -0.8222885131835938, -0.787628173828125, -0.7529678344726562, -0.7183074951171875, -0.6836471557617188, -0.64898681640625, -0.6143264770507812, -0.5796661376953125, -0.5450057983398438, -0.510345458984375, -0.47568511962890625, -0.4410247802734375, -0.40636444091796875, -0.3717041015625, -0.33704376220703125, -0.3023834228515625, -0.26772308349609375, -0.233062744140625, -0.19840240478515625, -0.1637420654296875, -0.12908172607421875, -0.09442138671875, -0.05976104736328125, -0.0251007080078125, 0.00955963134765625, 0.044219970703125, 0.07888031005859375, 0.1135406494140625, 0.14820098876953125, 0.182861328125, 0.21752166748046875, 0.2521820068359375, 0.28684234619140625, 0.321502685546875, 0.35616302490234375, 0.3908233642578125, 0.42548370361328125, 0.46014404296875, 0.49480438232421875, 0.5294647216796875, 0.5641250610351562, 0.598785400390625, 0.6334457397460938, 0.6681060791015625, 0.7027664184570312, 0.7374267578125, 0.7720870971679688, 0.8067474365234375, 0.8414077758789062, 0.876068115234375, 0.9107284545898438, 0.9453887939453125, 0.9800491333007812, 1.01470947265625, 1.0493698120117188, 1.0840301513671875, 1.1186904907226562, 1.153350830078125, 1.1880111694335938, 1.2226715087890625, 1.2573318481445312, 1.2919921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 12.0, 25.0, 25.0, 47.0, 107.0, 141.0, 190.0, 191.0, 117.0, 54.0, 27.0, 25.0, 9.0, 6.0, 1.0, 5.0, 1.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.30942153930664, -13.776330947875977, -13.243239402770996, -12.710147857666016, -12.177057266235352, -11.643966674804688, -11.110875129699707, -10.577783584594727, -10.044692993164062, -9.511602401733398, -8.978510856628418, -8.445419311523438, -7.912328720092773, -7.379237651824951, -6.846146583557129, -6.313055515289307, -5.779964447021484, -5.246873378753662, -4.71378231048584, -4.180691242218018, -3.6476001739501953, -3.114509105682373, -2.581418037414551, -2.0483269691467285, -1.5152359008789062, -0.982144832611084, -0.4490537643432617, 0.08403730392456055, 0.6171283721923828, 1.150219440460205, 1.6833105087280273, 2.2164015769958496, 2.749490737915039, 3.2825818061828613, 3.8156728744506836, 4.348763942718506, 4.881855010986328, 5.41494607925415, 5.948037147521973, 6.481128215789795, 7.014219284057617, 7.5473103523254395, 8.080401420593262, 8.613492965698242, 9.146583557128906, 9.67967414855957, 10.21276569366455, 10.745857238769531, 11.278947830200195, 11.81203842163086, 12.34512996673584, 12.87822151184082, 13.411312103271484, 13.944402694702148, 14.477494239807129, 15.01058578491211, 15.543676376342773, 16.076766967773438, 16.609859466552734, 17.1429500579834, 17.676040649414062, 18.209131240844727, 18.74222183227539, 19.275314331054688, 19.80840492248535]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 11.0, 7.0, 7.0, 10.0, 12.0, 18.0, 22.0, 25.0, 26.0, 30.0, 30.0, 55.0, 53.0, 62.0, 64.0, 70.0, 56.0, 63.0, 53.0, 57.0, 51.0, 41.0, 32.0, 31.0, 19.0, 20.0, 16.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.503167152404785, -14.96397590637207, -14.424785614013672, -13.885594367980957, -13.346403121948242, -12.807212829589844, -12.268021583557129, -11.728830337524414, -11.189640045166016, -10.6504487991333, -10.111258506774902, -9.572067260742188, -9.032876968383789, -8.493685722351074, -7.954494476318359, -7.415303707122803, -6.876112937927246, -6.3369221687316895, -5.797731399536133, -5.258540153503418, -4.719349384307861, -4.180158615112305, -3.640967607498169, -3.101776599884033, -2.5625858306884766, -2.02339506149292, -1.4842040538787842, -0.945013165473938, -0.4058222770690918, 0.13336849212646484, 0.6725594997406006, 1.2117505073547363, 1.7509422302246094, 2.290132999420166, 2.8293240070343018, 3.3685150146484375, 3.907705783843994, 4.446896553039551, 4.986087799072266, 5.525278568267822, 6.064469337463379, 6.6036601066589355, 7.142850875854492, 7.682042121887207, 8.221233367919922, 8.76042366027832, 9.299614906311035, 9.83880615234375, 10.377996444702148, 10.917187690734863, 11.456377983093262, 11.995569229125977, 12.534759521484375, 13.07395076751709, 13.613142013549805, 14.152332305908203, 14.691523551940918, 15.230714797973633, 15.769905090332031, 16.30909538269043, 16.84828758239746, 17.38747787475586, 17.926668167114258, 18.46586036682129, 19.005050659179688]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 16.0, 21.0, 32.0, 46.0, 53.0, 82.0, 118.0, 194.0, 353.0, 675.0, 1837.0, 6241.0, 85784.0, 4073411.0, 19542.0, 3417.0, 1171.0, 517.0, 279.0, 151.0, 108.0, 80.0, 52.0, 43.0, 21.0, 12.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.478515625, -2.3992919921875, -2.320068359375, -2.2408447265625, -2.16162109375, -2.0823974609375, -2.003173828125, -1.9239501953125, -1.8447265625, -1.7655029296875, -1.686279296875, -1.6070556640625, -1.52783203125, -1.4486083984375, -1.369384765625, -1.2901611328125, -1.2109375, -1.1317138671875, -1.052490234375, -0.9732666015625, -0.89404296875, -0.8148193359375, -0.735595703125, -0.6563720703125, -0.5771484375, -0.4979248046875, -0.418701171875, -0.3394775390625, -0.26025390625, -0.1810302734375, -0.101806640625, -0.0225830078125, 0.056640625, 0.1358642578125, 0.215087890625, 0.2943115234375, 0.37353515625, 0.4527587890625, 0.531982421875, 0.6112060546875, 0.6904296875, 0.7696533203125, 0.848876953125, 0.9281005859375, 1.00732421875, 1.0865478515625, 1.165771484375, 1.2449951171875, 1.32421875, 1.4034423828125, 1.482666015625, 1.5618896484375, 1.64111328125, 1.7203369140625, 1.799560546875, 1.8787841796875, 1.9580078125, 2.0372314453125, 2.116455078125, 2.1956787109375, 2.27490234375, 2.3541259765625, 2.433349609375, 2.5125732421875, 2.591796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 25.0, 24.0, 41.0, 50.0, 74.0, 83.0, 108.0, 88.0, 105.0, 94.0, 78.0, 88.0, 46.0, 32.0, 14.0, 15.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.787109375, -1.7452392578125, -1.703369140625, -1.6614990234375, -1.61962890625, -1.5777587890625, -1.535888671875, -1.4940185546875, -1.4521484375, -1.4102783203125, -1.368408203125, -1.3265380859375, -1.28466796875, -1.2427978515625, -1.200927734375, -1.1590576171875, -1.1171875, -1.0753173828125, -1.033447265625, -0.9915771484375, -0.94970703125, -0.9078369140625, -0.865966796875, -0.8240966796875, -0.7822265625, -0.7403564453125, -0.698486328125, -0.6566162109375, -0.61474609375, -0.5728759765625, -0.531005859375, -0.4891357421875, -0.447265625, -0.4053955078125, -0.363525390625, -0.3216552734375, -0.27978515625, -0.2379150390625, -0.196044921875, -0.1541748046875, -0.1123046875, -0.0704345703125, -0.028564453125, 0.0133056640625, 0.05517578125, 0.0970458984375, 0.138916015625, 0.1807861328125, 0.22265625, 0.2645263671875, 0.306396484375, 0.3482666015625, 0.39013671875, 0.4320068359375, 0.473876953125, 0.5157470703125, 0.5576171875, 0.5994873046875, 0.641357421875, 0.6832275390625, 0.72509765625, 0.7669677734375, 0.808837890625, 0.8507080078125, 0.892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 7.0, 6.0, 8.0, 15.0, 19.0, 24.0, 35.0, 41.0, 69.0, 70.0, 120.0, 199.0, 254.0, 420.0, 735.0, 1528.0, 3866.0, 18520.0, 390544.0, 3734189.0, 33459.0, 5948.0, 1900.0, 833.0, 482.0, 316.0, 196.0, 126.0, 90.0, 61.0, 49.0, 28.0, 26.0, 25.0, 8.0, 19.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.94647216796875, -1.8773193359375, -1.80816650390625, -1.739013671875, -1.66986083984375, -1.6007080078125, -1.53155517578125, -1.46240234375, -1.39324951171875, -1.3240966796875, -1.25494384765625, -1.185791015625, -1.11663818359375, -1.0474853515625, -0.97833251953125, -0.9091796875, -0.84002685546875, -0.7708740234375, -0.70172119140625, -0.632568359375, -0.56341552734375, -0.4942626953125, -0.42510986328125, -0.35595703125, -0.28680419921875, -0.2176513671875, -0.14849853515625, -0.079345703125, -0.01019287109375, 0.0589599609375, 0.12811279296875, 0.197265625, 0.26641845703125, 0.3355712890625, 0.40472412109375, 0.473876953125, 0.54302978515625, 0.6121826171875, 0.68133544921875, 0.75048828125, 0.81964111328125, 0.8887939453125, 0.95794677734375, 1.027099609375, 1.09625244140625, 1.1654052734375, 1.23455810546875, 1.3037109375, 1.37286376953125, 1.4420166015625, 1.51116943359375, 1.580322265625, 1.64947509765625, 1.7186279296875, 1.78778076171875, 1.85693359375, 1.92608642578125, 1.9952392578125, 2.06439208984375, 2.133544921875, 2.20269775390625, 2.2718505859375, 2.34100341796875, 2.41015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 16.0, 25.0, 56.0, 139.0, 593.0, 2767.0, 271.0, 96.0, 37.0, 19.0, 15.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -1.0012893676757812, -0.9703521728515625, -0.9394149780273438, -0.908477783203125, -0.8775405883789062, -0.8466033935546875, -0.8156661987304688, -0.78472900390625, -0.7537918090820312, -0.7228546142578125, -0.6919174194335938, -0.660980224609375, -0.6300430297851562, -0.5991058349609375, -0.5681686401367188, -0.5372314453125, -0.5062942504882812, -0.4753570556640625, -0.44441986083984375, -0.413482666015625, -0.38254547119140625, -0.3516082763671875, -0.32067108154296875, -0.28973388671875, -0.25879669189453125, -0.2278594970703125, -0.19692230224609375, -0.165985107421875, -0.13504791259765625, -0.1041107177734375, -0.07317352294921875, -0.042236328125, -0.01129913330078125, 0.0196380615234375, 0.05057525634765625, 0.081512451171875, 0.11244964599609375, 0.1433868408203125, 0.17432403564453125, 0.20526123046875, 0.23619842529296875, 0.2671356201171875, 0.29807281494140625, 0.329010009765625, 0.35994720458984375, 0.3908843994140625, 0.42182159423828125, 0.4527587890625, 0.48369598388671875, 0.5146331787109375, 0.5455703735351562, 0.576507568359375, 0.6074447631835938, 0.6383819580078125, 0.6693191528320312, 0.70025634765625, 0.7311935424804688, 0.7621307373046875, 0.7930679321289062, 0.824005126953125, 0.8549423217773438, 0.8858795166015625, 0.9168167114257812, 0.94775390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 15.0, 22.0, 48.0, 98.0, 176.0, 255.0, 221.0, 90.0, 49.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.740829467773438, -8.528131484985352, -8.315434455871582, -8.102736473083496, -7.89003849029541, -7.677340984344482, -7.464643478393555, -7.251945495605469, -7.039247989654541, -6.826550483703613, -6.613852500915527, -6.4011549949646, -6.188457489013672, -5.975759506225586, -5.763062000274658, -5.5503644943237305, -5.3376665115356445, -5.124969005584717, -4.912271022796631, -4.699573516845703, -4.486875534057617, -4.2741780281066895, -4.061480522155762, -3.848782777786255, -3.636085033416748, -3.423387289047241, -3.2106895446777344, -2.9979920387268066, -2.7852942943573, -2.572596549987793, -2.3598990440368652, -2.1472012996673584, -1.9345040321350098, -1.721806287765503, -1.5091086626052856, -1.2964110374450684, -1.0837132930755615, -0.8710155487060547, -0.6583179235458374, -0.4456202983856201, -0.23292255401611328, -0.02022486925125122, 0.19247281551361084, 0.4051705002784729, 0.617868185043335, 0.8305659294128418, 1.043263554573059, 1.2559611797332764, 1.4686589241027832, 1.68135666847229, 1.8940542936325073, 2.1067519187927246, 2.3194496631622314, 2.5321474075317383, 2.744844913482666, 2.957542657852173, 3.1702404022216797, 3.3829381465911865, 3.5956358909606934, 3.808333396911621, 4.021031379699707, 4.233728885650635, 4.4464263916015625, 4.659124374389648, 4.871821880340576]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 8.0, 7.0, 8.0, 10.0, 15.0, 14.0, 28.0, 25.0, 24.0, 19.0, 49.0, 31.0, 44.0, 51.0, 40.0, 30.0, 27.0, 43.0, 54.0, 43.0, 32.0, 35.0, 42.0, 41.0, 32.0, 32.0, 29.0, 24.0, 19.0, 24.0, 18.0, 22.0, 19.0, 11.0, 9.0, 6.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9902310371398926, -1.9276185035705566, -1.8650058507919312, -1.8023933172225952, -1.7397806644439697, -1.6771681308746338, -1.6145555973052979, -1.5519429445266724, -1.4893302917480469, -1.426717758178711, -1.3641051054000854, -1.3014925718307495, -1.238879919052124, -1.176267385482788, -1.1136548519134521, -1.0510421991348267, -0.9884296655654907, -0.92581707239151, -0.8632044792175293, -0.8005919456481934, -0.7379792928695679, -0.6753667593002319, -0.6127541661262512, -0.5501415729522705, -0.4875289797782898, -0.4249163866043091, -0.36230379343032837, -0.29969123005867004, -0.23707863688468933, -0.17446604371070862, -0.11185348033905029, -0.04924088716506958, 0.013371706008911133, 0.07598429173231125, 0.13859687745571136, 0.20120945572853088, 0.2638220489025116, 0.3264346420764923, 0.38904720544815063, 0.45165979862213135, 0.5142723917961121, 0.5768849849700928, 0.6394975781440735, 0.7021101713180542, 0.7647227048873901, 0.8273353576660156, 0.8899478912353516, 0.9525604844093323, 1.015173077583313, 1.077785611152649, 1.1403982639312744, 1.2030107975006104, 1.2656234502792358, 1.3282359838485718, 1.3908486366271973, 1.4534611701965332, 1.5160737037658691, 1.578686237335205, 1.6412988901138306, 1.7039114236831665, 1.766524076461792, 1.829136610031128, 1.8917491436004639, 1.9543617963790894, 2.016974449157715]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 7.0, 14.0, 15.0, 33.0, 57.0, 45.0, 72.0, 122.0, 224.0, 413.0, 655.0, 1446.0, 2870.0, 6991.0, 20501.0, 71745.0, 277767.0, 460655.0, 145327.0, 38844.0, 11949.0, 4526.0, 1954.0, 984.0, 522.0, 305.0, 171.0, 95.0, 84.0, 41.0, 26.0, 21.0, 14.0, 16.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0785980224609375, -1.039031982421875, -0.9994659423828125, -0.95989990234375, -0.9203338623046875, -0.880767822265625, -0.8412017822265625, -0.8016357421875, -0.7620697021484375, -0.722503662109375, -0.6829376220703125, -0.64337158203125, -0.6038055419921875, -0.564239501953125, -0.5246734619140625, -0.485107421875, -0.4455413818359375, -0.405975341796875, -0.3664093017578125, -0.32684326171875, -0.2872772216796875, -0.247711181640625, -0.2081451416015625, -0.1685791015625, -0.1290130615234375, -0.089447021484375, -0.0498809814453125, -0.01031494140625, 0.0292510986328125, 0.068817138671875, 0.1083831787109375, 0.14794921875, 0.1875152587890625, 0.227081298828125, 0.2666473388671875, 0.30621337890625, 0.3457794189453125, 0.385345458984375, 0.4249114990234375, 0.4644775390625, 0.5040435791015625, 0.543609619140625, 0.5831756591796875, 0.62274169921875, 0.6623077392578125, 0.701873779296875, 0.7414398193359375, 0.781005859375, 0.8205718994140625, 0.860137939453125, 0.8997039794921875, 0.93927001953125, 0.9788360595703125, 1.018402099609375, 1.0579681396484375, 1.0975341796875, 1.1371002197265625, 1.176666259765625, 1.2162322998046875, 1.25579833984375, 1.2953643798828125, 1.334930419921875, 1.3744964599609375, 1.4140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 17.0, 31.0, 33.0, 53.0, 65.0, 74.0, 85.0, 91.0, 89.0, 88.0, 85.0, 74.0, 49.0, 59.0, 29.0, 19.0, 14.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.435943603515625, -1.39727783203125, -1.358612060546875, -1.3199462890625, -1.281280517578125, -1.24261474609375, -1.203948974609375, -1.165283203125, -1.126617431640625, -1.08795166015625, -1.049285888671875, -1.0106201171875, -0.971954345703125, -0.93328857421875, -0.894622802734375, -0.85595703125, -0.817291259765625, -0.77862548828125, -0.739959716796875, -0.7012939453125, -0.662628173828125, -0.62396240234375, -0.585296630859375, -0.546630859375, -0.507965087890625, -0.46929931640625, -0.430633544921875, -0.3919677734375, -0.353302001953125, -0.31463623046875, -0.275970458984375, -0.2373046875, -0.198638916015625, -0.15997314453125, -0.121307373046875, -0.0826416015625, -0.043975830078125, -0.00531005859375, 0.033355712890625, 0.072021484375, 0.110687255859375, 0.14935302734375, 0.188018798828125, 0.2266845703125, 0.265350341796875, 0.30401611328125, 0.342681884765625, 0.38134765625, 0.420013427734375, 0.45867919921875, 0.497344970703125, 0.5360107421875, 0.574676513671875, 0.61334228515625, 0.652008056640625, 0.690673828125, 0.729339599609375, 0.76800537109375, 0.806671142578125, 0.8453369140625, 0.884002685546875, 0.92266845703125, 0.961334228515625, 1.0]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 4.0, 10.0, 9.0, 15.0, 14.0, 19.0, 29.0, 33.0, 54.0, 62.0, 110.0, 154.0, 222.0, 330.0, 605.0, 1115.0, 2348.0, 6888.0, 29306.0, 211395.0, 659628.0, 109031.0, 17980.0, 4999.0, 1840.0, 913.0, 532.0, 284.0, 200.0, 126.0, 81.0, 45.0, 39.0, 28.0, 28.0, 21.0, 14.0, 6.0, 3.0, 6.0, 10.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685546875, -1.6300048828125, -1.574462890625, -1.5189208984375, -1.46337890625, -1.4078369140625, -1.352294921875, -1.2967529296875, -1.2412109375, -1.1856689453125, -1.130126953125, -1.0745849609375, -1.01904296875, -0.9635009765625, -0.907958984375, -0.8524169921875, -0.796875, -0.7413330078125, -0.685791015625, -0.6302490234375, -0.57470703125, -0.5191650390625, -0.463623046875, -0.4080810546875, -0.3525390625, -0.2969970703125, -0.241455078125, -0.1859130859375, -0.13037109375, -0.0748291015625, -0.019287109375, 0.0362548828125, 0.091796875, 0.1473388671875, 0.202880859375, 0.2584228515625, 0.31396484375, 0.3695068359375, 0.425048828125, 0.4805908203125, 0.5361328125, 0.5916748046875, 0.647216796875, 0.7027587890625, 0.75830078125, 0.8138427734375, 0.869384765625, 0.9249267578125, 0.98046875, 1.0360107421875, 1.091552734375, 1.1470947265625, 1.20263671875, 1.2581787109375, 1.313720703125, 1.3692626953125, 1.4248046875, 1.4803466796875, 1.535888671875, 1.5914306640625, 1.64697265625, 1.7025146484375, 1.758056640625, 1.8135986328125, 1.869140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 14.0, 9.0, 16.0, 19.0, 22.0, 27.0, 47.0, 47.0, 52.0, 56.0, 57.0, 57.0, 39.0, 46.0, 60.0, 59.0, 41.0, 47.0, 38.0, 36.0, 38.0, 34.0, 20.0, 26.0, 11.0, 16.0, 16.0, 7.0, 6.0, 5.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.395843505859375, -2.29754638671875, -2.199249267578125, -2.1009521484375, -2.002655029296875, -1.90435791015625, -1.806060791015625, -1.707763671875, -1.609466552734375, -1.51116943359375, -1.412872314453125, -1.3145751953125, -1.216278076171875, -1.11798095703125, -1.019683837890625, -0.92138671875, -0.823089599609375, -0.72479248046875, -0.626495361328125, -0.5281982421875, -0.429901123046875, -0.33160400390625, -0.233306884765625, -0.135009765625, -0.036712646484375, 0.06158447265625, 0.159881591796875, 0.2581787109375, 0.356475830078125, 0.45477294921875, 0.553070068359375, 0.6513671875, 0.749664306640625, 0.84796142578125, 0.946258544921875, 1.0445556640625, 1.142852783203125, 1.24114990234375, 1.339447021484375, 1.437744140625, 1.536041259765625, 1.63433837890625, 1.732635498046875, 1.8309326171875, 1.929229736328125, 2.02752685546875, 2.125823974609375, 2.22412109375, 2.322418212890625, 2.42071533203125, 2.519012451171875, 2.6173095703125, 2.715606689453125, 2.81390380859375, 2.912200927734375, 3.010498046875, 3.108795166015625, 3.20709228515625, 3.305389404296875, 3.4036865234375, 3.501983642578125, 3.60028076171875, 3.698577880859375, 3.796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 15.0, 27.0, 31.0, 65.0, 84.0, 152.0, 273.0, 662.0, 1614.0, 5531.0, 32070.0, 608253.0, 368223.0, 24293.0, 4656.0, 1405.0, 585.0, 259.0, 114.0, 79.0, 34.0, 30.0, 20.0, 15.0, 10.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.216796875, -1.1863250732421875, -1.155853271484375, -1.1253814697265625, -1.09490966796875, -1.0644378662109375, -1.033966064453125, -1.0034942626953125, -0.9730224609375, -0.9425506591796875, -0.912078857421875, -0.8816070556640625, -0.85113525390625, -0.8206634521484375, -0.790191650390625, -0.7597198486328125, -0.729248046875, -0.6987762451171875, -0.668304443359375, -0.6378326416015625, -0.60736083984375, -0.5768890380859375, -0.546417236328125, -0.5159454345703125, -0.4854736328125, -0.4550018310546875, -0.424530029296875, -0.3940582275390625, -0.36358642578125, -0.3331146240234375, -0.302642822265625, -0.2721710205078125, -0.24169921875, -0.2112274169921875, -0.180755615234375, -0.1502838134765625, -0.11981201171875, -0.0893402099609375, -0.058868408203125, -0.0283966064453125, 0.0020751953125, 0.0325469970703125, 0.063018798828125, 0.0934906005859375, 0.12396240234375, 0.1544342041015625, 0.184906005859375, 0.2153778076171875, 0.245849609375, 0.2763214111328125, 0.306793212890625, 0.3372650146484375, 0.36773681640625, 0.3982086181640625, 0.428680419921875, 0.4591522216796875, 0.4896240234375, 0.5200958251953125, 0.550567626953125, 0.5810394287109375, 0.61151123046875, 0.6419830322265625, 0.672454833984375, 0.7029266357421875, 0.7333984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 12.0, 9.0, 2.0, 12.0, 12.0, 20.0, 26.0, 28.0, 47.0, 48.0, 82.0, 133.0, 167.0, 98.0, 69.0, 31.0, 41.0, 35.0, 27.0, 24.0, 18.0, 13.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00022590160369873047, -0.00021999888122081757, -0.00021409615874290466, -0.00020819343626499176, -0.00020229071378707886, -0.00019638799130916595, -0.00019048526883125305, -0.00018458254635334015, -0.00017867982387542725, -0.00017277710139751434, -0.00016687437891960144, -0.00016097165644168854, -0.00015506893396377563, -0.00014916621148586273, -0.00014326348900794983, -0.00013736076653003693, -0.00013145804405212402, -0.00012555532157421112, -0.00011965259909629822, -0.00011374987661838531, -0.00010784715414047241, -0.00010194443166255951, -9.60417091846466e-05, -9.01389867067337e-05, -8.42362642288208e-05, -7.83335417509079e-05, -7.2430819272995e-05, -6.652809679508209e-05, -6.062537431716919e-05, -5.472265183925629e-05, -4.8819929361343384e-05, -4.291720688343048e-05, -3.701448440551758e-05, -3.1111761927604675e-05, -2.5209039449691772e-05, -1.930631697177887e-05, -1.3403594493865967e-05, -7.500872015953064e-06, -1.5981495380401611e-06, 4.304572939872742e-06, 1.0207295417785645e-05, 1.6110017895698547e-05, 2.201274037361145e-05, 2.7915462851524353e-05, 3.3818185329437256e-05, 3.972090780735016e-05, 4.562363028526306e-05, 5.1526352763175964e-05, 5.742907524108887e-05, 6.333179771900177e-05, 6.923452019691467e-05, 7.513724267482758e-05, 8.103996515274048e-05, 8.694268763065338e-05, 9.284541010856628e-05, 9.874813258647919e-05, 0.00010465085506439209, 0.00011055357754230499, 0.0001164563000202179, 0.0001223590224981308, 0.0001282617449760437, 0.0001341644674539566, 0.0001400671899318695, 0.0001459699124097824, 0.0001518726348876953]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 22.0, 27.0, 45.0, 79.0, 139.0, 245.0, 523.0, 1334.0, 4683.0, 36203.0, 764433.0, 222998.0, 13369.0, 2660.0, 918.0, 382.0, 200.0, 104.0, 59.0, 35.0, 19.0, 19.0, 11.0, 7.0, 9.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.5498046875, -1.511810302734375, -1.47381591796875, -1.435821533203125, -1.3978271484375, -1.359832763671875, -1.32183837890625, -1.283843994140625, -1.245849609375, -1.207855224609375, -1.16986083984375, -1.131866455078125, -1.0938720703125, -1.055877685546875, -1.01788330078125, -0.979888916015625, -0.94189453125, -0.903900146484375, -0.86590576171875, -0.827911376953125, -0.7899169921875, -0.751922607421875, -0.71392822265625, -0.675933837890625, -0.637939453125, -0.599945068359375, -0.56195068359375, -0.523956298828125, -0.4859619140625, -0.447967529296875, -0.40997314453125, -0.371978759765625, -0.333984375, -0.295989990234375, -0.25799560546875, -0.220001220703125, -0.1820068359375, -0.144012451171875, -0.10601806640625, -0.068023681640625, -0.030029296875, 0.007965087890625, 0.04595947265625, 0.083953857421875, 0.1219482421875, 0.159942626953125, 0.19793701171875, 0.235931396484375, 0.27392578125, 0.311920166015625, 0.34991455078125, 0.387908935546875, 0.4259033203125, 0.463897705078125, 0.50189208984375, 0.539886474609375, 0.577880859375, 0.615875244140625, 0.65386962890625, 0.691864013671875, 0.7298583984375, 0.767852783203125, 0.80584716796875, 0.843841552734375, 0.8818359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 2.0, 11.0, 13.0, 12.0, 25.0, 25.0, 31.0, 20.0, 50.0, 67.0, 96.0, 92.0, 92.0, 90.0, 76.0, 58.0, 44.0, 48.0, 32.0, 20.0, 22.0, 16.0, 14.0, 12.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6882705688476562, -0.6665802001953125, -0.6448898315429688, -0.623199462890625, -0.6015090942382812, -0.5798187255859375, -0.5581283569335938, -0.53643798828125, -0.5147476196289062, -0.4930572509765625, -0.47136688232421875, -0.449676513671875, -0.42798614501953125, -0.4062957763671875, -0.38460540771484375, -0.3629150390625, -0.34122467041015625, -0.3195343017578125, -0.29784393310546875, -0.276153564453125, -0.25446319580078125, -0.2327728271484375, -0.21108245849609375, -0.18939208984375, -0.16770172119140625, -0.1460113525390625, -0.12432098388671875, -0.102630615234375, -0.08094024658203125, -0.0592498779296875, -0.03755950927734375, -0.015869140625, 0.00582122802734375, 0.0275115966796875, 0.04920196533203125, 0.070892333984375, 0.09258270263671875, 0.1142730712890625, 0.13596343994140625, 0.15765380859375, 0.17934417724609375, 0.2010345458984375, 0.22272491455078125, 0.244415283203125, 0.26610565185546875, 0.2877960205078125, 0.30948638916015625, 0.3311767578125, 0.35286712646484375, 0.3745574951171875, 0.39624786376953125, 0.417938232421875, 0.43962860107421875, 0.4613189697265625, 0.48300933837890625, 0.50469970703125, 0.5263900756835938, 0.5480804443359375, 0.5697708129882812, 0.591461181640625, 0.6131515502929688, 0.6348419189453125, 0.6565322875976562, 0.67822265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 16.0, 41.0, 85.0, 145.0, 212.0, 209.0, 150.0, 56.0, 29.0, 16.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.551868438720703, -18.916439056396484, -18.281009674072266, -17.645578384399414, -17.010149002075195, -16.374719619750977, -15.739290237426758, -15.103860855102539, -14.468430519104004, -13.833001136779785, -13.19757080078125, -12.562141418457031, -11.926712036132812, -11.291281700134277, -10.655852317810059, -10.020421981811523, -9.384992599487305, -8.749563217163086, -8.11413288116455, -7.478703498840332, -6.843273639678955, -6.207843780517578, -5.572414398193359, -4.936984539031982, -4.3015546798706055, -3.6661248207092285, -3.0306951999664307, -2.395265579223633, -1.7598357200622559, -1.124405860900879, -0.48897624015808105, 0.1464533805847168, 0.7818832397460938, 1.4173129796981812, 2.0527427196502686, 2.6881723403930664, 3.3236021995544434, 3.9590320587158203, 4.594461441040039, 5.229891300201416, 5.865321159362793, 6.50075101852417, 7.136180877685547, 7.771610260009766, 8.407039642333984, 9.04246997833252, 9.677899360656738, 10.313329696655273, 10.948759078979492, 11.584188461303711, 12.219618797302246, 12.855048179626465, 13.490478515625, 14.125907897949219, 14.761337280273438, 15.396766662597656, 16.032196044921875, 16.667625427246094, 17.303054809570312, 17.938486099243164, 18.573915481567383, 19.2093448638916, 19.84477424621582, 20.48020362854004, 21.11563491821289]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 15.0, 31.0, 23.0, 37.0, 36.0, 51.0, 66.0, 74.0, 67.0, 70.0, 62.0, 63.0, 67.0, 58.0, 46.0, 38.0, 30.0, 21.0, 28.0, 25.0, 9.0, 10.0, 11.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.532419204711914, -13.00814151763916, -12.48386287689209, -11.959585189819336, -11.435306549072266, -10.911028861999512, -10.386751174926758, -9.862472534179688, -9.338194847106934, -8.81391716003418, -8.28963851928711, -7.7653608322143555, -7.241082668304443, -6.716804504394531, -6.192526817321777, -5.668248653411865, -5.143970489501953, -4.619692325592041, -4.095414161682129, -3.571136474609375, -3.046858310699463, -2.522580146789551, -1.9983022212982178, -1.4740242958068848, -0.9497461318969727, -0.4254680871963501, 0.09880995750427246, 0.623088002204895, 1.1473660469055176, 1.6716442108154297, 2.1959221363067627, 2.7202000617980957, 3.244476318359375, 3.768754482269287, 4.293032646179199, 4.817310333251953, 5.341588497161865, 5.865866661071777, 6.390144348144531, 6.914422512054443, 7.4387006759643555, 7.962978839874268, 8.48725700378418, 9.011534690856934, 9.535812377929688, 10.060091018676758, 10.584368705749512, 11.108646392822266, 11.632925033569336, 12.15720272064209, 12.68148136138916, 13.205759048461914, 13.730037689208984, 14.254315376281738, 14.778593063354492, 15.302871704101562, 15.827149391174316, 16.35142707824707, 16.87570571899414, 17.39998435974121, 17.92426109313965, 18.44853973388672, 18.97281837463379, 19.497095108032227, 20.021373748779297]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 9.0, 21.0, 23.0, 32.0, 64.0, 95.0, 144.0, 219.0, 380.0, 520.0, 996.0, 1977.0, 4125.0, 12740.0, 71715.0, 2282186.0, 1737896.0, 61819.0, 11170.0, 3988.0, 1781.0, 930.0, 524.0, 319.0, 201.0, 123.0, 81.0, 53.0, 50.0, 20.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4169921875, -1.3712310791015625, -1.325469970703125, -1.2797088623046875, -1.23394775390625, -1.1881866455078125, -1.142425537109375, -1.0966644287109375, -1.0509033203125, -1.0051422119140625, -0.959381103515625, -0.9136199951171875, -0.86785888671875, -0.8220977783203125, -0.776336669921875, -0.7305755615234375, -0.684814453125, -0.6390533447265625, -0.593292236328125, -0.5475311279296875, -0.50177001953125, -0.4560089111328125, -0.410247802734375, -0.3644866943359375, -0.3187255859375, -0.2729644775390625, -0.227203369140625, -0.1814422607421875, -0.13568115234375, -0.0899200439453125, -0.044158935546875, 0.0016021728515625, 0.04736328125, 0.0931243896484375, 0.138885498046875, 0.1846466064453125, 0.23040771484375, 0.2761688232421875, 0.321929931640625, 0.3676910400390625, 0.4134521484375, 0.4592132568359375, 0.504974365234375, 0.5507354736328125, 0.59649658203125, 0.6422576904296875, 0.688018798828125, 0.7337799072265625, 0.779541015625, 0.8253021240234375, 0.871063232421875, 0.9168243408203125, 0.96258544921875, 1.0083465576171875, 1.054107666015625, 1.0998687744140625, 1.1456298828125, 1.1913909912109375, 1.237152099609375, 1.2829132080078125, 1.32867431640625, 1.3744354248046875, 1.420196533203125, 1.4659576416015625, 1.51171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 8.0, 3.0, 17.0, 12.0, 14.0, 14.0, 34.0, 34.0, 47.0, 44.0, 59.0, 51.0, 55.0, 46.0, 60.0, 58.0, 55.0, 52.0, 46.0, 40.0, 33.0, 45.0, 34.0, 27.0, 25.0, 17.0, 13.0, 15.0, 8.0, 9.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5403289794921875, -0.519622802734375, -0.4989166259765625, -0.47821044921875, -0.4575042724609375, -0.436798095703125, -0.4160919189453125, -0.3953857421875, -0.3746795654296875, -0.353973388671875, -0.3332672119140625, -0.31256103515625, -0.2918548583984375, -0.271148681640625, -0.2504425048828125, -0.229736328125, -0.2090301513671875, -0.188323974609375, -0.1676177978515625, -0.14691162109375, -0.1262054443359375, -0.105499267578125, -0.0847930908203125, -0.0640869140625, -0.0433807373046875, -0.022674560546875, -0.0019683837890625, 0.01873779296875, 0.0394439697265625, 0.060150146484375, 0.0808563232421875, 0.1015625, 0.1222686767578125, 0.142974853515625, 0.1636810302734375, 0.18438720703125, 0.2050933837890625, 0.225799560546875, 0.2465057373046875, 0.2672119140625, 0.2879180908203125, 0.308624267578125, 0.3293304443359375, 0.35003662109375, 0.3707427978515625, 0.391448974609375, 0.4121551513671875, 0.432861328125, 0.4535675048828125, 0.474273681640625, 0.4949798583984375, 0.51568603515625, 0.5363922119140625, 0.557098388671875, 0.5778045654296875, 0.5985107421875, 0.6192169189453125, 0.639923095703125, 0.6606292724609375, 0.68133544921875, 0.7020416259765625, 0.722747802734375, 0.7434539794921875, 0.76416015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 11.0, 1.0, 12.0, 19.0, 10.0, 29.0, 64.0, 91.0, 165.0, 285.0, 570.0, 1185.0, 2924.0, 8579.0, 36778.0, 1065065.0, 3008404.0, 53168.0, 10613.0, 3446.0, 1473.0, 617.0, 350.0, 169.0, 84.0, 60.0, 42.0, 19.0, 23.0, 8.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.162872314453125, -2.09332275390625, -2.023773193359375, -1.9542236328125, -1.884674072265625, -1.81512451171875, -1.745574951171875, -1.676025390625, -1.606475830078125, -1.53692626953125, -1.467376708984375, -1.3978271484375, -1.328277587890625, -1.25872802734375, -1.189178466796875, -1.11962890625, -1.050079345703125, -0.98052978515625, -0.910980224609375, -0.8414306640625, -0.771881103515625, -0.70233154296875, -0.632781982421875, -0.563232421875, -0.493682861328125, -0.42413330078125, -0.354583740234375, -0.2850341796875, -0.215484619140625, -0.14593505859375, -0.076385498046875, -0.0068359375, 0.062713623046875, 0.13226318359375, 0.201812744140625, 0.2713623046875, 0.340911865234375, 0.41046142578125, 0.480010986328125, 0.549560546875, 0.619110107421875, 0.68865966796875, 0.758209228515625, 0.8277587890625, 0.897308349609375, 0.96685791015625, 1.036407470703125, 1.10595703125, 1.175506591796875, 1.24505615234375, 1.314605712890625, 1.3841552734375, 1.453704833984375, 1.52325439453125, 1.592803955078125, 1.662353515625, 1.731903076171875, 1.80145263671875, 1.871002197265625, 1.9405517578125, 2.010101318359375, 2.07965087890625, 2.149200439453125, 2.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 11.0, 16.0, 19.0, 18.0, 39.0, 74.0, 129.0, 274.0, 649.0, 1176.0, 856.0, 375.0, 166.0, 84.0, 59.0, 23.0, 15.0, 16.0, 8.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.67578125, -1.617431640625, -1.55908203125, -1.500732421875, -1.4423828125, -1.384033203125, -1.32568359375, -1.267333984375, -1.208984375, -1.150634765625, -1.09228515625, -1.033935546875, -0.9755859375, -0.917236328125, -0.85888671875, -0.800537109375, -0.7421875, -0.683837890625, -0.62548828125, -0.567138671875, -0.5087890625, -0.450439453125, -0.39208984375, -0.333740234375, -0.275390625, -0.217041015625, -0.15869140625, -0.100341796875, -0.0419921875, 0.016357421875, 0.07470703125, 0.133056640625, 0.19140625, 0.249755859375, 0.30810546875, 0.366455078125, 0.4248046875, 0.483154296875, 0.54150390625, 0.599853515625, 0.658203125, 0.716552734375, 0.77490234375, 0.833251953125, 0.8916015625, 0.949951171875, 1.00830078125, 1.066650390625, 1.125, 1.183349609375, 1.24169921875, 1.300048828125, 1.3583984375, 1.416748046875, 1.47509765625, 1.533447265625, 1.591796875, 1.650146484375, 1.70849609375, 1.766845703125, 1.8251953125, 1.883544921875, 1.94189453125, 2.000244140625, 2.05859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 11.0, 28.0, 51.0, 87.0, 205.0, 238.0, 197.0, 96.0, 42.0, 17.0, 12.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.277074813842773, -26.692138671875, -26.107202529907227, -25.52226448059082, -24.937328338623047, -24.352392196655273, -23.7674560546875, -23.182518005371094, -22.59758186340332, -22.012645721435547, -21.427709579467773, -20.842771530151367, -20.257835388183594, -19.67289924621582, -19.087963104248047, -18.50302505493164, -17.9180908203125, -17.333154678344727, -16.748218536376953, -16.163280487060547, -15.578344345092773, -14.993408203125, -14.408472061157227, -13.823534965515137, -13.238597869873047, -12.653661727905273, -12.068724632263184, -11.48378849029541, -10.89885139465332, -10.313915252685547, -9.728979110717773, -9.144042015075684, -8.559103965759277, -7.974167346954346, -7.389230728149414, -6.804294586181641, -6.219357490539551, -5.634421348571777, -5.049484729766846, -4.464548110961914, -3.8796114921569824, -3.294674873352051, -2.709738254547119, -2.1248018741607666, -1.539865255355835, -0.9549286365509033, -0.3699922561645508, 0.21494436264038086, 0.7998809814453125, 1.3848176002502441, 1.9697540998458862, 2.5546905994415283, 3.13962721824646, 3.7245638370513916, 4.309500217437744, 4.894436836242676, 5.479373455047607, 6.064310073852539, 6.649246692657471, 7.234183311462402, 7.819119453430176, 8.404056549072266, 8.988992691040039, 9.573928833007812, 10.158865928649902]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 9.0, 10.0, 16.0, 12.0, 19.0, 20.0, 21.0, 34.0, 33.0, 33.0, 30.0, 42.0, 35.0, 39.0, 50.0, 46.0, 57.0, 45.0, 57.0, 46.0, 43.0, 39.0, 25.0, 46.0, 33.0, 20.0, 26.0, 23.0, 19.0, 18.0, 8.0, 5.0, 11.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.645757675170898, -6.436529159545898, -6.227300643920898, -6.018072128295898, -5.808843612670898, -5.599615097045898, -5.390387058258057, -5.181158542633057, -4.971930027008057, -4.762701511383057, -4.553472995758057, -4.344244480133057, -4.135016441345215, -3.9257876873016357, -3.716559410095215, -3.507330894470215, -3.298102378845215, -3.088873863220215, -2.879645347595215, -2.670417070388794, -2.461188554763794, -2.251960039138794, -2.042731761932373, -1.833503246307373, -1.624274730682373, -1.415046215057373, -1.2058178186416626, -0.9965893626213074, -0.7873609066009521, -0.5781323909759521, -0.3689039945602417, -0.15967559814453125, 0.04955291748046875, 0.258781373500824, 0.4680098295211792, 0.6772382855415344, 0.8864667415618896, 1.0956952571868896, 1.3049236536026, 1.5141520500183105, 1.7233805656433105, 1.9326090812683105, 2.1418375968933105, 2.3510658740997314, 2.5602943897247314, 2.7695229053497314, 2.9787511825561523, 3.1879796981811523, 3.3972082138061523, 3.6064367294311523, 3.8156652450561523, 4.024893760681152, 4.234122276306152, 4.443350791931152, 4.652578830718994, 4.861807346343994, 5.071035861968994, 5.280264377593994, 5.489492893218994, 5.698721408843994, 5.907949447631836, 6.117177963256836, 6.326406478881836, 6.535634994506836, 6.744863510131836]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 3.0, 13.0, 22.0, 40.0, 51.0, 81.0, 142.0, 266.0, 438.0, 761.0, 1567.0, 3210.0, 7118.0, 16684.0, 44104.0, 131104.0, 377710.0, 306521.0, 99683.0, 34464.0, 13258.0, 5642.0, 2703.0, 1303.0, 681.0, 385.0, 221.0, 124.0, 79.0, 57.0, 30.0, 20.0, 21.0, 9.0, 5.0, 10.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98046875, -0.9487152099609375, -0.916961669921875, -0.8852081298828125, -0.85345458984375, -0.8217010498046875, -0.789947509765625, -0.7581939697265625, -0.7264404296875, -0.6946868896484375, -0.662933349609375, -0.6311798095703125, -0.59942626953125, -0.5676727294921875, -0.535919189453125, -0.5041656494140625, -0.472412109375, -0.4406585693359375, -0.408905029296875, -0.3771514892578125, -0.34539794921875, -0.3136444091796875, -0.281890869140625, -0.2501373291015625, -0.2183837890625, -0.1866302490234375, -0.154876708984375, -0.1231231689453125, -0.09136962890625, -0.0596160888671875, -0.027862548828125, 0.0038909912109375, 0.03564453125, 0.0673980712890625, 0.099151611328125, 0.1309051513671875, 0.16265869140625, 0.1944122314453125, 0.226165771484375, 0.2579193115234375, 0.2896728515625, 0.3214263916015625, 0.353179931640625, 0.3849334716796875, 0.41668701171875, 0.4484405517578125, 0.480194091796875, 0.5119476318359375, 0.543701171875, 0.5754547119140625, 0.607208251953125, 0.6389617919921875, 0.67071533203125, 0.7024688720703125, 0.734222412109375, 0.7659759521484375, 0.7977294921875, 0.8294830322265625, 0.861236572265625, 0.8929901123046875, 0.92474365234375, 0.9564971923828125, 0.988250732421875, 1.0200042724609375, 1.0517578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 12.0, 16.0, 23.0, 28.0, 31.0, 34.0, 42.0, 48.0, 66.0, 45.0, 55.0, 47.0, 60.0, 54.0, 56.0, 44.0, 55.0, 40.0, 31.0, 46.0, 30.0, 26.0, 21.0, 11.0, 8.0, 11.0, 16.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.590545654296875, -0.56976318359375, -0.548980712890625, -0.5281982421875, -0.507415771484375, -0.48663330078125, -0.465850830078125, -0.445068359375, -0.424285888671875, -0.40350341796875, -0.382720947265625, -0.3619384765625, -0.341156005859375, -0.32037353515625, -0.299591064453125, -0.27880859375, -0.258026123046875, -0.23724365234375, -0.216461181640625, -0.1956787109375, -0.174896240234375, -0.15411376953125, -0.133331298828125, -0.112548828125, -0.091766357421875, -0.07098388671875, -0.050201416015625, -0.0294189453125, -0.008636474609375, 0.01214599609375, 0.032928466796875, 0.0537109375, 0.074493408203125, 0.09527587890625, 0.116058349609375, 0.1368408203125, 0.157623291015625, 0.17840576171875, 0.199188232421875, 0.219970703125, 0.240753173828125, 0.26153564453125, 0.282318115234375, 0.3031005859375, 0.323883056640625, 0.34466552734375, 0.365447998046875, 0.38623046875, 0.407012939453125, 0.42779541015625, 0.448577880859375, 0.4693603515625, 0.490142822265625, 0.51092529296875, 0.531707763671875, 0.552490234375, 0.573272705078125, 0.59405517578125, 0.614837646484375, 0.6356201171875, 0.656402587890625, 0.67718505859375, 0.697967529296875, 0.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 8.0, 9.0, 15.0, 14.0, 20.0, 24.0, 33.0, 58.0, 82.0, 136.0, 174.0, 295.0, 524.0, 1240.0, 3153.0, 13020.0, 122266.0, 808242.0, 83790.0, 10315.0, 2733.0, 1074.0, 513.0, 283.0, 183.0, 108.0, 63.0, 40.0, 37.0, 17.0, 13.0, 16.0, 15.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.3475341796875, -2.275146484375, -2.2027587890625, -2.13037109375, -2.0579833984375, -1.985595703125, -1.9132080078125, -1.8408203125, -1.7684326171875, -1.696044921875, -1.6236572265625, -1.55126953125, -1.4788818359375, -1.406494140625, -1.3341064453125, -1.26171875, -1.1893310546875, -1.116943359375, -1.0445556640625, -0.97216796875, -0.8997802734375, -0.827392578125, -0.7550048828125, -0.6826171875, -0.6102294921875, -0.537841796875, -0.4654541015625, -0.39306640625, -0.3206787109375, -0.248291015625, -0.1759033203125, -0.103515625, -0.0311279296875, 0.041259765625, 0.1136474609375, 0.18603515625, 0.2584228515625, 0.330810546875, 0.4031982421875, 0.4755859375, 0.5479736328125, 0.620361328125, 0.6927490234375, 0.76513671875, 0.8375244140625, 0.909912109375, 0.9822998046875, 1.0546875, 1.1270751953125, 1.199462890625, 1.2718505859375, 1.34423828125, 1.4166259765625, 1.489013671875, 1.5614013671875, 1.6337890625, 1.7061767578125, 1.778564453125, 1.8509521484375, 1.92333984375, 1.9957275390625, 2.068115234375, 2.1405029296875, 2.212890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 8.0, 10.0, 20.0, 25.0, 28.0, 33.0, 41.0, 35.0, 44.0, 48.0, 53.0, 58.0, 65.0, 55.0, 49.0, 44.0, 50.0, 48.0, 41.0, 40.0, 34.0, 29.0, 25.0, 20.0, 18.0, 9.0, 7.0, 7.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.271148681640625, -2.18096923828125, -2.090789794921875, -2.0006103515625, -1.910430908203125, -1.82025146484375, -1.730072021484375, -1.639892578125, -1.549713134765625, -1.45953369140625, -1.369354248046875, -1.2791748046875, -1.188995361328125, -1.09881591796875, -1.008636474609375, -0.91845703125, -0.828277587890625, -0.73809814453125, -0.647918701171875, -0.5577392578125, -0.467559814453125, -0.37738037109375, -0.287200927734375, -0.197021484375, -0.106842041015625, -0.01666259765625, 0.073516845703125, 0.1636962890625, 0.253875732421875, 0.34405517578125, 0.434234619140625, 0.5244140625, 0.614593505859375, 0.70477294921875, 0.794952392578125, 0.8851318359375, 0.975311279296875, 1.06549072265625, 1.155670166015625, 1.245849609375, 1.336029052734375, 1.42620849609375, 1.516387939453125, 1.6065673828125, 1.696746826171875, 1.78692626953125, 1.877105712890625, 1.96728515625, 2.057464599609375, 2.14764404296875, 2.237823486328125, 2.3280029296875, 2.418182373046875, 2.50836181640625, 2.598541259765625, 2.688720703125, 2.778900146484375, 2.86907958984375, 2.959259033203125, 3.0494384765625, 3.139617919921875, 3.22979736328125, 3.319976806640625, 3.41015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 10.0, 25.0, 32.0, 46.0, 108.0, 201.0, 460.0, 1262.0, 5820.0, 69834.0, 908248.0, 55364.0, 5108.0, 1215.0, 401.0, 188.0, 80.0, 53.0, 30.0, 17.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3349609375, -1.2938385009765625, -1.252716064453125, -1.2115936279296875, -1.17047119140625, -1.1293487548828125, -1.088226318359375, -1.0471038818359375, -1.0059814453125, -0.9648590087890625, -0.923736572265625, -0.8826141357421875, -0.84149169921875, -0.8003692626953125, -0.759246826171875, -0.7181243896484375, -0.677001953125, -0.6358795166015625, -0.594757080078125, -0.5536346435546875, -0.51251220703125, -0.4713897705078125, -0.430267333984375, -0.3891448974609375, -0.3480224609375, -0.3069000244140625, -0.265777587890625, -0.2246551513671875, -0.18353271484375, -0.1424102783203125, -0.101287841796875, -0.0601654052734375, -0.01904296875, 0.0220794677734375, 0.063201904296875, 0.1043243408203125, 0.14544677734375, 0.1865692138671875, 0.227691650390625, 0.2688140869140625, 0.3099365234375, 0.3510589599609375, 0.392181396484375, 0.4333038330078125, 0.47442626953125, 0.5155487060546875, 0.556671142578125, 0.5977935791015625, 0.638916015625, 0.6800384521484375, 0.721160888671875, 0.7622833251953125, 0.80340576171875, 0.8445281982421875, 0.885650634765625, 0.9267730712890625, 0.9678955078125, 1.0090179443359375, 1.050140380859375, 1.0912628173828125, 1.13238525390625, 1.1735076904296875, 1.214630126953125, 1.2557525634765625, 1.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 6.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 14.0, 11.0, 20.0, 23.0, 31.0, 39.0, 94.0, 119.0, 145.0, 163.0, 74.0, 43.0, 50.0, 34.0, 24.0, 18.0, 18.0, 11.0, 8.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00025391578674316406, -0.0002478398382663727, -0.0002417638897895813, -0.00023568794131278992, -0.00022961199283599854, -0.00022353604435920715, -0.00021746009588241577, -0.0002113841474056244, -0.000205308198928833, -0.00019923225045204163, -0.00019315630197525024, -0.00018708035349845886, -0.00018100440502166748, -0.0001749284565448761, -0.00016885250806808472, -0.00016277655959129333, -0.00015670061111450195, -0.00015062466263771057, -0.0001445487141609192, -0.0001384727656841278, -0.00013239681720733643, -0.00012632086873054504, -0.00012024492025375366, -0.00011416897177696228, -0.0001080930233001709, -0.00010201707482337952, -9.594112634658813e-05, -8.986517786979675e-05, -8.378922939300537e-05, -7.771328091621399e-05, -7.163733243942261e-05, -6.556138396263123e-05, -5.9485435485839844e-05, -5.340948700904846e-05, -4.733353853225708e-05, -4.12575900554657e-05, -3.5181641578674316e-05, -2.9105693101882935e-05, -2.3029744625091553e-05, -1.695379614830017e-05, -1.0877847671508789e-05, -4.801899194717407e-06, 1.2740492820739746e-06, 7.3499977588653564e-06, 1.3425946235656738e-05, 1.950189471244812e-05, 2.5577843189239502e-05, 3.1653791666030884e-05, 3.7729740142822266e-05, 4.380568861961365e-05, 4.988163709640503e-05, 5.595758557319641e-05, 6.203353404998779e-05, 6.810948252677917e-05, 7.418543100357056e-05, 8.026137948036194e-05, 8.633732795715332e-05, 9.24132764339447e-05, 9.848922491073608e-05, 0.00010456517338752747, 0.00011064112186431885, 0.00011671707034111023, 0.0001227930188179016, 0.000128868967294693, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 4.0, 6.0, 14.0, 15.0, 26.0, 30.0, 37.0, 47.0, 56.0, 89.0, 135.0, 182.0, 350.0, 551.0, 1055.0, 2117.0, 5610.0, 20081.0, 101511.0, 691769.0, 180445.0, 30734.0, 7885.0, 2733.0, 1226.0, 674.0, 349.0, 229.0, 149.0, 98.0, 74.0, 63.0, 40.0, 24.0, 31.0, 21.0, 11.0, 16.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65087890625, -0.6264495849609375, -0.602020263671875, -0.5775909423828125, -0.55316162109375, -0.5287322998046875, -0.504302978515625, -0.4798736572265625, -0.4554443359375, -0.4310150146484375, -0.406585693359375, -0.3821563720703125, -0.35772705078125, -0.3332977294921875, -0.308868408203125, -0.2844390869140625, -0.260009765625, -0.2355804443359375, -0.211151123046875, -0.1867218017578125, -0.16229248046875, -0.1378631591796875, -0.113433837890625, -0.0890045166015625, -0.0645751953125, -0.0401458740234375, -0.015716552734375, 0.0087127685546875, 0.03314208984375, 0.0575714111328125, 0.082000732421875, 0.1064300537109375, 0.130859375, 0.1552886962890625, 0.179718017578125, 0.2041473388671875, 0.22857666015625, 0.2530059814453125, 0.277435302734375, 0.3018646240234375, 0.3262939453125, 0.3507232666015625, 0.375152587890625, 0.3995819091796875, 0.42401123046875, 0.4484405517578125, 0.472869873046875, 0.4972991943359375, 0.521728515625, 0.5461578369140625, 0.570587158203125, 0.5950164794921875, 0.61944580078125, 0.6438751220703125, 0.668304443359375, 0.6927337646484375, 0.7171630859375, 0.7415924072265625, 0.766021728515625, 0.7904510498046875, 0.81488037109375, 0.8393096923828125, 0.863739013671875, 0.8881683349609375, 0.91259765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 14.0, 26.0, 26.0, 40.0, 49.0, 71.0, 97.0, 157.0, 157.0, 126.0, 76.0, 58.0, 32.0, 23.0, 17.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3940277099609375, -1.356414794921875, -1.3188018798828125, -1.28118896484375, -1.2435760498046875, -1.205963134765625, -1.1683502197265625, -1.1307373046875, -1.0931243896484375, -1.055511474609375, -1.0178985595703125, -0.98028564453125, -0.9426727294921875, -0.905059814453125, -0.8674468994140625, -0.829833984375, -0.7922210693359375, -0.754608154296875, -0.7169952392578125, -0.67938232421875, -0.6417694091796875, -0.604156494140625, -0.5665435791015625, -0.5289306640625, -0.4913177490234375, -0.453704833984375, -0.4160919189453125, -0.37847900390625, -0.3408660888671875, -0.303253173828125, -0.2656402587890625, -0.22802734375, -0.1904144287109375, -0.152801513671875, -0.1151885986328125, -0.07757568359375, -0.0399627685546875, -0.002349853515625, 0.0352630615234375, 0.0728759765625, 0.1104888916015625, 0.148101806640625, 0.1857147216796875, 0.22332763671875, 0.2609405517578125, 0.298553466796875, 0.3361663818359375, 0.373779296875, 0.4113922119140625, 0.449005126953125, 0.4866180419921875, 0.52423095703125, 0.5618438720703125, 0.599456787109375, 0.6370697021484375, 0.6746826171875, 0.7122955322265625, 0.749908447265625, 0.7875213623046875, 0.82513427734375, 0.8627471923828125, 0.900360107421875, 0.9379730224609375, 0.9755859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 29.0, 65.0, 203.0, 354.0, 202.0, 82.0, 35.0, 12.0, 6.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.49456024169922, -29.683015823364258, -28.871469497680664, -28.059925079345703, -27.248380661010742, -26.43683624267578, -25.625289916992188, -24.813745498657227, -24.002201080322266, -23.190656661987305, -22.37911033630371, -21.56756591796875, -20.75602149963379, -19.944477081298828, -19.132930755615234, -18.321386337280273, -17.50984001159668, -16.69829559326172, -15.886750221252441, -15.075204849243164, -14.263660430908203, -13.452115058898926, -12.640569686889648, -11.829025268554688, -11.01747989654541, -10.205934524536133, -9.394390106201172, -8.582844734191895, -7.771299839019775, -6.959754943847656, -6.148209571838379, -5.33666467666626, -4.525121688842773, -3.7135767936706543, -2.902031660079956, -2.090486526489258, -1.2789416313171387, -0.46739673614501953, 0.3441486358642578, 1.155693531036377, 1.967238426208496, 2.7787833213806152, 3.5903284549713135, 4.401873588562012, 5.213418483734131, 6.02496337890625, 6.836508750915527, 7.6480536460876465, 8.459598541259766, 9.271143913269043, 10.082688331604004, 10.894233703613281, 11.705778121948242, 12.51732349395752, 13.328868865966797, 14.140413284301758, 14.951958656311035, 15.763504028320312, 16.575048446655273, 17.386592864990234, 18.198139190673828, 19.00968360900879, 19.82122802734375, 20.632774353027344, 21.444318771362305]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 13.0, 12.0, 17.0, 15.0, 20.0, 23.0, 25.0, 37.0, 24.0, 39.0, 30.0, 42.0, 58.0, 58.0, 60.0, 59.0, 56.0, 54.0, 37.0, 42.0, 43.0, 28.0, 28.0, 29.0, 22.0, 26.0, 17.0, 16.0, 10.0, 7.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.786921501159668, -11.452144622802734, -11.1173677444458, -10.782590866088867, -10.447813987731934, -10.113037109375, -9.778260231018066, -9.443483352661133, -9.1087064743042, -8.773929595947266, -8.439152717590332, -8.104375839233398, -7.769598960876465, -7.434822082519531, -7.100045204162598, -6.765268325805664, -6.430490970611572, -6.095714092254639, -5.760937213897705, -5.4261603355407715, -5.091383457183838, -4.756606578826904, -4.4218292236328125, -4.087052345275879, -3.7522757053375244, -3.417498826980591, -3.0827219486236572, -2.7479448318481445, -2.413167953491211, -2.0783910751342773, -1.7436141967773438, -1.4088373184204102, -1.0740604400634766, -0.739283561706543, -0.4045066237449646, -0.06972968578338623, 0.26504719257354736, 0.599824070930481, 0.9346010684967041, 1.2693779468536377, 1.6041548252105713, 1.9389317035675049, 2.2737085819244385, 2.608485698699951, 2.9432625770568848, 3.2780394554138184, 3.612816333770752, 3.9475932121276855, 4.282370090484619, 4.617146968841553, 4.951923847198486, 5.28670072555542, 5.6214776039123535, 5.956254482269287, 6.291031837463379, 6.6258087158203125, 6.960585594177246, 7.29536247253418, 7.630139350891113, 7.964916229248047, 8.29969310760498, 8.634469985961914, 8.969246864318848, 9.304023742675781, 9.638800621032715]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 14.0, 18.0, 41.0, 62.0, 127.0, 284.0, 548.0, 1415.0, 5396.0, 85282.0, 4047531.0, 47111.0, 4241.0, 1214.0, 490.0, 243.0, 97.0, 49.0, 45.0, 21.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.78619384765625, -2.6915283203125, -2.59686279296875, -2.502197265625, -2.40753173828125, -2.3128662109375, -2.21820068359375, -2.12353515625, -2.02886962890625, -1.9342041015625, -1.83953857421875, -1.744873046875, -1.65020751953125, -1.5555419921875, -1.46087646484375, -1.3662109375, -1.27154541015625, -1.1768798828125, -1.08221435546875, -0.987548828125, -0.89288330078125, -0.7982177734375, -0.70355224609375, -0.60888671875, -0.51422119140625, -0.4195556640625, -0.32489013671875, -0.230224609375, -0.13555908203125, -0.0408935546875, 0.05377197265625, 0.1484375, 0.24310302734375, 0.3377685546875, 0.43243408203125, 0.527099609375, 0.62176513671875, 0.7164306640625, 0.81109619140625, 0.90576171875, 1.00042724609375, 1.0950927734375, 1.18975830078125, 1.284423828125, 1.37908935546875, 1.4737548828125, 1.56842041015625, 1.6630859375, 1.75775146484375, 1.8524169921875, 1.94708251953125, 2.041748046875, 2.13641357421875, 2.2310791015625, 2.32574462890625, 2.42041015625, 2.51507568359375, 2.6097412109375, 2.70440673828125, 2.799072265625, 2.89373779296875, 2.9884033203125, 3.08306884765625, 3.177734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 11.0, 19.0, 30.0, 28.0, 38.0, 39.0, 42.0, 39.0, 46.0, 52.0, 45.0, 52.0, 50.0, 48.0, 46.0, 42.0, 41.0, 36.0, 33.0, 37.0, 24.0, 26.0, 26.0, 17.0, 20.0, 14.0, 6.0, 10.0, 7.0, 11.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5048828125, -0.48712158203125, -0.4693603515625, -0.45159912109375, -0.433837890625, -0.41607666015625, -0.3983154296875, -0.38055419921875, -0.36279296875, -0.34503173828125, -0.3272705078125, -0.30950927734375, -0.291748046875, -0.27398681640625, -0.2562255859375, -0.23846435546875, -0.220703125, -0.20294189453125, -0.1851806640625, -0.16741943359375, -0.149658203125, -0.13189697265625, -0.1141357421875, -0.09637451171875, -0.07861328125, -0.06085205078125, -0.0430908203125, -0.02532958984375, -0.007568359375, 0.01019287109375, 0.0279541015625, 0.04571533203125, 0.0634765625, 0.08123779296875, 0.0989990234375, 0.11676025390625, 0.134521484375, 0.15228271484375, 0.1700439453125, 0.18780517578125, 0.20556640625, 0.22332763671875, 0.2410888671875, 0.25885009765625, 0.276611328125, 0.29437255859375, 0.3121337890625, 0.32989501953125, 0.34765625, 0.36541748046875, 0.3831787109375, 0.40093994140625, 0.418701171875, 0.43646240234375, 0.4542236328125, 0.47198486328125, 0.48974609375, 0.50750732421875, 0.5252685546875, 0.54302978515625, 0.560791015625, 0.57855224609375, 0.5963134765625, 0.61407470703125, 0.6318359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 13.0, 14.0, 38.0, 51.0, 77.0, 106.0, 152.0, 262.0, 371.0, 601.0, 966.0, 1648.0, 3163.0, 6618.0, 18303.0, 81299.0, 1502227.0, 2430995.0, 108641.0, 22412.0, 7917.0, 3600.0, 1884.0, 1064.0, 667.0, 406.0, 252.0, 166.0, 106.0, 83.0, 51.0, 45.0, 13.0, 14.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4572296142578125, -1.414459228515625, -1.3716888427734375, -1.32891845703125, -1.2861480712890625, -1.243377685546875, -1.2006072998046875, -1.1578369140625, -1.1150665283203125, -1.072296142578125, -1.0295257568359375, -0.98675537109375, -0.9439849853515625, -0.901214599609375, -0.8584442138671875, -0.815673828125, -0.7729034423828125, -0.730133056640625, -0.6873626708984375, -0.64459228515625, -0.6018218994140625, -0.559051513671875, -0.5162811279296875, -0.4735107421875, -0.4307403564453125, -0.387969970703125, -0.3451995849609375, -0.30242919921875, -0.2596588134765625, -0.216888427734375, -0.1741180419921875, -0.13134765625, -0.0885772705078125, -0.045806884765625, -0.0030364990234375, 0.03973388671875, 0.0825042724609375, 0.125274658203125, 0.1680450439453125, 0.2108154296875, 0.2535858154296875, 0.296356201171875, 0.3391265869140625, 0.38189697265625, 0.4246673583984375, 0.467437744140625, 0.5102081298828125, 0.552978515625, 0.5957489013671875, 0.638519287109375, 0.6812896728515625, 0.72406005859375, 0.7668304443359375, 0.809600830078125, 0.8523712158203125, 0.8951416015625, 0.9379119873046875, 0.980682373046875, 1.0234527587890625, 1.06622314453125, 1.1089935302734375, 1.151763916015625, 1.1945343017578125, 1.2373046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 14.0, 31.0, 49.0, 104.0, 253.0, 723.0, 1447.0, 887.0, 268.0, 122.0, 53.0, 29.0, 22.0, 11.0, 12.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.488616943359375, -2.42059326171875, -2.352569580078125, -2.2845458984375, -2.216522216796875, -2.14849853515625, -2.080474853515625, -2.012451171875, -1.944427490234375, -1.87640380859375, -1.808380126953125, -1.7403564453125, -1.672332763671875, -1.60430908203125, -1.536285400390625, -1.46826171875, -1.400238037109375, -1.33221435546875, -1.264190673828125, -1.1961669921875, -1.128143310546875, -1.06011962890625, -0.992095947265625, -0.924072265625, -0.856048583984375, -0.78802490234375, -0.720001220703125, -0.6519775390625, -0.583953857421875, -0.51593017578125, -0.447906494140625, -0.3798828125, -0.311859130859375, -0.24383544921875, -0.175811767578125, -0.1077880859375, -0.039764404296875, 0.02825927734375, 0.096282958984375, 0.164306640625, 0.232330322265625, 0.30035400390625, 0.368377685546875, 0.4364013671875, 0.504425048828125, 0.57244873046875, 0.640472412109375, 0.70849609375, 0.776519775390625, 0.84454345703125, 0.912567138671875, 0.9805908203125, 1.048614501953125, 1.11663818359375, 1.184661865234375, 1.252685546875, 1.320709228515625, 1.38873291015625, 1.456756591796875, 1.5247802734375, 1.592803955078125, 1.66082763671875, 1.728851318359375, 1.796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 15.0, 23.0, 46.0, 65.0, 89.0, 125.0, 150.0, 148.0, 96.0, 86.0, 36.0, 23.0, 16.0, 12.0, 9.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.69163990020752, -8.415185928344727, -8.138731002807617, -7.862277030944824, -7.585823059082031, -7.309369087219238, -7.032914638519287, -6.756460189819336, -6.480006217956543, -6.20355224609375, -5.927097797393799, -5.650643348693848, -5.374189376831055, -5.097735404968262, -4.8212809562683105, -4.544826507568359, -4.268372535705566, -3.9919183254241943, -3.7154641151428223, -3.43900990486145, -3.162555694580078, -2.886101484298706, -2.609647274017334, -2.333193063735962, -2.05673885345459, -1.7802846431732178, -1.5038304328918457, -1.2273762226104736, -0.9509220123291016, -0.6744678020477295, -0.3980135917663574, -0.12155938148498535, 0.1548938751220703, 0.4313480854034424, 0.7078022956848145, 0.9842565059661865, 1.2607107162475586, 1.5371649265289307, 1.8136191368103027, 2.090073347091675, 2.366527557373047, 2.642981767654419, 2.919435977935791, 3.195890188217163, 3.472344398498535, 3.7487986087799072, 4.025252819061279, 4.3017072677612305, 4.578161239624023, 4.854615211486816, 5.131069660186768, 5.407524108886719, 5.683978080749512, 5.960432052612305, 6.236886501312256, 6.513340950012207, 6.789794921875, 7.066248893737793, 7.342703342437744, 7.619157791137695, 7.895611763000488, 8.172065734863281, 8.44852066040039, 8.724974632263184, 9.001428604125977]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 7.0, 6.0, 10.0, 10.0, 7.0, 11.0, 15.0, 15.0, 18.0, 27.0, 23.0, 29.0, 25.0, 41.0, 35.0, 39.0, 39.0, 45.0, 42.0, 41.0, 55.0, 37.0, 42.0, 49.0, 32.0, 26.0, 40.0, 26.0, 32.0, 23.0, 17.0, 20.0, 17.0, 25.0, 14.0, 9.0, 8.0, 7.0, 7.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-5.3482346534729, -5.184440612792969, -5.020646095275879, -4.856852054595947, -4.693058013916016, -4.529263973236084, -4.365469455718994, -4.2016754150390625, -4.037881374359131, -3.87408709526062, -3.7102930545806885, -3.5464987754821777, -3.382704734802246, -3.2189104557037354, -3.0551161766052246, -2.891322135925293, -2.7275278568267822, -2.5637335777282715, -2.39993953704834, -2.236145257949829, -2.0723512172698975, -1.9085569381713867, -1.7447627782821655, -1.5809686183929443, -1.4171744585037231, -1.253380298614502, -1.0895861387252808, -0.9257919192314148, -0.7619977593421936, -0.5982035994529724, -0.43440937995910645, -0.27061522006988525, -0.10682106018066406, 0.05697311460971832, 0.2207672894001007, 0.3845614790916443, 0.5483556389808655, 0.7121497988700867, 0.8759440183639526, 1.0397381782531738, 1.203532338142395, 1.3673264980316162, 1.5311206579208374, 1.6949148178100586, 1.8587090969085693, 2.022503137588501, 2.1862974166870117, 2.3500914573669434, 2.513885736465454, 2.677680015563965, 2.8414740562438965, 3.0052683353424072, 3.169062376022339, 3.3328566551208496, 3.4966506958007812, 3.660444974899292, 3.8242392539978027, 3.9880335330963135, 4.151827812194824, 4.315621852874756, 4.4794158935546875, 4.643209934234619, 4.807004451751709, 4.970798492431641, 5.134592533111572]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 10.0, 10.0, 18.0, 29.0, 34.0, 54.0, 105.0, 129.0, 214.0, 398.0, 676.0, 1184.0, 2176.0, 4484.0, 9252.0, 21273.0, 54457.0, 157816.0, 410868.0, 247789.0, 82031.0, 30511.0, 12682.0, 5880.0, 2912.0, 1518.0, 796.0, 483.0, 272.0, 153.0, 118.0, 69.0, 41.0, 31.0, 18.0, 17.0, 12.0, 3.0, 3.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.85693359375, -0.8290176391601562, -0.8011016845703125, -0.7731857299804688, -0.745269775390625, -0.7173538208007812, -0.6894378662109375, -0.6615219116210938, -0.63360595703125, -0.6056900024414062, -0.5777740478515625, -0.5498580932617188, -0.521942138671875, -0.49402618408203125, -0.4661102294921875, -0.43819427490234375, -0.4102783203125, -0.38236236572265625, -0.3544464111328125, -0.32653045654296875, -0.298614501953125, -0.27069854736328125, -0.2427825927734375, -0.21486663818359375, -0.18695068359375, -0.15903472900390625, -0.1311187744140625, -0.10320281982421875, -0.075286865234375, -0.04737091064453125, -0.0194549560546875, 0.00846099853515625, 0.036376953125, 0.06429290771484375, 0.0922088623046875, 0.12012481689453125, 0.148040771484375, 0.17595672607421875, 0.2038726806640625, 0.23178863525390625, 0.25970458984375, 0.28762054443359375, 0.3155364990234375, 0.34345245361328125, 0.371368408203125, 0.39928436279296875, 0.4272003173828125, 0.45511627197265625, 0.4830322265625, 0.5109481811523438, 0.5388641357421875, 0.5667800903320312, 0.594696044921875, 0.6226119995117188, 0.6505279541015625, 0.6784439086914062, 0.70635986328125, 0.7342758178710938, 0.7621917724609375, 0.7901077270507812, 0.818023681640625, 0.8459396362304688, 0.8738555908203125, 0.9017715454101562, 0.9296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 7.0, 5.0, 13.0, 18.0, 14.0, 25.0, 14.0, 24.0, 18.0, 34.0, 39.0, 31.0, 29.0, 40.0, 61.0, 50.0, 55.0, 64.0, 38.0, 40.0, 43.0, 41.0, 38.0, 29.0, 31.0, 24.0, 28.0, 21.0, 9.0, 24.0, 13.0, 17.0, 8.0, 11.0, 10.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.556640625, -0.5389938354492188, -0.5213470458984375, -0.5037002563476562, -0.486053466796875, -0.46840667724609375, -0.4507598876953125, -0.43311309814453125, -0.41546630859375, -0.39781951904296875, -0.3801727294921875, -0.36252593994140625, -0.344879150390625, -0.32723236083984375, -0.3095855712890625, -0.29193878173828125, -0.2742919921875, -0.25664520263671875, -0.2389984130859375, -0.22135162353515625, -0.203704833984375, -0.18605804443359375, -0.1684112548828125, -0.15076446533203125, -0.13311767578125, -0.11547088623046875, -0.0978240966796875, -0.08017730712890625, -0.062530517578125, -0.04488372802734375, -0.0272369384765625, -0.00959014892578125, 0.008056640625, 0.02570343017578125, 0.0433502197265625, 0.06099700927734375, 0.078643798828125, 0.09629058837890625, 0.1139373779296875, 0.13158416748046875, 0.14923095703125, 0.16687774658203125, 0.1845245361328125, 0.20217132568359375, 0.219818115234375, 0.23746490478515625, 0.2551116943359375, 0.27275848388671875, 0.2904052734375, 0.30805206298828125, 0.3256988525390625, 0.34334564208984375, 0.360992431640625, 0.37863922119140625, 0.3962860107421875, 0.41393280029296875, 0.43157958984375, 0.44922637939453125, 0.4668731689453125, 0.48451995849609375, 0.502166748046875, 0.5198135375976562, 0.5374603271484375, 0.5551071166992188, 0.57275390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 12.0, 4.0, 6.0, 11.0, 15.0, 21.0, 32.0, 30.0, 40.0, 67.0, 106.0, 158.0, 254.0, 416.0, 890.0, 1881.0, 5218.0, 18570.0, 107643.0, 725971.0, 152599.0, 23829.0, 6206.0, 2269.0, 1008.0, 500.0, 280.0, 163.0, 107.0, 80.0, 46.0, 33.0, 23.0, 19.0, 12.0, 10.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6845703125, -1.629486083984375, -1.57440185546875, -1.519317626953125, -1.4642333984375, -1.409149169921875, -1.35406494140625, -1.298980712890625, -1.243896484375, -1.188812255859375, -1.13372802734375, -1.078643798828125, -1.0235595703125, -0.968475341796875, -0.91339111328125, -0.858306884765625, -0.80322265625, -0.748138427734375, -0.69305419921875, -0.637969970703125, -0.5828857421875, -0.527801513671875, -0.47271728515625, -0.417633056640625, -0.362548828125, -0.307464599609375, -0.25238037109375, -0.197296142578125, -0.1422119140625, -0.087127685546875, -0.03204345703125, 0.023040771484375, 0.078125, 0.133209228515625, 0.18829345703125, 0.243377685546875, 0.2984619140625, 0.353546142578125, 0.40863037109375, 0.463714599609375, 0.518798828125, 0.573883056640625, 0.62896728515625, 0.684051513671875, 0.7391357421875, 0.794219970703125, 0.84930419921875, 0.904388427734375, 0.95947265625, 1.014556884765625, 1.06964111328125, 1.124725341796875, 1.1798095703125, 1.234893798828125, 1.28997802734375, 1.345062255859375, 1.400146484375, 1.455230712890625, 1.51031494140625, 1.565399169921875, 1.6204833984375, 1.675567626953125, 1.73065185546875, 1.785736083984375, 1.8408203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 18.0, 13.0, 28.0, 24.0, 24.0, 30.0, 34.0, 32.0, 40.0, 30.0, 42.0, 48.0, 56.0, 43.0, 59.0, 41.0, 52.0, 47.0, 38.0, 34.0, 43.0, 24.0, 29.0, 16.0, 20.0, 16.0, 13.0, 19.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.21484375, -2.1429443359375, -2.071044921875, -1.9991455078125, -1.92724609375, -1.8553466796875, -1.783447265625, -1.7115478515625, -1.6396484375, -1.5677490234375, -1.495849609375, -1.4239501953125, -1.35205078125, -1.2801513671875, -1.208251953125, -1.1363525390625, -1.064453125, -0.9925537109375, -0.920654296875, -0.8487548828125, -0.77685546875, -0.7049560546875, -0.633056640625, -0.5611572265625, -0.4892578125, -0.4173583984375, -0.345458984375, -0.2735595703125, -0.20166015625, -0.1297607421875, -0.057861328125, 0.0140380859375, 0.0859375, 0.1578369140625, 0.229736328125, 0.3016357421875, 0.37353515625, 0.4454345703125, 0.517333984375, 0.5892333984375, 0.6611328125, 0.7330322265625, 0.804931640625, 0.8768310546875, 0.94873046875, 1.0206298828125, 1.092529296875, 1.1644287109375, 1.236328125, 1.3082275390625, 1.380126953125, 1.4520263671875, 1.52392578125, 1.5958251953125, 1.667724609375, 1.7396240234375, 1.8115234375, 1.8834228515625, 1.955322265625, 2.0272216796875, 2.09912109375, 2.1710205078125, 2.242919921875, 2.3148193359375, 2.38671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 5.0, 13.0, 10.0, 9.0, 22.0, 54.0, 86.0, 197.0, 575.0, 2242.0, 20413.0, 878815.0, 138108.0, 6191.0, 1119.0, 339.0, 173.0, 70.0, 44.0, 23.0, 14.0, 4.0, 7.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.635528564453125, -1.57867431640625, -1.521820068359375, -1.4649658203125, -1.408111572265625, -1.35125732421875, -1.294403076171875, -1.237548828125, -1.180694580078125, -1.12384033203125, -1.066986083984375, -1.0101318359375, -0.953277587890625, -0.89642333984375, -0.839569091796875, -0.78271484375, -0.725860595703125, -0.66900634765625, -0.612152099609375, -0.5552978515625, -0.498443603515625, -0.44158935546875, -0.384735107421875, -0.327880859375, -0.271026611328125, -0.21417236328125, -0.157318115234375, -0.1004638671875, -0.043609619140625, 0.01324462890625, 0.070098876953125, 0.126953125, 0.183807373046875, 0.24066162109375, 0.297515869140625, 0.3543701171875, 0.411224365234375, 0.46807861328125, 0.524932861328125, 0.581787109375, 0.638641357421875, 0.69549560546875, 0.752349853515625, 0.8092041015625, 0.866058349609375, 0.92291259765625, 0.979766845703125, 1.03662109375, 1.093475341796875, 1.15032958984375, 1.207183837890625, 1.2640380859375, 1.320892333984375, 1.37774658203125, 1.434600830078125, 1.491455078125, 1.548309326171875, 1.60516357421875, 1.662017822265625, 1.7188720703125, 1.775726318359375, 1.83258056640625, 1.889434814453125, 1.9462890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 2.0, 6.0, 4.0, 10.0, 10.0, 6.0, 18.0, 27.0, 25.0, 40.0, 59.0, 99.0, 150.0, 184.0, 109.0, 69.0, 52.0, 40.0, 20.0, 20.0, 13.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029730796813964844, -0.000290602445602417, -0.00028389692306518555, -0.0002771914005279541, -0.00027048587799072266, -0.0002637803554534912, -0.00025707483291625977, -0.0002503693103790283, -0.00024366378784179688, -0.00023695826530456543, -0.00023025274276733398, -0.00022354722023010254, -0.0002168416976928711, -0.00021013617515563965, -0.0002034306526184082, -0.00019672513008117676, -0.0001900196075439453, -0.00018331408500671387, -0.00017660856246948242, -0.00016990303993225098, -0.00016319751739501953, -0.00015649199485778809, -0.00014978647232055664, -0.0001430809497833252, -0.00013637542724609375, -0.0001296699047088623, -0.00012296438217163086, -0.00011625885963439941, -0.00010955333709716797, -0.00010284781455993652, -9.614229202270508e-05, -8.943676948547363e-05, -8.273124694824219e-05, -7.602572441101074e-05, -6.93202018737793e-05, -6.261467933654785e-05, -5.5909156799316406e-05, -4.920363426208496e-05, -4.2498111724853516e-05, -3.579258918762207e-05, -2.9087066650390625e-05, -2.238154411315918e-05, -1.5676021575927734e-05, -8.970499038696289e-06, -2.2649765014648438e-06, 4.4405460357666016e-06, 1.1146068572998047e-05, 1.7851591110229492e-05, 2.4557113647460938e-05, 3.126263618469238e-05, 3.796815872192383e-05, 4.4673681259155273e-05, 5.137920379638672e-05, 5.8084726333618164e-05, 6.479024887084961e-05, 7.149577140808105e-05, 7.82012939453125e-05, 8.490681648254395e-05, 9.161233901977539e-05, 9.831786155700684e-05, 0.00010502338409423828, 0.00011172890663146973, 0.00011843442916870117, 0.00012513995170593262, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 7.0, 14.0, 11.0, 28.0, 43.0, 50.0, 64.0, 98.0, 156.0, 232.0, 396.0, 649.0, 1379.0, 3070.0, 7905.0, 29195.0, 221613.0, 692624.0, 67927.0, 14154.0, 4615.0, 1978.0, 947.0, 494.0, 315.0, 174.0, 118.0, 87.0, 45.0, 36.0, 33.0, 19.0, 15.0, 10.0, 8.0, 4.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.822265625, -0.7941436767578125, -0.766021728515625, -0.7378997802734375, -0.70977783203125, -0.6816558837890625, -0.653533935546875, -0.6254119873046875, -0.5972900390625, -0.5691680908203125, -0.541046142578125, -0.5129241943359375, -0.48480224609375, -0.4566802978515625, -0.428558349609375, -0.4004364013671875, -0.372314453125, -0.3441925048828125, -0.316070556640625, -0.2879486083984375, -0.25982666015625, -0.2317047119140625, -0.203582763671875, -0.1754608154296875, -0.1473388671875, -0.1192169189453125, -0.091094970703125, -0.0629730224609375, -0.03485107421875, -0.0067291259765625, 0.021392822265625, 0.0495147705078125, 0.07763671875, 0.1057586669921875, 0.133880615234375, 0.1620025634765625, 0.19012451171875, 0.2182464599609375, 0.246368408203125, 0.2744903564453125, 0.3026123046875, 0.3307342529296875, 0.358856201171875, 0.3869781494140625, 0.41510009765625, 0.4432220458984375, 0.471343994140625, 0.4994659423828125, 0.527587890625, 0.5557098388671875, 0.583831787109375, 0.6119537353515625, 0.64007568359375, 0.6681976318359375, 0.696319580078125, 0.7244415283203125, 0.7525634765625, 0.7806854248046875, 0.808807373046875, 0.8369293212890625, 0.86505126953125, 0.8931732177734375, 0.921295166015625, 0.9494171142578125, 0.9775390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 8.0, 15.0, 22.0, 25.0, 32.0, 56.0, 58.0, 80.0, 134.0, 159.0, 118.0, 90.0, 34.0, 46.0, 30.0, 16.0, 16.0, 17.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7419891357421875, -0.711517333984375, -0.6810455322265625, -0.65057373046875, -0.6201019287109375, -0.589630126953125, -0.5591583251953125, -0.5286865234375, -0.4982147216796875, -0.467742919921875, -0.4372711181640625, -0.40679931640625, -0.3763275146484375, -0.345855712890625, -0.3153839111328125, -0.284912109375, -0.2544403076171875, -0.223968505859375, -0.1934967041015625, -0.16302490234375, -0.1325531005859375, -0.102081298828125, -0.0716094970703125, -0.0411376953125, -0.0106658935546875, 0.019805908203125, 0.0502777099609375, 0.08074951171875, 0.1112213134765625, 0.141693115234375, 0.1721649169921875, 0.20263671875, 0.2331085205078125, 0.263580322265625, 0.2940521240234375, 0.32452392578125, 0.3549957275390625, 0.385467529296875, 0.4159393310546875, 0.4464111328125, 0.4768829345703125, 0.507354736328125, 0.5378265380859375, 0.56829833984375, 0.5987701416015625, 0.629241943359375, 0.6597137451171875, 0.690185546875, 0.7206573486328125, 0.751129150390625, 0.7816009521484375, 0.81207275390625, 0.8425445556640625, 0.873016357421875, 0.9034881591796875, 0.9339599609375, 0.9644317626953125, 0.994903564453125, 1.0253753662109375, 1.05584716796875, 1.0863189697265625, 1.116790771484375, 1.1472625732421875, 1.177734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 9.0, 23.0, 14.0, 55.0, 158.0, 350.0, 253.0, 83.0, 36.0, 10.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.84917449951172, -35.09694290161133, -34.34470748901367, -33.59247589111328, -32.84024429321289, -32.0880126953125, -31.335779190063477, -30.583545684814453, -29.831314086914062, -29.07908058166504, -28.32684898376465, -27.574615478515625, -26.822383880615234, -26.07015037536621, -25.31791877746582, -24.565685272216797, -23.813453674316406, -23.061220169067383, -22.308988571166992, -21.55675506591797, -20.804523468017578, -20.052289962768555, -19.300058364868164, -18.54782485961914, -17.795591354370117, -17.043357849121094, -16.291126251220703, -15.538893699645996, -14.786661148071289, -14.034428596496582, -13.282196044921875, -12.529962539672852, -11.777731895446777, -11.02549934387207, -10.273266792297363, -9.521034240722656, -8.76880168914795, -8.016569137573242, -7.264336109161377, -6.51210355758667, -5.759871006011963, -5.007638454437256, -4.255405902862549, -3.5031731128692627, -2.7509405612945557, -1.9987080097198486, -1.2464752197265625, -0.49424266815185547, 0.25798988342285156, 1.0102224349975586, 1.7624551057815552, 2.5146877765655518, 3.266920328140259, 4.019152641296387, 4.771385669708252, 5.523618221282959, 6.275850772857666, 7.028083324432373, 7.78031587600708, 8.532548904418945, 9.284781455993652, 10.03701400756836, 10.789246559143066, 11.541479110717773, 12.29371166229248]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 10.0, 7.0, 9.0, 13.0, 15.0, 23.0, 22.0, 33.0, 36.0, 21.0, 32.0, 31.0, 43.0, 42.0, 58.0, 65.0, 59.0, 57.0, 50.0, 38.0, 51.0, 34.0, 37.0, 27.0, 33.0, 26.0, 24.0, 17.0, 17.0, 16.0, 7.0, 9.0, 9.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.269038200378418, -8.945643424987793, -8.622248649597168, -8.298853874206543, -7.975459575653076, -7.652064800262451, -7.328670501708984, -7.005275726318359, -6.681880950927734, -6.358486175537109, -6.035091400146484, -5.711697101593018, -5.388302326202393, -5.064907550811768, -4.741513252258301, -4.418118476867676, -4.094723701477051, -3.771328926086426, -3.44793438911438, -3.124539852142334, -2.801145076751709, -2.477750301361084, -2.154355764389038, -1.8309612274169922, -1.5075664520263672, -1.1841717958450317, -0.8607771396636963, -0.5373824834823608, -0.2139878273010254, 0.10940682888031006, 0.4328014850616455, 0.7561960220336914, 1.07958984375, 1.4029844999313354, 1.726379156112671, 2.049773693084717, 2.373168468475342, 2.696563243865967, 3.0199577808380127, 3.3433523178100586, 3.6667470932006836, 3.9901418685913086, 4.313536643981934, 4.6369309425354, 4.960325717926025, 5.28372049331665, 5.607114791870117, 5.930509567260742, 6.253904342651367, 6.577299118041992, 6.900693893432617, 7.224088191986084, 7.547482967376709, 7.870877742767334, 8.1942720413208, 8.517666816711426, 8.84106159210205, 9.164456367492676, 9.4878511428833, 9.811245918273926, 10.134639739990234, 10.45803451538086, 10.781429290771484, 11.10482406616211, 11.428218841552734]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 14.0, 17.0, 30.0, 59.0, 91.0, 134.0, 225.0, 310.0, 523.0, 770.0, 1381.0, 2586.0, 5966.0, 17684.0, 106410.0, 1815875.0, 2100445.0, 111956.0, 17080.0, 5817.0, 2771.0, 1514.0, 968.0, 543.0, 358.0, 237.0, 164.0, 104.0, 68.0, 37.0, 46.0, 23.0, 16.0, 8.0, 10.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.283203125, -1.243133544921875, -1.20306396484375, -1.162994384765625, -1.1229248046875, -1.082855224609375, -1.04278564453125, -1.002716064453125, -0.962646484375, -0.922576904296875, -0.88250732421875, -0.842437744140625, -0.8023681640625, -0.762298583984375, -0.72222900390625, -0.682159423828125, -0.64208984375, -0.602020263671875, -0.56195068359375, -0.521881103515625, -0.4818115234375, -0.441741943359375, -0.40167236328125, -0.361602783203125, -0.321533203125, -0.281463623046875, -0.24139404296875, -0.201324462890625, -0.1612548828125, -0.121185302734375, -0.08111572265625, -0.041046142578125, -0.0009765625, 0.039093017578125, 0.07916259765625, 0.119232177734375, 0.1593017578125, 0.199371337890625, 0.23944091796875, 0.279510498046875, 0.319580078125, 0.359649658203125, 0.39971923828125, 0.439788818359375, 0.4798583984375, 0.519927978515625, 0.55999755859375, 0.600067138671875, 0.64013671875, 0.680206298828125, 0.72027587890625, 0.760345458984375, 0.8004150390625, 0.840484619140625, 0.88055419921875, 0.920623779296875, 0.960693359375, 1.000762939453125, 1.04083251953125, 1.080902099609375, 1.1209716796875, 1.161041259765625, 1.20111083984375, 1.241180419921875, 1.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 9.0, 14.0, 22.0, 21.0, 25.0, 39.0, 59.0, 44.0, 62.0, 83.0, 80.0, 81.0, 91.0, 72.0, 61.0, 44.0, 43.0, 51.0, 33.0, 21.0, 12.0, 12.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.637908935546875, -0.60980224609375, -0.581695556640625, -0.5535888671875, -0.525482177734375, -0.49737548828125, -0.469268798828125, -0.441162109375, -0.413055419921875, -0.38494873046875, -0.356842041015625, -0.3287353515625, -0.300628662109375, -0.27252197265625, -0.244415283203125, -0.21630859375, -0.188201904296875, -0.16009521484375, -0.131988525390625, -0.1038818359375, -0.075775146484375, -0.04766845703125, -0.019561767578125, 0.008544921875, 0.036651611328125, 0.06475830078125, 0.092864990234375, 0.1209716796875, 0.149078369140625, 0.17718505859375, 0.205291748046875, 0.2333984375, 0.261505126953125, 0.28961181640625, 0.317718505859375, 0.3458251953125, 0.373931884765625, 0.40203857421875, 0.430145263671875, 0.458251953125, 0.486358642578125, 0.51446533203125, 0.542572021484375, 0.5706787109375, 0.598785400390625, 0.62689208984375, 0.654998779296875, 0.68310546875, 0.711212158203125, 0.73931884765625, 0.767425537109375, 0.7955322265625, 0.823638916015625, 0.85174560546875, 0.879852294921875, 0.907958984375, 0.936065673828125, 0.96417236328125, 0.992279052734375, 1.0203857421875, 1.048492431640625, 1.07659912109375, 1.104705810546875, 1.1328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 8.0, 13.0, 11.0, 17.0, 25.0, 34.0, 50.0, 65.0, 77.0, 113.0, 194.0, 288.0, 404.0, 659.0, 1071.0, 2064.0, 4078.0, 10145.0, 35197.0, 271918.0, 3510002.0, 300056.0, 38480.0, 10759.0, 4087.0, 1900.0, 1029.0, 595.0, 295.0, 219.0, 141.0, 90.0, 58.0, 32.0, 34.0, 19.0, 16.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685546875, -1.63525390625, -1.5849609375, -1.53466796875, -1.484375, -1.43408203125, -1.3837890625, -1.33349609375, -1.283203125, -1.23291015625, -1.1826171875, -1.13232421875, -1.08203125, -1.03173828125, -0.9814453125, -0.93115234375, -0.880859375, -0.83056640625, -0.7802734375, -0.72998046875, -0.6796875, -0.62939453125, -0.5791015625, -0.52880859375, -0.478515625, -0.42822265625, -0.3779296875, -0.32763671875, -0.27734375, -0.22705078125, -0.1767578125, -0.12646484375, -0.076171875, -0.02587890625, 0.0244140625, 0.07470703125, 0.125, 0.17529296875, 0.2255859375, 0.27587890625, 0.326171875, 0.37646484375, 0.4267578125, 0.47705078125, 0.52734375, 0.57763671875, 0.6279296875, 0.67822265625, 0.728515625, 0.77880859375, 0.8291015625, 0.87939453125, 0.9296875, 0.97998046875, 1.0302734375, 1.08056640625, 1.130859375, 1.18115234375, 1.2314453125, 1.28173828125, 1.33203125, 1.38232421875, 1.4326171875, 1.48291015625, 1.533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 10.0, 13.0, 11.0, 22.0, 33.0, 46.0, 100.0, 224.0, 474.0, 1006.0, 1088.0, 522.0, 225.0, 102.0, 45.0, 49.0, 23.0, 19.0, 18.0, 10.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.6510009765625, -2.581298828125, -2.5115966796875, -2.44189453125, -2.3721923828125, -2.302490234375, -2.2327880859375, -2.1630859375, -2.0933837890625, -2.023681640625, -1.9539794921875, -1.88427734375, -1.8145751953125, -1.744873046875, -1.6751708984375, -1.60546875, -1.5357666015625, -1.466064453125, -1.3963623046875, -1.32666015625, -1.2569580078125, -1.187255859375, -1.1175537109375, -1.0478515625, -0.9781494140625, -0.908447265625, -0.8387451171875, -0.76904296875, -0.6993408203125, -0.629638671875, -0.5599365234375, -0.490234375, -0.4205322265625, -0.350830078125, -0.2811279296875, -0.21142578125, -0.1417236328125, -0.072021484375, -0.0023193359375, 0.0673828125, 0.1370849609375, 0.206787109375, 0.2764892578125, 0.34619140625, 0.4158935546875, 0.485595703125, 0.5552978515625, 0.625, 0.6947021484375, 0.764404296875, 0.8341064453125, 0.90380859375, 0.9735107421875, 1.043212890625, 1.1129150390625, 1.1826171875, 1.2523193359375, 1.322021484375, 1.3917236328125, 1.46142578125, 1.5311279296875, 1.600830078125, 1.6705322265625, 1.740234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 9.0, 24.0, 63.0, 155.0, 295.0, 215.0, 131.0, 45.0, 22.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.463030815124512, -14.75528335571289, -14.047536849975586, -13.339789390563965, -12.632041931152344, -11.924294471740723, -11.216547012329102, -10.508800506591797, -9.801053047180176, -9.093305587768555, -8.38555908203125, -7.677811622619629, -6.970064163208008, -6.262316703796387, -5.554569721221924, -4.846822738647461, -4.13907527923584, -3.431328058242798, -2.723580837249756, -2.015833616256714, -1.3080863952636719, -0.6003391742706299, 0.10740804672241211, 0.815155029296875, 1.522902488708496, 2.230649709701538, 2.93839693069458, 3.646144151687622, 4.353891372680664, 5.061638832092285, 5.769385814666748, 6.477132797241211, 7.184881210327148, 7.8926286697387695, 8.60037612915039, 9.308122634887695, 10.015870094299316, 10.723617553710938, 11.431364059448242, 12.139111518859863, 12.846858978271484, 13.554606437683105, 14.262353897094727, 14.970100402832031, 15.677847862243652, 16.385595321655273, 17.093341827392578, 17.801090240478516, 18.50883674621582, 19.216583251953125, 19.924331665039062, 20.632078170776367, 21.339824676513672, 22.04757308959961, 22.755319595336914, 23.46306610107422, 24.170814514160156, 24.87856101989746, 25.5863094329834, 26.294055938720703, 27.00180435180664, 27.709550857543945, 28.41729736328125, 29.125045776367188, 29.832792282104492]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 7.0, 14.0, 15.0, 20.0, 21.0, 22.0, 28.0, 36.0, 38.0, 44.0, 58.0, 52.0, 49.0, 57.0, 52.0, 44.0, 59.0, 47.0, 37.0, 40.0, 36.0, 44.0, 27.0, 22.0, 23.0, 18.0, 12.0, 15.0, 12.0, 16.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-9.771305084228516, -9.531112670898438, -9.290921211242676, -9.050728797912598, -8.81053638458252, -8.570343971252441, -8.33015251159668, -8.089960098266602, -7.849767684936523, -7.6095757484436035, -7.369383335113525, -7.1291913986206055, -6.888998985290527, -6.648807048797607, -6.4086151123046875, -6.168422698974609, -5.9282307624816895, -5.6880388259887695, -5.447846412658691, -5.2076544761657715, -4.967462062835693, -4.727270126342773, -4.487077713012695, -4.246885776519775, -4.0066938400268555, -3.7665016651153564, -3.5263094902038574, -3.2861175537109375, -3.0459251403808594, -2.8057332038879395, -2.5655410289764404, -2.3253488540649414, -2.0851564407348633, -1.8449642658233643, -1.6047720909118652, -1.3645800352096558, -1.1243878602981567, -0.8841956853866577, -0.6440036296844482, -0.4038114547729492, -0.1636192798614502, 0.07657286524772644, 0.3167650103569031, 0.5569571256637573, 0.7971493005752563, 1.0373414754867554, 1.2775335311889648, 1.5177257061004639, 1.757917881011963, 1.998110055923462, 2.238302230834961, 2.478494167327881, 2.718686580657959, 2.958878517150879, 3.199070692062378, 3.439262866973877, 3.679455041885376, 3.919647216796875, 4.159839153289795, 4.400031566619873, 4.640223503112793, 4.880415916442871, 5.120607852935791, 5.360799789428711, 5.600992202758789]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 5.0, 6.0, 8.0, 17.0, 31.0, 37.0, 57.0, 86.0, 145.0, 207.0, 340.0, 600.0, 1032.0, 1963.0, 4017.0, 9525.0, 26811.0, 96410.0, 417357.0, 366105.0, 83375.0, 23787.0, 8662.0, 3681.0, 1825.0, 976.0, 581.0, 301.0, 214.0, 128.0, 73.0, 64.0, 36.0, 23.0, 18.0, 14.0, 3.0, 3.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4931640625, -1.447845458984375, -1.40252685546875, -1.357208251953125, -1.3118896484375, -1.266571044921875, -1.22125244140625, -1.175933837890625, -1.130615234375, -1.085296630859375, -1.03997802734375, -0.994659423828125, -0.9493408203125, -0.904022216796875, -0.85870361328125, -0.813385009765625, -0.76806640625, -0.722747802734375, -0.67742919921875, -0.632110595703125, -0.5867919921875, -0.541473388671875, -0.49615478515625, -0.450836181640625, -0.405517578125, -0.360198974609375, -0.31488037109375, -0.269561767578125, -0.2242431640625, -0.178924560546875, -0.13360595703125, -0.088287353515625, -0.04296875, 0.002349853515625, 0.04766845703125, 0.092987060546875, 0.1383056640625, 0.183624267578125, 0.22894287109375, 0.274261474609375, 0.319580078125, 0.364898681640625, 0.41021728515625, 0.455535888671875, 0.5008544921875, 0.546173095703125, 0.59149169921875, 0.636810302734375, 0.68212890625, 0.727447509765625, 0.77276611328125, 0.818084716796875, 0.8634033203125, 0.908721923828125, 0.95404052734375, 0.999359130859375, 1.044677734375, 1.089996337890625, 1.13531494140625, 1.180633544921875, 1.2259521484375, 1.271270751953125, 1.31658935546875, 1.361907958984375, 1.4072265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 18.0, 9.0, 34.0, 26.0, 24.0, 29.0, 42.0, 39.0, 45.0, 45.0, 56.0, 52.0, 51.0, 36.0, 46.0, 54.0, 37.0, 52.0, 31.0, 36.0, 40.0, 22.0, 22.0, 18.0, 15.0, 16.0, 17.0, 12.0, 13.0, 9.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5472869873046875, -0.529144287109375, -0.5110015869140625, -0.49285888671875, -0.4747161865234375, -0.456573486328125, -0.4384307861328125, -0.4202880859375, -0.4021453857421875, -0.384002685546875, -0.3658599853515625, -0.34771728515625, -0.3295745849609375, -0.311431884765625, -0.2932891845703125, -0.275146484375, -0.2570037841796875, -0.238861083984375, -0.2207183837890625, -0.20257568359375, -0.1844329833984375, -0.166290283203125, -0.1481475830078125, -0.1300048828125, -0.1118621826171875, -0.093719482421875, -0.0755767822265625, -0.05743408203125, -0.0392913818359375, -0.021148681640625, -0.0030059814453125, 0.01513671875, 0.0332794189453125, 0.051422119140625, 0.0695648193359375, 0.08770751953125, 0.1058502197265625, 0.123992919921875, 0.1421356201171875, 0.1602783203125, 0.1784210205078125, 0.196563720703125, 0.2147064208984375, 0.23284912109375, 0.2509918212890625, 0.269134521484375, 0.2872772216796875, 0.305419921875, 0.3235626220703125, 0.341705322265625, 0.3598480224609375, 0.37799072265625, 0.3961334228515625, 0.414276123046875, 0.4324188232421875, 0.4505615234375, 0.4687042236328125, 0.486846923828125, 0.5049896240234375, 0.52313232421875, 0.5412750244140625, 0.559417724609375, 0.5775604248046875, 0.595703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 10.0, 2.0, 16.0, 18.0, 27.0, 31.0, 54.0, 64.0, 131.0, 208.0, 306.0, 615.0, 1194.0, 2994.0, 10079.0, 72844.0, 852478.0, 90033.0, 11403.0, 3241.0, 1296.0, 597.0, 363.0, 200.0, 115.0, 86.0, 34.0, 35.0, 18.0, 15.0, 11.0, 7.0, 7.0, 8.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.193359375, -3.09521484375, -2.9970703125, -2.89892578125, -2.80078125, -2.70263671875, -2.6044921875, -2.50634765625, -2.408203125, -2.31005859375, -2.2119140625, -2.11376953125, -2.015625, -1.91748046875, -1.8193359375, -1.72119140625, -1.623046875, -1.52490234375, -1.4267578125, -1.32861328125, -1.23046875, -1.13232421875, -1.0341796875, -0.93603515625, -0.837890625, -0.73974609375, -0.6416015625, -0.54345703125, -0.4453125, -0.34716796875, -0.2490234375, -0.15087890625, -0.052734375, 0.04541015625, 0.1435546875, 0.24169921875, 0.33984375, 0.43798828125, 0.5361328125, 0.63427734375, 0.732421875, 0.83056640625, 0.9287109375, 1.02685546875, 1.125, 1.22314453125, 1.3212890625, 1.41943359375, 1.517578125, 1.61572265625, 1.7138671875, 1.81201171875, 1.91015625, 2.00830078125, 2.1064453125, 2.20458984375, 2.302734375, 2.40087890625, 2.4990234375, 2.59716796875, 2.6953125, 2.79345703125, 2.8916015625, 2.98974609375, 3.087890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 12.0, 11.0, 20.0, 21.0, 30.0, 28.0, 28.0, 38.0, 32.0, 33.0, 43.0, 51.0, 48.0, 48.0, 47.0, 53.0, 47.0, 48.0, 42.0, 46.0, 48.0, 34.0, 31.0, 37.0, 29.0, 21.0, 16.0, 16.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.763671875, -2.68365478515625, -2.6036376953125, -2.52362060546875, -2.443603515625, -2.36358642578125, -2.2835693359375, -2.20355224609375, -2.12353515625, -2.04351806640625, -1.9635009765625, -1.88348388671875, -1.803466796875, -1.72344970703125, -1.6434326171875, -1.56341552734375, -1.4833984375, -1.40338134765625, -1.3233642578125, -1.24334716796875, -1.163330078125, -1.08331298828125, -1.0032958984375, -0.92327880859375, -0.84326171875, -0.76324462890625, -0.6832275390625, -0.60321044921875, -0.523193359375, -0.44317626953125, -0.3631591796875, -0.28314208984375, -0.203125, -0.12310791015625, -0.0430908203125, 0.03692626953125, 0.116943359375, 0.19696044921875, 0.2769775390625, 0.35699462890625, 0.43701171875, 0.51702880859375, 0.5970458984375, 0.67706298828125, 0.757080078125, 0.83709716796875, 0.9171142578125, 0.99713134765625, 1.0771484375, 1.15716552734375, 1.2371826171875, 1.31719970703125, 1.397216796875, 1.47723388671875, 1.5572509765625, 1.63726806640625, 1.71728515625, 1.79730224609375, 1.8773193359375, 1.95733642578125, 2.037353515625, 2.11737060546875, 2.1973876953125, 2.27740478515625, 2.357421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 12.0, 7.0, 19.0, 12.0, 15.0, 15.0, 35.0, 40.0, 50.0, 72.0, 90.0, 159.0, 284.0, 497.0, 855.0, 1740.0, 4025.0, 11750.0, 44916.0, 293621.0, 602937.0, 62765.0, 15081.0, 4992.0, 2126.0, 988.0, 529.0, 293.0, 192.0, 107.0, 82.0, 46.0, 34.0, 41.0, 25.0, 25.0, 14.0, 22.0, 4.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.8740234375, -0.8483963012695312, -0.8227691650390625, -0.7971420288085938, -0.771514892578125, -0.7458877563476562, -0.7202606201171875, -0.6946334838867188, -0.66900634765625, -0.6433792114257812, -0.6177520751953125, -0.5921249389648438, -0.566497802734375, -0.5408706665039062, -0.5152435302734375, -0.48961639404296875, -0.4639892578125, -0.43836212158203125, -0.4127349853515625, -0.38710784912109375, -0.361480712890625, -0.33585357666015625, -0.3102264404296875, -0.28459930419921875, -0.25897216796875, -0.23334503173828125, -0.2077178955078125, -0.18209075927734375, -0.156463623046875, -0.13083648681640625, -0.1052093505859375, -0.07958221435546875, -0.053955078125, -0.02832794189453125, -0.0027008056640625, 0.02292633056640625, 0.048553466796875, 0.07418060302734375, 0.0998077392578125, 0.12543487548828125, 0.15106201171875, 0.17668914794921875, 0.2023162841796875, 0.22794342041015625, 0.253570556640625, 0.27919769287109375, 0.3048248291015625, 0.33045196533203125, 0.3560791015625, 0.38170623779296875, 0.4073333740234375, 0.43296051025390625, 0.458587646484375, 0.48421478271484375, 0.5098419189453125, 0.5354690551757812, 0.56109619140625, 0.5867233276367188, 0.6123504638671875, 0.6379776000976562, 0.663604736328125, 0.6892318725585938, 0.7148590087890625, 0.7404861450195312, 0.76611328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 20.0, 30.0, 29.0, 35.0, 54.0, 68.0, 88.0, 132.0, 132.0, 85.0, 52.0, 36.0, 38.0, 29.0, 29.0, 17.0, 16.0, 11.0, 11.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001933574676513672, -0.00018686801195144653, -0.00018037855625152588, -0.00017388910055160522, -0.00016739964485168457, -0.00016091018915176392, -0.00015442073345184326, -0.0001479312777519226, -0.00014144182205200195, -0.0001349523663520813, -0.00012846291065216064, -0.00012197345495223999, -0.00011548399925231934, -0.00010899454355239868, -0.00010250508785247803, -9.601563215255737e-05, -8.952617645263672e-05, -8.303672075271606e-05, -7.654726505279541e-05, -7.005780935287476e-05, -6.35683536529541e-05, -5.707889795303345e-05, -5.058944225311279e-05, -4.409998655319214e-05, -3.7610530853271484e-05, -3.112107515335083e-05, -2.4631619453430176e-05, -1.814216375350952e-05, -1.1652708053588867e-05, -5.163252353668213e-06, 1.3262033462524414e-06, 7.815659046173096e-06, 1.430511474609375e-05, 2.0794570446014404e-05, 2.728402614593506e-05, 3.377348184585571e-05, 4.026293754577637e-05, 4.675239324569702e-05, 5.3241848945617676e-05, 5.973130464553833e-05, 6.622076034545898e-05, 7.271021604537964e-05, 7.919967174530029e-05, 8.568912744522095e-05, 9.21785831451416e-05, 9.866803884506226e-05, 0.00010515749454498291, 0.00011164695024490356, 0.00011813640594482422, 0.00012462586164474487, 0.00013111531734466553, 0.00013760477304458618, 0.00014409422874450684, 0.0001505836844444275, 0.00015707314014434814, 0.0001635625958442688, 0.00017005205154418945, 0.0001765415072441101, 0.00018303096294403076, 0.00018952041864395142, 0.00019600987434387207, 0.00020249933004379272, 0.00020898878574371338, 0.00021547824144363403, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 9.0, 22.0, 15.0, 32.0, 67.0, 79.0, 114.0, 193.0, 298.0, 503.0, 954.0, 2253.0, 5921.0, 23047.0, 175689.0, 758186.0, 62133.0, 11939.0, 3717.0, 1568.0, 704.0, 435.0, 233.0, 147.0, 93.0, 47.0, 48.0, 26.0, 14.0, 13.0, 10.0, 11.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0859375, -1.0488433837890625, -1.011749267578125, -0.9746551513671875, -0.93756103515625, -0.9004669189453125, -0.863372802734375, -0.8262786865234375, -0.7891845703125, -0.7520904541015625, -0.714996337890625, -0.6779022216796875, -0.64080810546875, -0.6037139892578125, -0.566619873046875, -0.5295257568359375, -0.492431640625, -0.4553375244140625, -0.418243408203125, -0.3811492919921875, -0.34405517578125, -0.3069610595703125, -0.269866943359375, -0.2327728271484375, -0.1956787109375, -0.1585845947265625, -0.121490478515625, -0.0843963623046875, -0.04730224609375, -0.0102081298828125, 0.026885986328125, 0.0639801025390625, 0.10107421875, 0.1381683349609375, 0.175262451171875, 0.2123565673828125, 0.24945068359375, 0.2865447998046875, 0.323638916015625, 0.3607330322265625, 0.3978271484375, 0.4349212646484375, 0.472015380859375, 0.5091094970703125, 0.54620361328125, 0.5832977294921875, 0.620391845703125, 0.6574859619140625, 0.694580078125, 0.7316741943359375, 0.768768310546875, 0.8058624267578125, 0.84295654296875, 0.8800506591796875, 0.917144775390625, 0.9542388916015625, 0.9913330078125, 1.0284271240234375, 1.065521240234375, 1.1026153564453125, 1.13970947265625, 1.1768035888671875, 1.213897705078125, 1.2509918212890625, 1.2880859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 7.0, 2.0, 3.0, 9.0, 9.0, 17.0, 23.0, 22.0, 23.0, 28.0, 50.0, 54.0, 69.0, 75.0, 99.0, 111.0, 86.0, 72.0, 39.0, 30.0, 39.0, 21.0, 11.0, 18.0, 9.0, 10.0, 9.0, 7.0, 13.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8399276733398438, -0.8136444091796875, -0.7873611450195312, -0.761077880859375, -0.7347946166992188, -0.7085113525390625, -0.6822280883789062, -0.65594482421875, -0.6296615600585938, -0.6033782958984375, -0.5770950317382812, -0.550811767578125, -0.5245285034179688, -0.4982452392578125, -0.47196197509765625, -0.4456787109375, -0.41939544677734375, -0.3931121826171875, -0.36682891845703125, -0.340545654296875, -0.31426239013671875, -0.2879791259765625, -0.26169586181640625, -0.23541259765625, -0.20912933349609375, -0.1828460693359375, -0.15656280517578125, -0.130279541015625, -0.10399627685546875, -0.0777130126953125, -0.05142974853515625, -0.025146484375, 0.00113677978515625, 0.0274200439453125, 0.05370330810546875, 0.079986572265625, 0.10626983642578125, 0.1325531005859375, 0.15883636474609375, 0.18511962890625, 0.21140289306640625, 0.2376861572265625, 0.26396942138671875, 0.290252685546875, 0.31653594970703125, 0.3428192138671875, 0.36910247802734375, 0.3953857421875, 0.42166900634765625, 0.4479522705078125, 0.47423553466796875, 0.500518798828125, 0.5268020629882812, 0.5530853271484375, 0.5793685913085938, 0.60565185546875, 0.6319351196289062, 0.6582183837890625, 0.6845016479492188, 0.710784912109375, 0.7370681762695312, 0.7633514404296875, 0.7896347045898438, 0.81591796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 10.0, 13.0, 45.0, 121.0, 376.0, 259.0, 97.0, 46.0, 18.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.516643524169922, -26.525775909423828, -25.534910202026367, -24.544042587280273, -23.55317497253418, -22.56230926513672, -21.571441650390625, -20.58057403564453, -19.58970832824707, -18.598840713500977, -17.607975006103516, -16.617107391357422, -15.626240730285645, -14.635374069213867, -13.644506454467773, -12.653639793395996, -11.662772178649902, -10.671905517578125, -9.681037902832031, -8.690171241760254, -7.699304580688477, -6.708437442779541, -5.7175703048706055, -4.726703643798828, -3.7358365058898926, -2.744969606399536, -1.7541025876998901, -0.7632355690002441, 0.2276313304901123, 1.2184982299804688, 2.2093653678894043, 3.2002320289611816, 4.191099166870117, 5.181966304779053, 6.17283296585083, 7.163700103759766, 8.154566764831543, 9.14543342590332, 10.136301040649414, 11.127167701721191, 12.118034362792969, 13.108901023864746, 14.09976863861084, 15.090635299682617, 16.08150291442871, 17.072368621826172, 18.063236236572266, 19.05410385131836, 20.044971466064453, 21.035839080810547, 22.026704788208008, 23.0175724029541, 24.008440017700195, 24.999305725097656, 25.99017333984375, 26.981040954589844, 27.971906661987305, 28.9627742767334, 29.95363998413086, 30.944507598876953, 31.935375213623047, 32.92624282836914, 33.91710662841797, 34.90797424316406, 35.898841857910156]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 12.0, 19.0, 23.0, 19.0, 21.0, 31.0, 30.0, 31.0, 29.0, 47.0, 50.0, 38.0, 63.0, 76.0, 67.0, 46.0, 38.0, 38.0, 31.0, 41.0, 27.0, 20.0, 28.0, 29.0, 15.0, 16.0, 13.0, 13.0, 15.0, 9.0, 5.0, 7.0, 9.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.68444538116455, -9.389105796813965, -9.093766212463379, -8.798426628112793, -8.503087043762207, -8.207747459411621, -7.912407875061035, -7.617068290710449, -7.321728706359863, -7.026389122009277, -6.731049537658691, -6.4357099533081055, -6.1403703689575195, -5.845030784606934, -5.549691200256348, -5.254351615905762, -4.959011554718018, -4.663671970367432, -4.368332386016846, -4.07299280166626, -3.777653217315674, -3.482313632965088, -3.186973810195923, -2.891634225845337, -2.596294641494751, -2.300955057144165, -2.005615472793579, -1.7102757692337036, -1.4149361848831177, -1.1195966005325317, -0.8242568969726562, -0.5289173126220703, -0.23357772827148438, 0.06176188588142395, 0.3571015000343323, 0.652441143989563, 0.9477807283401489, 1.2431203126907349, 1.5384600162506104, 1.8337996006011963, 2.1291391849517822, 2.424478769302368, 2.719818353652954, 3.015158176422119, 3.310497760772705, 3.605837345123291, 3.901176929473877, 4.196516513824463, 4.491856098175049, 4.787195682525635, 5.082535266876221, 5.377874851226807, 5.673214435577393, 5.9685540199279785, 6.263894081115723, 6.559233665466309, 6.8545732498168945, 7.1499128341674805, 7.445252418518066, 7.740592002868652, 8.035931587219238, 8.331271171569824, 8.62661075592041, 8.921950340270996, 9.217289924621582]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 10.0, 6.0, 12.0, 29.0, 36.0, 45.0, 70.0, 108.0, 199.0, 319.0, 512.0, 928.0, 1693.0, 3945.0, 10292.0, 61104.0, 1343213.0, 2632096.0, 115136.0, 14820.0, 4803.0, 2151.0, 1124.0, 667.0, 338.0, 245.0, 146.0, 73.0, 37.0, 31.0, 24.0, 23.0, 13.0, 7.0, 3.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5302734375, -1.482635498046875, -1.43499755859375, -1.387359619140625, -1.3397216796875, -1.292083740234375, -1.24444580078125, -1.196807861328125, -1.149169921875, -1.101531982421875, -1.05389404296875, -1.006256103515625, -0.9586181640625, -0.910980224609375, -0.86334228515625, -0.815704345703125, -0.76806640625, -0.720428466796875, -0.67279052734375, -0.625152587890625, -0.5775146484375, -0.529876708984375, -0.48223876953125, -0.434600830078125, -0.386962890625, -0.339324951171875, -0.29168701171875, -0.244049072265625, -0.1964111328125, -0.148773193359375, -0.10113525390625, -0.053497314453125, -0.005859375, 0.041778564453125, 0.08941650390625, 0.137054443359375, 0.1846923828125, 0.232330322265625, 0.27996826171875, 0.327606201171875, 0.375244140625, 0.422882080078125, 0.47052001953125, 0.518157958984375, 0.5657958984375, 0.613433837890625, 0.66107177734375, 0.708709716796875, 0.75634765625, 0.803985595703125, 0.85162353515625, 0.899261474609375, 0.9468994140625, 0.994537353515625, 1.04217529296875, 1.089813232421875, 1.137451171875, 1.185089111328125, 1.23272705078125, 1.280364990234375, 1.3280029296875, 1.375640869140625, 1.42327880859375, 1.470916748046875, 1.5185546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 6.0, 13.0, 12.0, 15.0, 16.0, 39.0, 30.0, 29.0, 36.0, 49.0, 49.0, 53.0, 56.0, 64.0, 54.0, 57.0, 53.0, 48.0, 40.0, 47.0, 34.0, 33.0, 34.0, 24.0, 14.0, 19.0, 15.0, 11.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.466522216796875, -0.44671630859375, -0.426910400390625, -0.4071044921875, -0.387298583984375, -0.36749267578125, -0.347686767578125, -0.327880859375, -0.308074951171875, -0.28826904296875, -0.268463134765625, -0.2486572265625, -0.228851318359375, -0.20904541015625, -0.189239501953125, -0.16943359375, -0.149627685546875, -0.12982177734375, -0.110015869140625, -0.0902099609375, -0.070404052734375, -0.05059814453125, -0.030792236328125, -0.010986328125, 0.008819580078125, 0.02862548828125, 0.048431396484375, 0.0682373046875, 0.088043212890625, 0.10784912109375, 0.127655029296875, 0.1474609375, 0.167266845703125, 0.18707275390625, 0.206878662109375, 0.2266845703125, 0.246490478515625, 0.26629638671875, 0.286102294921875, 0.305908203125, 0.325714111328125, 0.34552001953125, 0.365325927734375, 0.3851318359375, 0.404937744140625, 0.42474365234375, 0.444549560546875, 0.46435546875, 0.484161376953125, 0.50396728515625, 0.523773193359375, 0.5435791015625, 0.563385009765625, 0.58319091796875, 0.602996826171875, 0.622802734375, 0.642608642578125, 0.66241455078125, 0.682220458984375, 0.7020263671875, 0.721832275390625, 0.74163818359375, 0.761444091796875, 0.78125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 3.0, 10.0, 15.0, 18.0, 30.0, 25.0, 52.0, 67.0, 82.0, 135.0, 201.0, 305.0, 453.0, 709.0, 1215.0, 2107.0, 4187.0, 9529.0, 31476.0, 231390.0, 3440104.0, 410822.0, 39873.0, 10911.0, 4519.0, 2339.0, 1376.0, 802.0, 523.0, 336.0, 207.0, 126.0, 96.0, 72.0, 47.0, 25.0, 30.0, 18.0, 8.0, 10.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7060546875, -1.6552734375, -1.6044921875, -1.5537109375, -1.5029296875, -1.4521484375, -1.4013671875, -1.3505859375, -1.2998046875, -1.2490234375, -1.1982421875, -1.1474609375, -1.0966796875, -1.0458984375, -0.9951171875, -0.9443359375, -0.8935546875, -0.8427734375, -0.7919921875, -0.7412109375, -0.6904296875, -0.6396484375, -0.5888671875, -0.5380859375, -0.4873046875, -0.4365234375, -0.3857421875, -0.3349609375, -0.2841796875, -0.2333984375, -0.1826171875, -0.1318359375, -0.0810546875, -0.0302734375, 0.0205078125, 0.0712890625, 0.1220703125, 0.1728515625, 0.2236328125, 0.2744140625, 0.3251953125, 0.3759765625, 0.4267578125, 0.4775390625, 0.5283203125, 0.5791015625, 0.6298828125, 0.6806640625, 0.7314453125, 0.7822265625, 0.8330078125, 0.8837890625, 0.9345703125, 0.9853515625, 1.0361328125, 1.0869140625, 1.1376953125, 1.1884765625, 1.2392578125, 1.2900390625, 1.3408203125, 1.3916015625, 1.4423828125, 1.4931640625, 1.5439453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 11.0, 14.0, 17.0, 23.0, 51.0, 65.0, 125.0, 208.0, 412.0, 911.0, 1002.0, 625.0, 267.0, 161.0, 52.0, 38.0, 17.0, 15.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.287109375, -2.2202301025390625, -2.153350830078125, -2.0864715576171875, -2.01959228515625, -1.9527130126953125, -1.885833740234375, -1.8189544677734375, -1.7520751953125, -1.6851959228515625, -1.618316650390625, -1.5514373779296875, -1.48455810546875, -1.4176788330078125, -1.350799560546875, -1.2839202880859375, -1.217041015625, -1.1501617431640625, -1.083282470703125, -1.0164031982421875, -0.94952392578125, -0.8826446533203125, -0.815765380859375, -0.7488861083984375, -0.6820068359375, -0.6151275634765625, -0.548248291015625, -0.4813690185546875, -0.41448974609375, -0.3476104736328125, -0.280731201171875, -0.2138519287109375, -0.14697265625, -0.0800933837890625, -0.013214111328125, 0.0536651611328125, 0.12054443359375, 0.1874237060546875, 0.254302978515625, 0.3211822509765625, 0.3880615234375, 0.4549407958984375, 0.521820068359375, 0.5886993408203125, 0.65557861328125, 0.7224578857421875, 0.789337158203125, 0.8562164306640625, 0.923095703125, 0.9899749755859375, 1.056854248046875, 1.1237335205078125, 1.19061279296875, 1.2574920654296875, 1.324371337890625, 1.3912506103515625, 1.4581298828125, 1.5250091552734375, 1.591888427734375, 1.6587677001953125, 1.72564697265625, 1.7925262451171875, 1.859405517578125, 1.9262847900390625, 1.9931640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 19.0, 38.0, 119.0, 267.0, 291.0, 136.0, 72.0, 22.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.20813751220703, -32.40103530883789, -31.59393310546875, -30.786828994750977, -29.979726791381836, -29.172624588012695, -28.365520477294922, -27.55841827392578, -26.75131607055664, -25.9442138671875, -25.13711166381836, -24.330007553100586, -23.522905349731445, -22.715803146362305, -21.90869903564453, -21.10159683227539, -20.29449462890625, -19.48739242553711, -18.68029022216797, -17.873186111450195, -17.066083908081055, -16.258981704711914, -15.451878547668457, -14.644775390625, -13.83767318725586, -13.030570983886719, -12.223467826843262, -11.416364669799805, -10.609262466430664, -9.802160263061523, -8.995057106018066, -8.18795394897461, -7.380851745605469, -6.57374906539917, -5.766646385192871, -4.959543704986572, -4.152441024780273, -3.3453383445739746, -2.538235664367676, -1.731132984161377, -0.9240303039550781, -0.1169276237487793, 0.6901750564575195, 1.4972777366638184, 2.304380416870117, 3.111483097076416, 3.918585777282715, 4.725688457489014, 5.5327911376953125, 6.339893817901611, 7.14699649810791, 7.954099178314209, 8.761201858520508, 9.568304061889648, 10.375407218933105, 11.182510375976562, 11.989612579345703, 12.796714782714844, 13.6038179397583, 14.410921096801758, 15.218023300170898, 16.02512550354004, 16.832229614257812, 17.639331817626953, 18.446434020996094]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 15.0, 3.0, 11.0, 6.0, 9.0, 13.0, 20.0, 23.0, 24.0, 24.0, 29.0, 28.0, 30.0, 42.0, 28.0, 42.0, 43.0, 33.0, 45.0, 43.0, 43.0, 49.0, 38.0, 48.0, 48.0, 36.0, 33.0, 35.0, 32.0, 23.0, 17.0, 23.0, 9.0, 5.0, 11.0, 8.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.239570617675781, -7.022808074951172, -6.8060455322265625, -6.589283466339111, -6.372520923614502, -6.155758380889893, -5.938996315002441, -5.722233772277832, -5.505471229553223, -5.288708686828613, -5.071946144104004, -4.855184078216553, -4.638421535491943, -4.421658992767334, -4.204896926879883, -3.9881343841552734, -3.771371841430664, -3.5546092987060547, -3.3378469944000244, -3.121084690093994, -2.9043221473693848, -2.6875596046447754, -2.470797300338745, -2.254034996032715, -2.0372724533081055, -1.8205100297927856, -1.6037476062774658, -1.386985182762146, -1.1702227592468262, -0.9534603357315063, -0.7366979122161865, -0.5199354887008667, -0.3031735420227051, -0.08641111850738525, 0.13035130500793457, 0.3471137285232544, 0.5638761520385742, 0.780638575553894, 0.9974009990692139, 1.2141634225845337, 1.4309258460998535, 1.6476882696151733, 1.8644506931304932, 2.0812129974365234, 2.297975540161133, 2.514738082885742, 2.7315003871917725, 2.9482626914978027, 3.165025234222412, 3.3817877769470215, 3.5985500812530518, 3.815312385559082, 4.032074928283691, 4.248837471008301, 4.46560001373291, 4.682362079620361, 4.899124622344971, 5.11588716506958, 5.332649230957031, 5.549411773681641, 5.76617431640625, 5.982936859130859, 6.199699401855469, 6.41646146774292, 6.633224010467529]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 31.0, 24.0, 49.0, 77.0, 143.0, 211.0, 411.0, 699.0, 1383.0, 2591.0, 5972.0, 16099.0, 66514.0, 479124.0, 394107.0, 56020.0, 14340.0, 5366.0, 2487.0, 1236.0, 680.0, 398.0, 218.0, 117.0, 79.0, 53.0, 17.0, 13.0, 17.0, 14.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.95587158203125, -1.8883056640625, -1.82073974609375, -1.753173828125, -1.68560791015625, -1.6180419921875, -1.55047607421875, -1.48291015625, -1.41534423828125, -1.3477783203125, -1.28021240234375, -1.212646484375, -1.14508056640625, -1.0775146484375, -1.00994873046875, -0.9423828125, -0.87481689453125, -0.8072509765625, -0.73968505859375, -0.672119140625, -0.60455322265625, -0.5369873046875, -0.46942138671875, -0.40185546875, -0.33428955078125, -0.2667236328125, -0.19915771484375, -0.131591796875, -0.06402587890625, 0.0035400390625, 0.07110595703125, 0.138671875, 0.20623779296875, 0.2738037109375, 0.34136962890625, 0.408935546875, 0.47650146484375, 0.5440673828125, 0.61163330078125, 0.67919921875, 0.74676513671875, 0.8143310546875, 0.88189697265625, 0.949462890625, 1.01702880859375, 1.0845947265625, 1.15216064453125, 1.2197265625, 1.28729248046875, 1.3548583984375, 1.42242431640625, 1.489990234375, 1.55755615234375, 1.6251220703125, 1.69268798828125, 1.76025390625, 1.82781982421875, 1.8953857421875, 1.96295166015625, 2.030517578125, 2.09808349609375, 2.1656494140625, 2.23321533203125, 2.30078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 14.0, 23.0, 19.0, 23.0, 26.0, 33.0, 51.0, 39.0, 48.0, 46.0, 54.0, 52.0, 58.0, 61.0, 48.0, 56.0, 45.0, 34.0, 46.0, 26.0, 28.0, 31.0, 24.0, 16.0, 7.0, 14.0, 15.0, 15.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5726242065429688, -0.5519866943359375, -0.5313491821289062, -0.510711669921875, -0.49007415771484375, -0.4694366455078125, -0.44879913330078125, -0.42816162109375, -0.40752410888671875, -0.3868865966796875, -0.36624908447265625, -0.345611572265625, -0.32497406005859375, -0.3043365478515625, -0.28369903564453125, -0.2630615234375, -0.24242401123046875, -0.2217864990234375, -0.20114898681640625, -0.180511474609375, -0.15987396240234375, -0.1392364501953125, -0.11859893798828125, -0.09796142578125, -0.07732391357421875, -0.0566864013671875, -0.03604888916015625, -0.015411376953125, 0.00522613525390625, 0.0258636474609375, 0.04650115966796875, 0.067138671875, 0.08777618408203125, 0.1084136962890625, 0.12905120849609375, 0.149688720703125, 0.17032623291015625, 0.1909637451171875, 0.21160125732421875, 0.23223876953125, 0.25287628173828125, 0.2735137939453125, 0.29415130615234375, 0.314788818359375, 0.33542633056640625, 0.3560638427734375, 0.37670135498046875, 0.3973388671875, 0.41797637939453125, 0.4386138916015625, 0.45925140380859375, 0.479888916015625, 0.5005264282226562, 0.5211639404296875, 0.5418014526367188, 0.56243896484375, 0.5830764770507812, 0.6037139892578125, 0.6243515014648438, 0.644989013671875, 0.6656265258789062, 0.6862640380859375, 0.7069015502929688, 0.7275390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 17.0, 12.0, 27.0, 26.0, 30.0, 54.0, 78.0, 96.0, 162.0, 242.0, 402.0, 777.0, 1779.0, 4791.0, 19646.0, 235089.0, 741192.0, 32610.0, 6869.0, 2321.0, 974.0, 490.0, 280.0, 173.0, 121.0, 84.0, 61.0, 35.0, 22.0, 21.0, 22.0, 15.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.34765625, -4.22735595703125, -4.1070556640625, -3.98675537109375, -3.866455078125, -3.74615478515625, -3.6258544921875, -3.50555419921875, -3.38525390625, -3.26495361328125, -3.1446533203125, -3.02435302734375, -2.904052734375, -2.78375244140625, -2.6634521484375, -2.54315185546875, -2.4228515625, -2.30255126953125, -2.1822509765625, -2.06195068359375, -1.941650390625, -1.82135009765625, -1.7010498046875, -1.58074951171875, -1.46044921875, -1.34014892578125, -1.2198486328125, -1.09954833984375, -0.979248046875, -0.85894775390625, -0.7386474609375, -0.61834716796875, -0.498046875, -0.37774658203125, -0.2574462890625, -0.13714599609375, -0.016845703125, 0.10345458984375, 0.2237548828125, 0.34405517578125, 0.46435546875, 0.58465576171875, 0.7049560546875, 0.82525634765625, 0.945556640625, 1.06585693359375, 1.1861572265625, 1.30645751953125, 1.4267578125, 1.54705810546875, 1.6673583984375, 1.78765869140625, 1.907958984375, 2.02825927734375, 2.1485595703125, 2.26885986328125, 2.38916015625, 2.50946044921875, 2.6297607421875, 2.75006103515625, 2.870361328125, 2.99066162109375, 3.1109619140625, 3.23126220703125, 3.3515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 3.0, 11.0, 6.0, 14.0, 10.0, 14.0, 16.0, 19.0, 20.0, 35.0, 36.0, 41.0, 51.0, 41.0, 62.0, 56.0, 48.0, 47.0, 58.0, 52.0, 62.0, 56.0, 39.0, 27.0, 38.0, 24.0, 15.0, 11.0, 22.0, 6.0, 14.0, 6.0, 2.0, 10.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.734375, -2.646759033203125, -2.55914306640625, -2.471527099609375, -2.3839111328125, -2.296295166015625, -2.20867919921875, -2.121063232421875, -2.033447265625, -1.945831298828125, -1.85821533203125, -1.770599365234375, -1.6829833984375, -1.595367431640625, -1.50775146484375, -1.420135498046875, -1.33251953125, -1.244903564453125, -1.15728759765625, -1.069671630859375, -0.9820556640625, -0.894439697265625, -0.80682373046875, -0.719207763671875, -0.631591796875, -0.543975830078125, -0.45635986328125, -0.368743896484375, -0.2811279296875, -0.193511962890625, -0.10589599609375, -0.018280029296875, 0.0693359375, 0.156951904296875, 0.24456787109375, 0.332183837890625, 0.4197998046875, 0.507415771484375, 0.59503173828125, 0.682647705078125, 0.770263671875, 0.857879638671875, 0.94549560546875, 1.033111572265625, 1.1207275390625, 1.208343505859375, 1.29595947265625, 1.383575439453125, 1.47119140625, 1.558807373046875, 1.64642333984375, 1.734039306640625, 1.8216552734375, 1.909271240234375, 1.99688720703125, 2.084503173828125, 2.172119140625, 2.259735107421875, 2.34735107421875, 2.434967041015625, 2.5225830078125, 2.610198974609375, 2.69781494140625, 2.785430908203125, 2.873046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 14.0, 13.0, 21.0, 52.0, 67.0, 162.0, 273.0, 716.0, 2161.0, 9675.0, 396768.0, 624794.0, 10187.0, 2201.0, 763.0, 309.0, 153.0, 76.0, 42.0, 20.0, 17.0, 12.0, 9.0, 3.0, 7.0, 6.0, 0.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.036773681640625, -2.95245361328125, -2.868133544921875, -2.7838134765625, -2.699493408203125, -2.61517333984375, -2.530853271484375, -2.446533203125, -2.362213134765625, -2.27789306640625, -2.193572998046875, -2.1092529296875, -2.024932861328125, -1.94061279296875, -1.856292724609375, -1.77197265625, -1.687652587890625, -1.60333251953125, -1.519012451171875, -1.4346923828125, -1.350372314453125, -1.26605224609375, -1.181732177734375, -1.097412109375, -1.013092041015625, -0.92877197265625, -0.844451904296875, -0.7601318359375, -0.675811767578125, -0.59149169921875, -0.507171630859375, -0.4228515625, -0.338531494140625, -0.25421142578125, -0.169891357421875, -0.0855712890625, -0.001251220703125, 0.08306884765625, 0.167388916015625, 0.251708984375, 0.336029052734375, 0.42034912109375, 0.504669189453125, 0.5889892578125, 0.673309326171875, 0.75762939453125, 0.841949462890625, 0.92626953125, 1.010589599609375, 1.09490966796875, 1.179229736328125, 1.2635498046875, 1.347869873046875, 1.43218994140625, 1.516510009765625, 1.600830078125, 1.685150146484375, 1.76947021484375, 1.853790283203125, 1.9381103515625, 2.022430419921875, 2.10675048828125, 2.191070556640625, 2.275390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 15.0, 22.0, 27.0, 44.0, 67.0, 175.0, 293.0, 149.0, 67.0, 37.0, 37.0, 16.0, 15.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003523826599121094, -0.00033731013536453247, -0.00032223761081695557, -0.00030716508626937866, -0.00029209256172180176, -0.00027702003717422485, -0.00026194751262664795, -0.00024687498807907104, -0.00023180246353149414, -0.00021672993898391724, -0.00020165741443634033, -0.00018658488988876343, -0.00017151236534118652, -0.00015643984079360962, -0.00014136731624603271, -0.0001262947916984558, -0.0001112222671508789, -9.6149742603302e-05, -8.10772180557251e-05, -6.60046935081482e-05, -5.093216896057129e-05, -3.5859644412994385e-05, -2.078711986541748e-05, -5.714595317840576e-06, 9.357929229736328e-06, 2.4430453777313232e-05, 3.950297832489014e-05, 5.457550287246704e-05, 6.964802742004395e-05, 8.472055196762085e-05, 9.979307651519775e-05, 0.00011486560106277466, 0.00012993812561035156, 0.00014501065015792847, 0.00016008317470550537, 0.00017515569925308228, 0.00019022822380065918, 0.00020530074834823608, 0.000220373272895813, 0.0002354457974433899, 0.0002505183219909668, 0.0002655908465385437, 0.0002806633710861206, 0.0002957358956336975, 0.0003108084201812744, 0.0003258809447288513, 0.0003409534692764282, 0.0003560259938240051, 0.00037109851837158203, 0.00038617104291915894, 0.00040124356746673584, 0.00041631609201431274, 0.00043138861656188965, 0.00044646114110946655, 0.00046153366565704346, 0.00047660619020462036, 0.0004916787147521973, 0.0005067512392997742, 0.0005218237638473511, 0.000536896288394928, 0.0005519688129425049, 0.0005670413374900818, 0.0005821138620376587, 0.0005971863865852356, 0.0006122589111328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 9.0, 14.0, 8.0, 20.0, 35.0, 59.0, 93.0, 164.0, 347.0, 762.0, 1931.0, 7267.0, 85358.0, 905701.0, 39114.0, 4907.0, 1499.0, 605.0, 270.0, 154.0, 75.0, 49.0, 37.0, 17.0, 16.0, 13.0, 6.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.32110595703125, -2.2554931640625, -2.18988037109375, -2.124267578125, -2.05865478515625, -1.9930419921875, -1.92742919921875, -1.86181640625, -1.79620361328125, -1.7305908203125, -1.66497802734375, -1.599365234375, -1.53375244140625, -1.4681396484375, -1.40252685546875, -1.3369140625, -1.27130126953125, -1.2056884765625, -1.14007568359375, -1.074462890625, -1.00885009765625, -0.9432373046875, -0.87762451171875, -0.81201171875, -0.74639892578125, -0.6807861328125, -0.61517333984375, -0.549560546875, -0.48394775390625, -0.4183349609375, -0.35272216796875, -0.287109375, -0.22149658203125, -0.1558837890625, -0.09027099609375, -0.024658203125, 0.04095458984375, 0.1065673828125, 0.17218017578125, 0.23779296875, 0.30340576171875, 0.3690185546875, 0.43463134765625, 0.500244140625, 0.56585693359375, 0.6314697265625, 0.69708251953125, 0.7626953125, 0.82830810546875, 0.8939208984375, 0.95953369140625, 1.025146484375, 1.09075927734375, 1.1563720703125, 1.22198486328125, 1.28759765625, 1.35321044921875, 1.4188232421875, 1.48443603515625, 1.550048828125, 1.61566162109375, 1.6812744140625, 1.74688720703125, 1.8125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 8.0, 4.0, 14.0, 15.0, 26.0, 38.0, 41.0, 73.0, 116.0, 176.0, 167.0, 103.0, 86.0, 48.0, 29.0, 20.0, 15.0, 9.0, 7.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2345428466796875, -1.186859130859375, -1.1391754150390625, -1.09149169921875, -1.0438079833984375, -0.996124267578125, -0.9484405517578125, -0.9007568359375, -0.8530731201171875, -0.805389404296875, -0.7577056884765625, -0.71002197265625, -0.6623382568359375, -0.614654541015625, -0.5669708251953125, -0.519287109375, -0.4716033935546875, -0.423919677734375, -0.3762359619140625, -0.32855224609375, -0.2808685302734375, -0.233184814453125, -0.1855010986328125, -0.1378173828125, -0.0901336669921875, -0.042449951171875, 0.0052337646484375, 0.05291748046875, 0.1006011962890625, 0.148284912109375, 0.1959686279296875, 0.24365234375, 0.2913360595703125, 0.339019775390625, 0.3867034912109375, 0.43438720703125, 0.4820709228515625, 0.529754638671875, 0.5774383544921875, 0.6251220703125, 0.6728057861328125, 0.720489501953125, 0.7681732177734375, 0.81585693359375, 0.8635406494140625, 0.911224365234375, 0.9589080810546875, 1.006591796875, 1.0542755126953125, 1.101959228515625, 1.1496429443359375, 1.19732666015625, 1.2450103759765625, 1.292694091796875, 1.3403778076171875, 1.3880615234375, 1.4357452392578125, 1.483428955078125, 1.5311126708984375, 1.57879638671875, 1.6264801025390625, 1.674163818359375, 1.7218475341796875, 1.76953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 14.0, 31.0, 70.0, 177.0, 387.0, 173.0, 62.0, 41.0, 10.0, 11.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.612131118774414, -28.675294876098633, -27.73845863342285, -26.80162239074707, -25.86478614807129, -24.927949905395508, -23.991113662719727, -23.054277420043945, -22.117441177368164, -21.180604934692383, -20.2437686920166, -19.30693244934082, -18.37009620666504, -17.433259963989258, -16.496423721313477, -15.559587478637695, -14.622751235961914, -13.685914993286133, -12.749078750610352, -11.81224250793457, -10.875406265258789, -9.938570022583008, -9.001733779907227, -8.064897537231445, -7.128061294555664, -6.191225051879883, -5.254388809204102, -4.31755256652832, -3.380716323852539, -2.443880081176758, -1.5070438385009766, -0.5702075958251953, 0.36663055419921875, 1.303466796875, 2.2403030395507812, 3.1771392822265625, 4.113975524902344, 5.050811767578125, 5.987648010253906, 6.9244842529296875, 7.861320495605469, 8.79815673828125, 9.734992980957031, 10.671829223632812, 11.608665466308594, 12.545501708984375, 13.482337951660156, 14.419174194335938, 15.356010437011719, 16.2928466796875, 17.22968292236328, 18.166519165039062, 19.103355407714844, 20.040191650390625, 20.977027893066406, 21.913864135742188, 22.85070037841797, 23.78753662109375, 24.72437286376953, 25.661209106445312, 26.598045349121094, 27.534881591796875, 28.471717834472656, 29.408554077148438, 30.34539031982422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 5.0, 7.0, 3.0, 9.0, 8.0, 9.0, 12.0, 24.0, 26.0, 19.0, 30.0, 34.0, 43.0, 35.0, 45.0, 61.0, 61.0, 75.0, 90.0, 60.0, 56.0, 46.0, 41.0, 28.0, 32.0, 17.0, 29.0, 28.0, 14.0, 13.0, 12.0, 9.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.289093017578125, -15.860479354858398, -15.431865692138672, -15.003252983093262, -14.574639320373535, -14.146025657653809, -13.717411994934082, -13.288799285888672, -12.860185623168945, -12.431571960449219, -12.002958297729492, -11.574345588684082, -11.145731925964355, -10.717118263244629, -10.288504600524902, -9.859891891479492, -9.431278228759766, -9.002664566040039, -8.574050903320312, -8.145438194274902, -7.716824531555176, -7.288210868835449, -6.859597206115723, -6.430984020233154, -6.0023698806762695, -5.573756217956543, -5.145143032073975, -4.716529369354248, -4.28791618347168, -3.859302520751953, -3.4306890964508057, -3.002075672149658, -2.57346248626709, -2.1448490619659424, -1.716235637664795, -1.287622094154358, -0.8590086698532104, -0.43039512634277344, -0.0017817020416259766, 0.4268317222595215, 0.855445146560669, 1.2840585708618164, 1.7126719951629639, 2.1412854194641113, 2.569899082183838, 2.9985125064849854, 3.427125930786133, 3.8557393550872803, 4.284352779388428, 4.712966442108154, 5.141579627990723, 5.570193290710449, 5.998806476593018, 6.427420139312744, 6.8560333251953125, 7.284646987915039, 7.713260650634766, 8.141874313354492, 8.570487976074219, 8.999100685119629, 9.427714347839355, 9.856328010559082, 10.284941673278809, 10.713554382324219, 11.142168045043945]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 11.0, 12.0, 26.0, 43.0, 65.0, 99.0, 148.0, 259.0, 450.0, 875.0, 1949.0, 5273.0, 25367.0, 417320.0, 3476781.0, 238772.0, 18603.0, 4680.0, 1748.0, 770.0, 419.0, 237.0, 143.0, 83.0, 53.0, 21.0, 19.0, 24.0, 11.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.21484375, -2.1613616943359375, -2.107879638671875, -2.0543975830078125, -2.00091552734375, -1.9474334716796875, -1.893951416015625, -1.8404693603515625, -1.7869873046875, -1.7335052490234375, -1.680023193359375, -1.6265411376953125, -1.57305908203125, -1.5195770263671875, -1.466094970703125, -1.4126129150390625, -1.359130859375, -1.3056488037109375, -1.252166748046875, -1.1986846923828125, -1.14520263671875, -1.0917205810546875, -1.038238525390625, -0.9847564697265625, -0.9312744140625, -0.8777923583984375, -0.824310302734375, -0.7708282470703125, -0.71734619140625, -0.6638641357421875, -0.610382080078125, -0.5569000244140625, -0.50341796875, -0.4499359130859375, -0.396453857421875, -0.3429718017578125, -0.28948974609375, -0.2360076904296875, -0.182525634765625, -0.1290435791015625, -0.0755615234375, -0.0220794677734375, 0.031402587890625, 0.0848846435546875, 0.13836669921875, 0.1918487548828125, 0.245330810546875, 0.2988128662109375, 0.352294921875, 0.4057769775390625, 0.459259033203125, 0.5127410888671875, 0.56622314453125, 0.6197052001953125, 0.673187255859375, 0.7266693115234375, 0.7801513671875, 0.8336334228515625, 0.887115478515625, 0.9405975341796875, 0.99407958984375, 1.0475616455078125, 1.101043701171875, 1.1545257568359375, 1.2080078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 0.0, 3.0, 7.0, 8.0, 10.0, 26.0, 18.0, 30.0, 29.0, 45.0, 54.0, 48.0, 53.0, 70.0, 59.0, 73.0, 70.0, 71.0, 58.0, 51.0, 46.0, 31.0, 32.0, 27.0, 24.0, 23.0, 12.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.9037399291992188, -0.8768157958984375, -0.8498916625976562, -0.822967529296875, -0.7960433959960938, -0.7691192626953125, -0.7421951293945312, -0.71527099609375, -0.6883468627929688, -0.6614227294921875, -0.6344985961914062, -0.607574462890625, -0.5806503295898438, -0.5537261962890625, -0.5268020629882812, -0.4998779296875, -0.47295379638671875, -0.4460296630859375, -0.41910552978515625, -0.392181396484375, -0.36525726318359375, -0.3383331298828125, -0.31140899658203125, -0.28448486328125, -0.25756072998046875, -0.2306365966796875, -0.20371246337890625, -0.176788330078125, -0.14986419677734375, -0.1229400634765625, -0.09601593017578125, -0.069091796875, -0.04216766357421875, -0.0152435302734375, 0.01168060302734375, 0.038604736328125, 0.06552886962890625, 0.0924530029296875, 0.11937713623046875, 0.14630126953125, 0.17322540283203125, 0.2001495361328125, 0.22707366943359375, 0.253997802734375, 0.28092193603515625, 0.3078460693359375, 0.33477020263671875, 0.3616943359375, 0.38861846923828125, 0.4155426025390625, 0.44246673583984375, 0.469390869140625, 0.49631500244140625, 0.5232391357421875, 0.5501632690429688, 0.57708740234375, 0.6040115356445312, 0.6309356689453125, 0.6578598022460938, 0.684783935546875, 0.7117080688476562, 0.7386322021484375, 0.7655563354492188, 0.79248046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 9.0, 11.0, 28.0, 35.0, 76.0, 141.0, 289.0, 654.0, 1646.0, 4527.0, 17918.0, 333963.0, 3768645.0, 52389.0, 8940.0, 2844.0, 1179.0, 491.0, 225.0, 115.0, 67.0, 29.0, 27.0, 9.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8050537109375, -2.705810546875, -2.6065673828125, -2.50732421875, -2.4080810546875, -2.308837890625, -2.2095947265625, -2.1103515625, -2.0111083984375, -1.911865234375, -1.8126220703125, -1.71337890625, -1.6141357421875, -1.514892578125, -1.4156494140625, -1.31640625, -1.2171630859375, -1.117919921875, -1.0186767578125, -0.91943359375, -0.8201904296875, -0.720947265625, -0.6217041015625, -0.5224609375, -0.4232177734375, -0.323974609375, -0.2247314453125, -0.12548828125, -0.0262451171875, 0.072998046875, 0.1722412109375, 0.271484375, 0.3707275390625, 0.469970703125, 0.5692138671875, 0.66845703125, 0.7677001953125, 0.866943359375, 0.9661865234375, 1.0654296875, 1.1646728515625, 1.263916015625, 1.3631591796875, 1.46240234375, 1.5616455078125, 1.660888671875, 1.7601318359375, 1.859375, 1.9586181640625, 2.057861328125, 2.1571044921875, 2.25634765625, 2.3555908203125, 2.454833984375, 2.5540771484375, 2.6533203125, 2.7525634765625, 2.851806640625, 2.9510498046875, 3.05029296875, 3.1495361328125, 3.248779296875, 3.3480224609375, 3.447265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 20.0, 19.0, 35.0, 53.0, 132.0, 388.0, 957.0, 1293.0, 696.0, 225.0, 88.0, 52.0, 25.0, 13.0, 16.0, 12.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.1817626953125, -2.092041015625, -2.0023193359375, -1.91259765625, -1.8228759765625, -1.733154296875, -1.6434326171875, -1.5537109375, -1.4639892578125, -1.374267578125, -1.2845458984375, -1.19482421875, -1.1051025390625, -1.015380859375, -0.9256591796875, -0.8359375, -0.7462158203125, -0.656494140625, -0.5667724609375, -0.47705078125, -0.3873291015625, -0.297607421875, -0.2078857421875, -0.1181640625, -0.0284423828125, 0.061279296875, 0.1510009765625, 0.24072265625, 0.3304443359375, 0.420166015625, 0.5098876953125, 0.599609375, 0.6893310546875, 0.779052734375, 0.8687744140625, 0.95849609375, 1.0482177734375, 1.137939453125, 1.2276611328125, 1.3173828125, 1.4071044921875, 1.496826171875, 1.5865478515625, 1.67626953125, 1.7659912109375, 1.855712890625, 1.9454345703125, 2.03515625, 2.1248779296875, 2.214599609375, 2.3043212890625, 2.39404296875, 2.4837646484375, 2.573486328125, 2.6632080078125, 2.7529296875, 2.8426513671875, 2.932373046875, 3.0220947265625, 3.11181640625, 3.2015380859375, 3.291259765625, 3.3809814453125, 3.470703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 5.0, 19.0, 40.0, 81.0, 143.0, 263.0, 210.0, 107.0, 60.0, 26.0, 15.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.807705879211426, -13.204265594482422, -12.600826263427734, -11.99738597869873, -11.393945693969727, -10.790505409240723, -10.187065124511719, -9.583625793457031, -8.980185508728027, -8.376745223999023, -7.773305416107178, -7.169865608215332, -6.566425323486328, -5.962985038757324, -5.3595452308654785, -4.756105422973633, -4.152665138244629, -3.549225091934204, -2.9457850456237793, -2.3423449993133545, -1.7389049530029297, -1.1354649066925049, -0.5320248603820801, 0.07141494750976562, 0.6748552322387695, 1.2782952785491943, 1.8817353248596191, 2.485175371170044, 3.0886154174804688, 3.6920554637908936, 4.295495510101318, 4.898935317993164, 5.502376556396484, 6.105816841125488, 6.709256649017334, 7.31269645690918, 7.916136741638184, 8.519577026367188, 9.123016357421875, 9.726456642150879, 10.329896926879883, 10.933337211608887, 11.53677749633789, 12.140216827392578, 12.743657112121582, 13.347097396850586, 13.950536727905273, 14.553977012634277, 15.157417297363281, 15.760857582092285, 16.36429786682129, 16.967737197875977, 17.571178436279297, 18.174617767333984, 18.778057098388672, 19.38149642944336, 19.98493766784668, 20.588376998901367, 21.191818237304688, 21.795257568359375, 22.398696899414062, 23.002138137817383, 23.60557746887207, 24.20901870727539, 24.812458038330078]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 8.0, 12.0, 14.0, 7.0, 17.0, 19.0, 27.0, 30.0, 29.0, 33.0, 46.0, 52.0, 51.0, 52.0, 58.0, 50.0, 51.0, 66.0, 60.0, 50.0, 56.0, 32.0, 27.0, 20.0, 25.0, 25.0, 14.0, 10.0, 11.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-10.857721328735352, -10.576395034790039, -10.295068740844727, -10.013742446899414, -9.732416152954102, -9.451089859008789, -9.169763565063477, -8.888437271118164, -8.607110977172852, -8.325784683227539, -8.044458389282227, -7.763132095336914, -7.481805801391602, -7.200479507446289, -6.919153213500977, -6.637826919555664, -6.35650110244751, -6.075174808502197, -5.793848514556885, -5.512522220611572, -5.23119592666626, -4.949869632720947, -4.668543815612793, -4.3872175216674805, -4.105891227722168, -3.8245649337768555, -3.543238639831543, -3.2619123458862305, -2.980586051940918, -2.6992597579956055, -2.417933702468872, -2.1366074085235596, -1.8552813529968262, -1.5739550590515137, -1.2926287651062012, -1.0113025903701782, -0.7299762964248657, -0.4486500024795532, -0.16732382774353027, 0.11400246620178223, 0.3953287601470947, 0.6766550540924072, 0.957981288433075, 1.2393075227737427, 1.5206338167190552, 1.8019601106643677, 2.0832862854003906, 2.364612579345703, 2.6459388732910156, 2.927265167236328, 3.2085914611816406, 3.489917755126953, 3.7712440490722656, 4.052570343017578, 4.333896636962891, 4.615222930908203, 4.896549224853516, 5.177875518798828, 5.459201812744141, 5.740528106689453, 6.021854400634766, 6.303180694580078, 6.584506988525391, 6.865833282470703, 7.147159099578857]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 5.0, 18.0, 23.0, 41.0, 73.0, 82.0, 215.0, 436.0, 1104.0, 3213.0, 12837.0, 72858.0, 512777.0, 380237.0, 50828.0, 9542.0, 2545.0, 933.0, 368.0, 158.0, 103.0, 70.0, 31.0, 16.0, 13.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.0769195556640625, -2.019073486328125, -1.9612274169921875, -1.90338134765625, -1.8455352783203125, -1.787689208984375, -1.7298431396484375, -1.6719970703125, -1.6141510009765625, -1.556304931640625, -1.4984588623046875, -1.44061279296875, -1.3827667236328125, -1.324920654296875, -1.2670745849609375, -1.209228515625, -1.1513824462890625, -1.093536376953125, -1.0356903076171875, -0.97784423828125, -0.9199981689453125, -0.862152099609375, -0.8043060302734375, -0.7464599609375, -0.6886138916015625, -0.630767822265625, -0.5729217529296875, -0.51507568359375, -0.4572296142578125, -0.399383544921875, -0.3415374755859375, -0.28369140625, -0.2258453369140625, -0.167999267578125, -0.1101531982421875, -0.05230712890625, 0.0055389404296875, 0.063385009765625, 0.1212310791015625, 0.1790771484375, 0.2369232177734375, 0.294769287109375, 0.3526153564453125, 0.41046142578125, 0.4683074951171875, 0.526153564453125, 0.5839996337890625, 0.641845703125, 0.6996917724609375, 0.757537841796875, 0.8153839111328125, 0.87322998046875, 0.9310760498046875, 0.988922119140625, 1.0467681884765625, 1.1046142578125, 1.1624603271484375, 1.220306396484375, 1.2781524658203125, 1.33599853515625, 1.3938446044921875, 1.451690673828125, 1.5095367431640625, 1.5673828125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 10.0, 3.0, 9.0, 16.0, 16.0, 20.0, 26.0, 25.0, 31.0, 25.0, 44.0, 38.0, 50.0, 41.0, 55.0, 50.0, 43.0, 45.0, 48.0, 57.0, 35.0, 41.0, 26.0, 31.0, 33.0, 21.0, 37.0, 26.0, 20.0, 11.0, 17.0, 8.0, 6.0, 15.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5165557861328125, -0.495025634765625, -0.4734954833984375, -0.45196533203125, -0.4304351806640625, -0.408905029296875, -0.3873748779296875, -0.3658447265625, -0.3443145751953125, -0.322784423828125, -0.3012542724609375, -0.27972412109375, -0.2581939697265625, -0.236663818359375, -0.2151336669921875, -0.193603515625, -0.1720733642578125, -0.150543212890625, -0.1290130615234375, -0.10748291015625, -0.0859527587890625, -0.064422607421875, -0.0428924560546875, -0.0213623046875, 0.0001678466796875, 0.021697998046875, 0.0432281494140625, 0.06475830078125, 0.0862884521484375, 0.107818603515625, 0.1293487548828125, 0.15087890625, 0.1724090576171875, 0.193939208984375, 0.2154693603515625, 0.23699951171875, 0.2585296630859375, 0.280059814453125, 0.3015899658203125, 0.3231201171875, 0.3446502685546875, 0.366180419921875, 0.3877105712890625, 0.40924072265625, 0.4307708740234375, 0.452301025390625, 0.4738311767578125, 0.495361328125, 0.5168914794921875, 0.538421630859375, 0.5599517822265625, 0.58148193359375, 0.6030120849609375, 0.624542236328125, 0.6460723876953125, 0.6676025390625, 0.6891326904296875, 0.710662841796875, 0.7321929931640625, 0.75372314453125, 0.7752532958984375, 0.796783447265625, 0.8183135986328125, 0.83984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 12.0, 14.0, 27.0, 34.0, 53.0, 114.0, 189.0, 419.0, 1182.0, 4838.0, 32359.0, 591457.0, 382970.0, 28495.0, 4434.0, 1106.0, 402.0, 188.0, 95.0, 50.0, 43.0, 24.0, 16.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7046356201171875, -1.627044677734375, -1.5494537353515625, -1.47186279296875, -1.3942718505859375, -1.316680908203125, -1.2390899658203125, -1.1614990234375, -1.0839080810546875, -1.006317138671875, -0.9287261962890625, -0.85113525390625, -0.7735443115234375, -0.695953369140625, -0.6183624267578125, -0.540771484375, -0.4631805419921875, -0.385589599609375, -0.3079986572265625, -0.23040771484375, -0.1528167724609375, -0.075225830078125, 0.0023651123046875, 0.0799560546875, 0.1575469970703125, 0.235137939453125, 0.3127288818359375, 0.39031982421875, 0.4679107666015625, 0.545501708984375, 0.6230926513671875, 0.70068359375, 0.7782745361328125, 0.855865478515625, 0.9334564208984375, 1.01104736328125, 1.0886383056640625, 1.166229248046875, 1.2438201904296875, 1.3214111328125, 1.3990020751953125, 1.476593017578125, 1.5541839599609375, 1.63177490234375, 1.7093658447265625, 1.786956787109375, 1.8645477294921875, 1.942138671875, 2.0197296142578125, 2.097320556640625, 2.1749114990234375, 2.25250244140625, 2.3300933837890625, 2.407684326171875, 2.4852752685546875, 2.5628662109375, 2.6404571533203125, 2.718048095703125, 2.7956390380859375, 2.87322998046875, 2.9508209228515625, 3.028411865234375, 3.1060028076171875, 3.18359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 12.0, 18.0, 18.0, 24.0, 40.0, 43.0, 45.0, 54.0, 50.0, 60.0, 68.0, 66.0, 57.0, 66.0, 73.0, 53.0, 43.0, 43.0, 29.0, 21.0, 16.0, 19.0, 13.0, 14.0, 12.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.905181884765625, -3.79473876953125, -3.684295654296875, -3.5738525390625, -3.463409423828125, -3.35296630859375, -3.242523193359375, -3.132080078125, -3.021636962890625, -2.91119384765625, -2.800750732421875, -2.6903076171875, -2.579864501953125, -2.46942138671875, -2.358978271484375, -2.24853515625, -2.138092041015625, -2.02764892578125, -1.917205810546875, -1.8067626953125, -1.696319580078125, -1.58587646484375, -1.475433349609375, -1.364990234375, -1.254547119140625, -1.14410400390625, -1.033660888671875, -0.9232177734375, -0.812774658203125, -0.70233154296875, -0.591888427734375, -0.4814453125, -0.371002197265625, -0.26055908203125, -0.150115966796875, -0.0396728515625, 0.070770263671875, 0.18121337890625, 0.291656494140625, 0.402099609375, 0.512542724609375, 0.62298583984375, 0.733428955078125, 0.8438720703125, 0.954315185546875, 1.06475830078125, 1.175201416015625, 1.28564453125, 1.396087646484375, 1.50653076171875, 1.616973876953125, 1.7274169921875, 1.837860107421875, 1.94830322265625, 2.058746337890625, 2.169189453125, 2.279632568359375, 2.39007568359375, 2.500518798828125, 2.6109619140625, 2.721405029296875, 2.83184814453125, 2.942291259765625, 3.052734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 16.0, 23.0, 45.0, 57.0, 102.0, 142.0, 257.0, 491.0, 1126.0, 2827.0, 8767.0, 33654.0, 172064.0, 671198.0, 121223.0, 25231.0, 6877.0, 2426.0, 988.0, 463.0, 220.0, 110.0, 81.0, 44.0, 23.0, 17.0, 15.0, 12.0, 8.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6310958862304688, -0.6103363037109375, -0.5895767211914062, -0.568817138671875, -0.5480575561523438, -0.5272979736328125, -0.5065383911132812, -0.48577880859375, -0.46501922607421875, -0.4442596435546875, -0.42350006103515625, -0.402740478515625, -0.38198089599609375, -0.3612213134765625, -0.34046173095703125, -0.3197021484375, -0.29894256591796875, -0.2781829833984375, -0.25742340087890625, -0.236663818359375, -0.21590423583984375, -0.1951446533203125, -0.17438507080078125, -0.15362548828125, -0.13286590576171875, -0.1121063232421875, -0.09134674072265625, -0.070587158203125, -0.04982757568359375, -0.0290679931640625, -0.00830841064453125, 0.012451171875, 0.03321075439453125, 0.0539703369140625, 0.07472991943359375, 0.095489501953125, 0.11624908447265625, 0.1370086669921875, 0.15776824951171875, 0.17852783203125, 0.19928741455078125, 0.2200469970703125, 0.24080657958984375, 0.261566162109375, 0.28232574462890625, 0.3030853271484375, 0.32384490966796875, 0.3446044921875, 0.36536407470703125, 0.3861236572265625, 0.40688323974609375, 0.427642822265625, 0.44840240478515625, 0.4691619873046875, 0.48992156982421875, 0.51068115234375, 0.5314407348632812, 0.5522003173828125, 0.5729598999023438, 0.593719482421875, 0.6144790649414062, 0.6352386474609375, 0.6559982299804688, 0.6767578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 11.0, 3.0, 8.0, 15.0, 18.0, 26.0, 23.0, 40.0, 49.0, 59.0, 71.0, 76.0, 74.0, 67.0, 86.0, 67.0, 59.0, 57.0, 29.0, 33.0, 24.0, 16.0, 20.0, 11.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001366138458251953, -0.0001324079930782318, -0.0001282021403312683, -0.0001239962875843048, -0.00011979043483734131, -0.00011558458209037781, -0.0001113787293434143, -0.0001071728765964508, -0.0001029670238494873, -9.87611711025238e-05, -9.45553183555603e-05, -9.03494656085968e-05, -8.61436128616333e-05, -8.19377601146698e-05, -7.77319073677063e-05, -7.35260546207428e-05, -6.93202018737793e-05, -6.51143491268158e-05, -6.0908496379852295e-05, -5.6702643632888794e-05, -5.249679088592529e-05, -4.829093813896179e-05, -4.408508539199829e-05, -3.987923264503479e-05, -3.567337989807129e-05, -3.146752715110779e-05, -2.7261674404144287e-05, -2.3055821657180786e-05, -1.8849968910217285e-05, -1.4644116163253784e-05, -1.0438263416290283e-05, -6.232410669326782e-06, -2.0265579223632812e-06, 2.1792948246002197e-06, 6.385147571563721e-06, 1.0591000318527222e-05, 1.4796853065490723e-05, 1.9002705812454224e-05, 2.3208558559417725e-05, 2.7414411306381226e-05, 3.1620264053344727e-05, 3.582611680030823e-05, 4.003196954727173e-05, 4.423782229423523e-05, 4.844367504119873e-05, 5.264952778816223e-05, 5.685538053512573e-05, 6.106123328208923e-05, 6.526708602905273e-05, 6.947293877601624e-05, 7.367879152297974e-05, 7.788464426994324e-05, 8.209049701690674e-05, 8.629634976387024e-05, 9.050220251083374e-05, 9.470805525779724e-05, 9.891390800476074e-05, 0.00010311976075172424, 0.00010732561349868774, 0.00011153146624565125, 0.00011573731899261475, 0.00011994317173957825, 0.00012414902448654175, 0.00012835487723350525, 0.00013256072998046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 13.0, 14.0, 22.0, 29.0, 48.0, 78.0, 211.0, 496.0, 1613.0, 7460.0, 69919.0, 850436.0, 105754.0, 9483.0, 1868.0, 586.0, 226.0, 120.0, 53.0, 41.0, 21.0, 10.0, 14.0, 10.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1662139892578125, -1.125396728515625, -1.0845794677734375, -1.04376220703125, -1.0029449462890625, -0.962127685546875, -0.9213104248046875, -0.8804931640625, -0.8396759033203125, -0.798858642578125, -0.7580413818359375, -0.71722412109375, -0.6764068603515625, -0.635589599609375, -0.5947723388671875, -0.553955078125, -0.5131378173828125, -0.472320556640625, -0.4315032958984375, -0.39068603515625, -0.3498687744140625, -0.309051513671875, -0.2682342529296875, -0.2274169921875, -0.1865997314453125, -0.145782470703125, -0.1049652099609375, -0.06414794921875, -0.0233306884765625, 0.017486572265625, 0.0583038330078125, 0.09912109375, 0.1399383544921875, 0.180755615234375, 0.2215728759765625, 0.26239013671875, 0.3032073974609375, 0.344024658203125, 0.3848419189453125, 0.4256591796875, 0.4664764404296875, 0.507293701171875, 0.5481109619140625, 0.58892822265625, 0.6297454833984375, 0.670562744140625, 0.7113800048828125, 0.752197265625, 0.7930145263671875, 0.833831787109375, 0.8746490478515625, 0.91546630859375, 0.9562835693359375, 0.997100830078125, 1.0379180908203125, 1.0787353515625, 1.1195526123046875, 1.160369873046875, 1.2011871337890625, 1.24200439453125, 1.2828216552734375, 1.323638916015625, 1.3644561767578125, 1.4052734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 11.0, 10.0, 13.0, 29.0, 23.0, 28.0, 38.0, 64.0, 42.0, 68.0, 79.0, 93.0, 84.0, 73.0, 70.0, 48.0, 39.0, 36.0, 26.0, 14.0, 17.0, 22.0, 12.0, 5.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.509765625, -0.49175262451171875, -0.4737396240234375, -0.45572662353515625, -0.437713623046875, -0.41970062255859375, -0.4016876220703125, -0.38367462158203125, -0.36566162109375, -0.34764862060546875, -0.3296356201171875, -0.31162261962890625, -0.293609619140625, -0.27559661865234375, -0.2575836181640625, -0.23957061767578125, -0.2215576171875, -0.20354461669921875, -0.1855316162109375, -0.16751861572265625, -0.149505615234375, -0.13149261474609375, -0.1134796142578125, -0.09546661376953125, -0.07745361328125, -0.05944061279296875, -0.0414276123046875, -0.02341461181640625, -0.005401611328125, 0.01261138916015625, 0.0306243896484375, 0.04863739013671875, 0.066650390625, 0.08466339111328125, 0.1026763916015625, 0.12068939208984375, 0.138702392578125, 0.15671539306640625, 0.1747283935546875, 0.19274139404296875, 0.21075439453125, 0.22876739501953125, 0.2467803955078125, 0.26479339599609375, 0.282806396484375, 0.30081939697265625, 0.3188323974609375, 0.33684539794921875, 0.3548583984375, 0.37287139892578125, 0.3908843994140625, 0.40889739990234375, 0.426910400390625, 0.44492340087890625, 0.4629364013671875, 0.48094940185546875, 0.49896240234375, 0.5169754028320312, 0.5349884033203125, 0.5530014038085938, 0.571014404296875, 0.5890274047851562, 0.6070404052734375, 0.6250534057617188, 0.64306640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 22.0, 72.0, 164.0, 373.0, 216.0, 83.0, 23.0, 14.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.668895721435547, -24.96940040588379, -24.26990509033203, -23.570409774780273, -22.870914459228516, -22.171419143676758, -21.471923828125, -20.772428512573242, -20.072933197021484, -19.373437881469727, -18.67394256591797, -17.97444725036621, -17.274951934814453, -16.575456619262695, -15.875961303710938, -15.17646598815918, -14.476970672607422, -13.777475357055664, -13.077980041503906, -12.378484725952148, -11.67898941040039, -10.979494094848633, -10.279998779296875, -9.580503463745117, -8.88100814819336, -8.181512832641602, -7.482017517089844, -6.782522201538086, -6.083026885986328, -5.38353157043457, -4.6840362548828125, -3.9845409393310547, -3.2850475311279297, -2.585552215576172, -1.886056900024414, -1.1865615844726562, -0.48706626892089844, 0.21242904663085938, 0.9119243621826172, 1.611419677734375, 2.310914993286133, 3.0104103088378906, 3.7099056243896484, 4.409400939941406, 5.108896255493164, 5.808391571044922, 6.50788688659668, 7.2073822021484375, 7.906877517700195, 8.606372833251953, 9.305868148803711, 10.005363464355469, 10.704858779907227, 11.404354095458984, 12.103849411010742, 12.8033447265625, 13.502840042114258, 14.202335357666016, 14.901830673217773, 15.601325988769531, 16.30082130432129, 17.000316619873047, 17.699811935424805, 18.399307250976562, 19.09880256652832]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 8.0, 9.0, 8.0, 20.0, 20.0, 27.0, 29.0, 26.0, 26.0, 25.0, 23.0, 35.0, 52.0, 58.0, 71.0, 70.0, 82.0, 57.0, 46.0, 38.0, 29.0, 34.0, 29.0, 34.0, 30.0, 16.0, 13.0, 14.0, 14.0, 12.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.193066596984863, -10.83924388885498, -10.485422134399414, -10.131599426269531, -9.777776718139648, -9.423954963684082, -9.0701322555542, -8.716310501098633, -8.36248779296875, -8.008665084838867, -7.654842853546143, -7.301020622253418, -6.947198390960693, -6.593376159667969, -6.239553451538086, -5.885731220245361, -5.5319085121154785, -5.178086280822754, -4.824263572692871, -4.4704413414001465, -4.116619110107422, -3.762796640396118, -3.4089741706848145, -3.05515193939209, -2.701329469680786, -2.3475069999694824, -1.9936847686767578, -1.639862298965454, -1.28603994846344, -0.9322175979614258, -0.5783951282501221, -0.22457289695739746, 0.12924957275390625, 0.4830719530582428, 0.8368943333625793, 1.1907167434692383, 1.5445390939712524, 1.8983614444732666, 2.2521839141845703, 2.606006145477295, 2.9598286151885986, 3.3136510848999023, 3.667473316192627, 4.021295547485352, 4.375118255615234, 4.728940486907959, 5.082762718200684, 5.436585426330566, 5.790407657623291, 6.144229888916016, 6.498052597045898, 6.851874828338623, 7.205697059631348, 7.5595197677612305, 7.913341999053955, 8.26716423034668, 8.620986938476562, 8.974809646606445, 9.328631401062012, 9.682454109191895, 10.036276817321777, 10.390098571777344, 10.743921279907227, 11.09774398803711, 11.451565742492676]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 9.0, 14.0, 15.0, 17.0, 36.0, 55.0, 82.0, 177.0, 284.0, 489.0, 851.0, 1550.0, 3777.0, 12221.0, 242826.0, 3790682.0, 124452.0, 9916.0, 3361.0, 1465.0, 839.0, 428.0, 281.0, 154.0, 102.0, 59.0, 43.0, 23.0, 27.0, 13.0, 10.0, 5.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.636322021484375, -2.55975341796875, -2.483184814453125, -2.4066162109375, -2.330047607421875, -2.25347900390625, -2.176910400390625, -2.100341796875, -2.023773193359375, -1.94720458984375, -1.870635986328125, -1.7940673828125, -1.717498779296875, -1.64093017578125, -1.564361572265625, -1.48779296875, -1.411224365234375, -1.33465576171875, -1.258087158203125, -1.1815185546875, -1.104949951171875, -1.02838134765625, -0.951812744140625, -0.875244140625, -0.798675537109375, -0.72210693359375, -0.645538330078125, -0.5689697265625, -0.492401123046875, -0.41583251953125, -0.339263916015625, -0.2626953125, -0.186126708984375, -0.10955810546875, -0.032989501953125, 0.0435791015625, 0.120147705078125, 0.19671630859375, 0.273284912109375, 0.349853515625, 0.426422119140625, 0.50299072265625, 0.579559326171875, 0.6561279296875, 0.732696533203125, 0.80926513671875, 0.885833740234375, 0.96240234375, 1.038970947265625, 1.11553955078125, 1.192108154296875, 1.2686767578125, 1.345245361328125, 1.42181396484375, 1.498382568359375, 1.574951171875, 1.651519775390625, 1.72808837890625, 1.804656982421875, 1.8812255859375, 1.957794189453125, 2.03436279296875, 2.110931396484375, 2.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 13.0, 20.0, 9.0, 15.0, 18.0, 27.0, 26.0, 39.0, 32.0, 27.0, 43.0, 34.0, 37.0, 60.0, 58.0, 47.0, 38.0, 39.0, 48.0, 43.0, 36.0, 44.0, 35.0, 26.0, 33.0, 20.0, 22.0, 14.0, 10.0, 16.0, 10.0, 11.0, 5.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.72705078125, -0.7073287963867188, -0.6876068115234375, -0.6678848266601562, -0.648162841796875, -0.6284408569335938, -0.6087188720703125, -0.5889968872070312, -0.56927490234375, -0.5495529174804688, -0.5298309326171875, -0.5101089477539062, -0.490386962890625, -0.47066497802734375, -0.4509429931640625, -0.43122100830078125, -0.4114990234375, -0.39177703857421875, -0.3720550537109375, -0.35233306884765625, -0.332611083984375, -0.31288909912109375, -0.2931671142578125, -0.27344512939453125, -0.25372314453125, -0.23400115966796875, -0.2142791748046875, -0.19455718994140625, -0.174835205078125, -0.15511322021484375, -0.1353912353515625, -0.11566925048828125, -0.095947265625, -0.07622528076171875, -0.0565032958984375, -0.03678131103515625, -0.017059326171875, 0.00266265869140625, 0.0223846435546875, 0.04210662841796875, 0.06182861328125, 0.08155059814453125, 0.1012725830078125, 0.12099456787109375, 0.140716552734375, 0.16043853759765625, 0.1801605224609375, 0.19988250732421875, 0.2196044921875, 0.23932647705078125, 0.2590484619140625, 0.27877044677734375, 0.298492431640625, 0.31821441650390625, 0.3379364013671875, 0.35765838623046875, 0.37738037109375, 0.39710235595703125, 0.4168243408203125, 0.43654632568359375, 0.456268310546875, 0.47599029541015625, 0.4957122802734375, 0.5154342651367188, 0.53515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 17.0, 18.0, 35.0, 47.0, 69.0, 130.0, 228.0, 391.0, 755.0, 1471.0, 3225.0, 8243.0, 31406.0, 796423.0, 3267203.0, 63836.0, 12224.0, 4492.0, 1960.0, 933.0, 494.0, 290.0, 135.0, 96.0, 45.0, 30.0, 19.0, 14.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.5693359375, -2.494140625, -2.4189453125, -2.34375, -2.2685546875, -2.193359375, -2.1181640625, -2.04296875, -1.9677734375, -1.892578125, -1.8173828125, -1.7421875, -1.6669921875, -1.591796875, -1.5166015625, -1.44140625, -1.3662109375, -1.291015625, -1.2158203125, -1.140625, -1.0654296875, -0.990234375, -0.9150390625, -0.83984375, -0.7646484375, -0.689453125, -0.6142578125, -0.5390625, -0.4638671875, -0.388671875, -0.3134765625, -0.23828125, -0.1630859375, -0.087890625, -0.0126953125, 0.0625, 0.1376953125, 0.212890625, 0.2880859375, 0.36328125, 0.4384765625, 0.513671875, 0.5888671875, 0.6640625, 0.7392578125, 0.814453125, 0.8896484375, 0.96484375, 1.0400390625, 1.115234375, 1.1904296875, 1.265625, 1.3408203125, 1.416015625, 1.4912109375, 1.56640625, 1.6416015625, 1.716796875, 1.7919921875, 1.8671875, 1.9423828125, 2.017578125, 2.0927734375, 2.16796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 24.0, 35.0, 62.0, 119.0, 318.0, 656.0, 1164.0, 878.0, 395.0, 169.0, 77.0, 49.0, 28.0, 18.0, 9.0, 11.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.627197265625, -2.54931640625, -2.471435546875, -2.3935546875, -2.315673828125, -2.23779296875, -2.159912109375, -2.08203125, -2.004150390625, -1.92626953125, -1.848388671875, -1.7705078125, -1.692626953125, -1.61474609375, -1.536865234375, -1.458984375, -1.381103515625, -1.30322265625, -1.225341796875, -1.1474609375, -1.069580078125, -0.99169921875, -0.913818359375, -0.8359375, -0.758056640625, -0.68017578125, -0.602294921875, -0.5244140625, -0.446533203125, -0.36865234375, -0.290771484375, -0.212890625, -0.135009765625, -0.05712890625, 0.020751953125, 0.0986328125, 0.176513671875, 0.25439453125, 0.332275390625, 0.41015625, 0.488037109375, 0.56591796875, 0.643798828125, 0.7216796875, 0.799560546875, 0.87744140625, 0.955322265625, 1.033203125, 1.111083984375, 1.18896484375, 1.266845703125, 1.3447265625, 1.422607421875, 1.50048828125, 1.578369140625, 1.65625, 1.734130859375, 1.81201171875, 1.889892578125, 1.9677734375, 2.045654296875, 2.12353515625, 2.201416015625, 2.279296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 6.0, 13.0, 32.0, 82.0, 166.0, 246.0, 223.0, 114.0, 64.0, 34.0, 10.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.494823455810547, -29.815614700317383, -29.136404037475586, -28.457195281982422, -27.777984619140625, -27.09877586364746, -26.419567108154297, -25.7403564453125, -25.061147689819336, -24.381938934326172, -23.702728271484375, -23.02351951599121, -22.344310760498047, -21.66510009765625, -20.985891342163086, -20.306682586669922, -19.627471923828125, -18.94826316833496, -18.269052505493164, -17.58984375, -16.910633087158203, -16.23142433166504, -15.552215576171875, -14.873005867004395, -14.193796157836914, -13.514586448669434, -12.835376739501953, -12.156167984008789, -11.476958274841309, -10.797748565673828, -10.118539810180664, -9.439330101013184, -8.760120391845703, -8.080910682678223, -7.4017014503479, -6.722492218017578, -6.043282508850098, -5.364072799682617, -4.684863567352295, -4.005654335021973, -3.326444625854492, -2.647235155105591, -1.9680256843566895, -1.288816213607788, -0.6096067428588867, 0.06960272789001465, 0.748812198638916, 1.4280214309692383, 2.1072311401367188, 2.78644061088562, 3.4656500816345215, 4.144859313964844, 4.824069023132324, 5.503278732299805, 6.182487964630127, 6.861697196960449, 7.54090690612793, 8.22011661529541, 8.89932632446289, 9.578535079956055, 10.257744789123535, 10.936954498291016, 11.61616325378418, 12.29537296295166, 12.97458267211914]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 11.0, 18.0, 13.0, 13.0, 12.0, 21.0, 16.0, 28.0, 25.0, 28.0, 27.0, 30.0, 35.0, 32.0, 42.0, 44.0, 42.0, 36.0, 40.0, 44.0, 45.0, 38.0, 40.0, 38.0, 39.0, 36.0, 19.0, 19.0, 20.0, 17.0, 9.0, 18.0, 13.0, 11.0, 8.0, 13.0, 8.0, 7.0, 6.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.378134250640869, -6.17901086807251, -5.979887008666992, -5.780763626098633, -5.581640243530273, -5.382516860961914, -5.183393478393555, -4.984269618988037, -4.785146236419678, -4.586022853851318, -4.386898994445801, -4.187775611877441, -3.988652229309082, -3.7895288467407227, -3.590405225753784, -3.3912816047668457, -3.1921582221984863, -2.993034839630127, -2.7939112186431885, -2.59478759765625, -2.3956642150878906, -2.1965408325195312, -1.9974172115325928, -1.7982937097549438, -1.599170207977295, -1.400046706199646, -1.200923204421997, -1.0017997026443481, -0.8026762008666992, -0.6035526990890503, -0.40442919731140137, -0.20530569553375244, -0.0061817169189453125, 0.1929417848587036, 0.39206528663635254, 0.5911887884140015, 0.7903122901916504, 0.9894357919692993, 1.1885592937469482, 1.3876827955245972, 1.586806297302246, 1.785929799079895, 1.985053300857544, 2.1841769218444824, 2.383300304412842, 2.582423686981201, 2.7815473079681396, 2.980670928955078, 3.1797943115234375, 3.378917694091797, 3.5780413150787354, 3.777164936065674, 3.976288318634033, 4.175411701202393, 4.37453556060791, 4.5736589431762695, 4.772782325744629, 4.971905708312988, 5.171029090881348, 5.370152950286865, 5.569276332855225, 5.768399715423584, 5.967523574829102, 6.166646957397461, 6.36577033996582]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 13.0, 8.0, 12.0, 16.0, 29.0, 42.0, 61.0, 78.0, 132.0, 227.0, 382.0, 706.0, 1662.0, 4289.0, 17114.0, 170561.0, 765037.0, 72095.0, 10255.0, 3060.0, 1319.0, 595.0, 285.0, 205.0, 122.0, 89.0, 57.0, 31.0, 29.0, 16.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.478851318359375, -2.39715576171875, -2.315460205078125, -2.2337646484375, -2.152069091796875, -2.07037353515625, -1.988677978515625, -1.906982421875, -1.825286865234375, -1.74359130859375, -1.661895751953125, -1.5802001953125, -1.498504638671875, -1.41680908203125, -1.335113525390625, -1.25341796875, -1.171722412109375, -1.09002685546875, -1.008331298828125, -0.9266357421875, -0.844940185546875, -0.76324462890625, -0.681549072265625, -0.599853515625, -0.518157958984375, -0.43646240234375, -0.354766845703125, -0.2730712890625, -0.191375732421875, -0.10968017578125, -0.027984619140625, 0.0537109375, 0.135406494140625, 0.21710205078125, 0.298797607421875, 0.3804931640625, 0.462188720703125, 0.54388427734375, 0.625579833984375, 0.707275390625, 0.788970947265625, 0.87066650390625, 0.952362060546875, 1.0340576171875, 1.115753173828125, 1.19744873046875, 1.279144287109375, 1.36083984375, 1.442535400390625, 1.52423095703125, 1.605926513671875, 1.6876220703125, 1.769317626953125, 1.85101318359375, 1.932708740234375, 2.014404296875, 2.096099853515625, 2.17779541015625, 2.259490966796875, 2.3411865234375, 2.422882080078125, 2.50457763671875, 2.586273193359375, 2.66796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 6.0, 13.0, 14.0, 12.0, 18.0, 21.0, 20.0, 24.0, 19.0, 29.0, 45.0, 42.0, 48.0, 44.0, 41.0, 49.0, 61.0, 51.0, 45.0, 44.0, 44.0, 43.0, 33.0, 35.0, 29.0, 33.0, 24.0, 17.0, 14.0, 18.0, 14.0, 7.0, 7.0, 14.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68212890625, -0.659210205078125, -0.63629150390625, -0.613372802734375, -0.5904541015625, -0.567535400390625, -0.54461669921875, -0.521697998046875, -0.498779296875, -0.475860595703125, -0.45294189453125, -0.430023193359375, -0.4071044921875, -0.384185791015625, -0.36126708984375, -0.338348388671875, -0.3154296875, -0.292510986328125, -0.26959228515625, -0.246673583984375, -0.2237548828125, -0.200836181640625, -0.17791748046875, -0.154998779296875, -0.132080078125, -0.109161376953125, -0.08624267578125, -0.063323974609375, -0.0404052734375, -0.017486572265625, 0.00543212890625, 0.028350830078125, 0.05126953125, 0.074188232421875, 0.09710693359375, 0.120025634765625, 0.1429443359375, 0.165863037109375, 0.18878173828125, 0.211700439453125, 0.234619140625, 0.257537841796875, 0.28045654296875, 0.303375244140625, 0.3262939453125, 0.349212646484375, 0.37213134765625, 0.395050048828125, 0.41796875, 0.440887451171875, 0.46380615234375, 0.486724853515625, 0.5096435546875, 0.532562255859375, 0.55548095703125, 0.578399658203125, 0.601318359375, 0.624237060546875, 0.64715576171875, 0.670074462890625, 0.6929931640625, 0.715911865234375, 0.73883056640625, 0.761749267578125, 0.78466796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 18.0, 13.0, 43.0, 68.0, 74.0, 107.0, 171.0, 289.0, 521.0, 789.0, 1635.0, 3713.0, 13115.0, 113745.0, 835936.0, 62441.0, 9597.0, 2985.0, 1343.0, 707.0, 398.0, 259.0, 165.0, 120.0, 92.0, 41.0, 36.0, 26.0, 15.0, 17.0, 13.0, 5.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.50390625, -2.42413330078125, -2.3443603515625, -2.26458740234375, -2.184814453125, -2.10504150390625, -2.0252685546875, -1.94549560546875, -1.86572265625, -1.78594970703125, -1.7061767578125, -1.62640380859375, -1.546630859375, -1.46685791015625, -1.3870849609375, -1.30731201171875, -1.2275390625, -1.14776611328125, -1.0679931640625, -0.98822021484375, -0.908447265625, -0.82867431640625, -0.7489013671875, -0.66912841796875, -0.58935546875, -0.50958251953125, -0.4298095703125, -0.35003662109375, -0.270263671875, -0.19049072265625, -0.1107177734375, -0.03094482421875, 0.048828125, 0.12860107421875, 0.2083740234375, 0.28814697265625, 0.367919921875, 0.44769287109375, 0.5274658203125, 0.60723876953125, 0.68701171875, 0.76678466796875, 0.8465576171875, 0.92633056640625, 1.006103515625, 1.08587646484375, 1.1656494140625, 1.24542236328125, 1.3251953125, 1.40496826171875, 1.4847412109375, 1.56451416015625, 1.644287109375, 1.72406005859375, 1.8038330078125, 1.88360595703125, 1.96337890625, 2.04315185546875, 2.1229248046875, 2.20269775390625, 2.282470703125, 2.36224365234375, 2.4420166015625, 2.52178955078125, 2.6015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 5.0, 9.0, 8.0, 10.0, 20.0, 14.0, 18.0, 32.0, 26.0, 27.0, 41.0, 57.0, 49.0, 63.0, 59.0, 61.0, 45.0, 58.0, 54.0, 40.0, 47.0, 45.0, 25.0, 25.0, 25.0, 38.0, 22.0, 15.0, 7.0, 6.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.84039306640625, -2.7452392578125, -2.65008544921875, -2.554931640625, -2.45977783203125, -2.3646240234375, -2.26947021484375, -2.17431640625, -2.07916259765625, -1.9840087890625, -1.88885498046875, -1.793701171875, -1.69854736328125, -1.6033935546875, -1.50823974609375, -1.4130859375, -1.31793212890625, -1.2227783203125, -1.12762451171875, -1.032470703125, -0.93731689453125, -0.8421630859375, -0.74700927734375, -0.65185546875, -0.55670166015625, -0.4615478515625, -0.36639404296875, -0.271240234375, -0.17608642578125, -0.0809326171875, 0.01422119140625, 0.109375, 0.20452880859375, 0.2996826171875, 0.39483642578125, 0.489990234375, 0.58514404296875, 0.6802978515625, 0.77545166015625, 0.87060546875, 0.96575927734375, 1.0609130859375, 1.15606689453125, 1.251220703125, 1.34637451171875, 1.4415283203125, 1.53668212890625, 1.6318359375, 1.72698974609375, 1.8221435546875, 1.91729736328125, 2.012451171875, 2.10760498046875, 2.2027587890625, 2.29791259765625, 2.39306640625, 2.48822021484375, 2.5833740234375, 2.67852783203125, 2.773681640625, 2.86883544921875, 2.9639892578125, 3.05914306640625, 3.154296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 10.0, 8.0, 19.0, 22.0, 35.0, 39.0, 60.0, 82.0, 100.0, 174.0, 237.0, 415.0, 690.0, 1417.0, 2974.0, 7033.0, 19073.0, 64977.0, 550092.0, 311346.0, 59398.0, 17886.0, 6606.0, 2708.0, 1252.0, 698.0, 432.0, 214.0, 167.0, 114.0, 65.0, 57.0, 32.0, 25.0, 22.0, 19.0, 7.0, 12.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.42761993408203125, -0.4128570556640625, -0.39809417724609375, -0.383331298828125, -0.36856842041015625, -0.3538055419921875, -0.33904266357421875, -0.32427978515625, -0.30951690673828125, -0.2947540283203125, -0.27999114990234375, -0.265228271484375, -0.25046539306640625, -0.2357025146484375, -0.22093963623046875, -0.2061767578125, -0.19141387939453125, -0.1766510009765625, -0.16188812255859375, -0.147125244140625, -0.13236236572265625, -0.1175994873046875, -0.10283660888671875, -0.08807373046875, -0.07331085205078125, -0.0585479736328125, -0.04378509521484375, -0.029022216796875, -0.01425933837890625, 0.0005035400390625, 0.01526641845703125, 0.030029296875, 0.04479217529296875, 0.0595550537109375, 0.07431793212890625, 0.089080810546875, 0.10384368896484375, 0.1186065673828125, 0.13336944580078125, 0.14813232421875, 0.16289520263671875, 0.1776580810546875, 0.19242095947265625, 0.207183837890625, 0.22194671630859375, 0.2367095947265625, 0.25147247314453125, 0.2662353515625, 0.28099822998046875, 0.2957611083984375, 0.31052398681640625, 0.325286865234375, 0.34004974365234375, 0.3548126220703125, 0.36957550048828125, 0.38433837890625, 0.39910125732421875, 0.4138641357421875, 0.42862701416015625, 0.443389892578125, 0.45815277099609375, 0.4729156494140625, 0.48767852783203125, 0.50244140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 14.0, 9.0, 20.0, 17.0, 38.0, 75.0, 100.0, 142.0, 148.0, 144.0, 83.0, 46.0, 41.0, 19.0, 20.0, 11.0, 17.0, 11.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016379356384277344, -0.00015759654343128204, -0.00015139952301979065, -0.00014520250260829926, -0.00013900548219680786, -0.00013280846178531647, -0.00012661144137382507, -0.00012041442096233368, -0.00011421740055084229, -0.00010802038013935089, -0.0001018233597278595, -9.56263393163681e-05, -8.942931890487671e-05, -8.323229849338531e-05, -7.703527808189392e-05, -7.083825767040253e-05, -6.464123725891113e-05, -5.844421684741974e-05, -5.2247196435928345e-05, -4.605017602443695e-05, -3.985315561294556e-05, -3.365613520145416e-05, -2.745911478996277e-05, -2.1262094378471375e-05, -1.506507396697998e-05, -8.868053555488586e-06, -2.6710331439971924e-06, 3.5259872674942017e-06, 9.723007678985596e-06, 1.592002809047699e-05, 2.2117048501968384e-05, 2.8314068913459778e-05, 3.451108932495117e-05, 4.0708109736442566e-05, 4.690513014793396e-05, 5.3102150559425354e-05, 5.929917097091675e-05, 6.549619138240814e-05, 7.169321179389954e-05, 7.789023220539093e-05, 8.408725261688232e-05, 9.028427302837372e-05, 9.648129343986511e-05, 0.0001026783138513565, 0.0001088753342628479, 0.0001150723546743393, 0.00012126937508583069, 0.00012746639549732208, 0.00013366341590881348, 0.00013986043632030487, 0.00014605745673179626, 0.00015225447714328766, 0.00015845149755477905, 0.00016464851796627045, 0.00017084553837776184, 0.00017704255878925323, 0.00018323957920074463, 0.00018943659961223602, 0.00019563362002372742, 0.0002018306404352188, 0.0002080276608467102, 0.0002142246812582016, 0.000220421701669693, 0.0002266187220811844, 0.00023281574249267578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 0.0, 6.0, 5.0, 7.0, 7.0, 17.0, 15.0, 36.0, 36.0, 50.0, 82.0, 122.0, 230.0, 327.0, 617.0, 1033.0, 2012.0, 4200.0, 10196.0, 28896.0, 111126.0, 674744.0, 154911.0, 37288.0, 12553.0, 4951.0, 2270.0, 1103.0, 655.0, 376.0, 242.0, 130.0, 100.0, 75.0, 40.0, 31.0, 16.0, 16.0, 7.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.5908203125, -0.5751075744628906, -0.5593948364257812, -0.5436820983886719, -0.5279693603515625, -0.5122566223144531, -0.49654388427734375, -0.4808311462402344, -0.465118408203125, -0.4494056701660156, -0.43369293212890625, -0.4179801940917969, -0.4022674560546875, -0.3865547180175781, -0.37084197998046875, -0.3551292419433594, -0.33941650390625, -0.3237037658691406, -0.30799102783203125, -0.2922782897949219, -0.2765655517578125, -0.2608528137207031, -0.24514007568359375, -0.22942733764648438, -0.213714599609375, -0.19800186157226562, -0.18228912353515625, -0.16657638549804688, -0.1508636474609375, -0.13515090942382812, -0.11943817138671875, -0.10372543334960938, -0.0880126953125, -0.07229995727539062, -0.05658721923828125, -0.040874481201171875, -0.0251617431640625, -0.009449005126953125, 0.00626373291015625, 0.021976470947265625, 0.037689208984375, 0.053401947021484375, 0.06911468505859375, 0.08482742309570312, 0.1005401611328125, 0.11625289916992188, 0.13196563720703125, 0.14767837524414062, 0.16339111328125, 0.17910385131835938, 0.19481658935546875, 0.21052932739257812, 0.2262420654296875, 0.24195480346679688, 0.25766754150390625, 0.2733802795410156, 0.289093017578125, 0.3048057556152344, 0.32051849365234375, 0.3362312316894531, 0.3519439697265625, 0.3676567077636719, 0.38336944580078125, 0.3990821838378906, 0.414794921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 17.0, 12.0, 14.0, 33.0, 42.0, 39.0, 77.0, 90.0, 104.0, 114.0, 117.0, 75.0, 48.0, 40.0, 30.0, 28.0, 27.0, 19.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6403274536132812, -0.6204986572265625, -0.6006698608398438, -0.580841064453125, -0.5610122680664062, -0.5411834716796875, -0.5213546752929688, -0.50152587890625, -0.48169708251953125, -0.4618682861328125, -0.44203948974609375, -0.422210693359375, -0.40238189697265625, -0.3825531005859375, -0.36272430419921875, -0.3428955078125, -0.32306671142578125, -0.3032379150390625, -0.28340911865234375, -0.263580322265625, -0.24375152587890625, -0.2239227294921875, -0.20409393310546875, -0.18426513671875, -0.16443634033203125, -0.1446075439453125, -0.12477874755859375, -0.104949951171875, -0.08512115478515625, -0.0652923583984375, -0.04546356201171875, -0.025634765625, -0.00580596923828125, 0.0140228271484375, 0.03385162353515625, 0.053680419921875, 0.07350921630859375, 0.0933380126953125, 0.11316680908203125, 0.13299560546875, 0.15282440185546875, 0.1726531982421875, 0.19248199462890625, 0.212310791015625, 0.23213958740234375, 0.2519683837890625, 0.27179718017578125, 0.2916259765625, 0.31145477294921875, 0.3312835693359375, 0.35111236572265625, 0.370941162109375, 0.39076995849609375, 0.4105987548828125, 0.43042755126953125, 0.45025634765625, 0.47008514404296875, 0.4899139404296875, 0.5097427368164062, 0.529571533203125, 0.5494003295898438, 0.5692291259765625, 0.5890579223632812, 0.60888671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 13.0, 17.0, 21.0, 50.0, 62.0, 107.0, 249.0, 197.0, 102.0, 61.0, 41.0, 28.0, 16.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.762823104858398, -12.3496675491333, -11.936511039733887, -11.523355484008789, -11.110198974609375, -10.697043418884277, -10.28388786315918, -9.870731353759766, -9.457575798034668, -9.04442024230957, -8.631263732910156, -8.218108177185059, -7.804952144622803, -7.391796112060547, -6.978640556335449, -6.565484523773193, -6.1523284912109375, -5.739172458648682, -5.326016426086426, -4.912860870361328, -4.499704837799072, -4.086548805236816, -3.6733930110931396, -3.260237216949463, -2.847081184387207, -2.433925151824951, -2.0207693576812744, -1.607613444328308, -1.1944575309753418, -0.7813014984130859, -0.3681457042694092, 0.04501008987426758, 0.45816612243652344, 0.8713220357894897, 1.284477949142456, 1.6976338624954224, 2.1107897758483887, 2.5239458084106445, 2.9371016025543213, 3.350257396697998, 3.763413429260254, 4.17656946182251, 4.589725494384766, 5.002881050109863, 5.416037082672119, 5.829193115234375, 6.242348670959473, 6.6555047035217285, 7.068660736083984, 7.48181676864624, 7.894972801208496, 8.308128356933594, 8.721284866333008, 9.134440422058105, 9.547595977783203, 9.960752487182617, 10.373908042907715, 10.787063598632812, 11.200220108032227, 11.613375663757324, 12.026531219482422, 12.439687728881836, 12.852843284606934, 13.265998840332031, 13.679155349731445]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 8.0, 7.0, 6.0, 2.0, 4.0, 9.0, 19.0, 9.0, 19.0, 16.0, 16.0, 24.0, 19.0, 28.0, 22.0, 28.0, 40.0, 37.0, 68.0, 108.0, 100.0, 75.0, 52.0, 41.0, 23.0, 26.0, 20.0, 20.0, 20.0, 25.0, 25.0, 10.0, 18.0, 16.0, 9.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-11.756427764892578, -11.410192489624023, -11.063956260681152, -10.717720985412598, -10.371485710144043, -10.025249481201172, -9.679014205932617, -9.332778930664062, -8.986543655395508, -8.640308380126953, -8.294072151184082, -7.947836875915527, -7.601601600646973, -7.25536584854126, -6.909130096435547, -6.562894821166992, -6.216658592224121, -5.870422840118408, -5.5241875648498535, -5.177951812744141, -4.831716537475586, -4.485480785369873, -4.13924503326416, -3.7930095195770264, -3.4467740058898926, -3.100538492202759, -2.754302978515625, -2.408067226409912, -2.0618317127227783, -1.7155961990356445, -1.3693604469299316, -1.0231249332427979, -0.6768903732299805, -0.3306547999382019, 0.01558077335357666, 0.36181640625, 0.7080519199371338, 1.0542874336242676, 1.4005231857299805, 1.7467586994171143, 2.092994213104248, 2.439229726791382, 2.7854652404785156, 3.1317009925842285, 3.4779365062713623, 3.824172019958496, 4.170407772064209, 4.516643524169922, 4.862878799438477, 5.2091145515441895, 5.555349826812744, 5.901585578918457, 6.247820854187012, 6.594056606292725, 6.9402923583984375, 7.286527633666992, 7.632763385772705, 7.978999137878418, 8.325234413146973, 8.671470642089844, 9.017705917358398, 9.363941192626953, 9.710176467895508, 10.056412696838379, 10.402647972106934]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 13.0, 18.0, 29.0, 43.0, 75.0, 120.0, 164.0, 258.0, 427.0, 700.0, 1108.0, 1932.0, 3800.0, 13265.0, 199949.0, 3420944.0, 518818.0, 21632.0, 5107.0, 2389.0, 1346.0, 777.0, 479.0, 269.0, 190.0, 127.0, 99.0, 61.0, 29.0, 32.0, 15.0, 18.0, 8.0, 6.0, 6.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.73065185546875, -1.6722412109375, -1.61383056640625, -1.555419921875, -1.49700927734375, -1.4385986328125, -1.38018798828125, -1.32177734375, -1.26336669921875, -1.2049560546875, -1.14654541015625, -1.088134765625, -1.02972412109375, -0.9713134765625, -0.91290283203125, -0.8544921875, -0.79608154296875, -0.7376708984375, -0.67926025390625, -0.620849609375, -0.56243896484375, -0.5040283203125, -0.44561767578125, -0.38720703125, -0.32879638671875, -0.2703857421875, -0.21197509765625, -0.153564453125, -0.09515380859375, -0.0367431640625, 0.02166748046875, 0.080078125, 0.13848876953125, 0.1968994140625, 0.25531005859375, 0.313720703125, 0.37213134765625, 0.4305419921875, 0.48895263671875, 0.54736328125, 0.60577392578125, 0.6641845703125, 0.72259521484375, 0.781005859375, 0.83941650390625, 0.8978271484375, 0.95623779296875, 1.0146484375, 1.07305908203125, 1.1314697265625, 1.18988037109375, 1.248291015625, 1.30670166015625, 1.3651123046875, 1.42352294921875, 1.48193359375, 1.54034423828125, 1.5987548828125, 1.65716552734375, 1.715576171875, 1.77398681640625, 1.8323974609375, 1.89080810546875, 1.94921875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 13.0, 11.0, 12.0, 21.0, 23.0, 21.0, 30.0, 32.0, 34.0, 27.0, 41.0, 35.0, 27.0, 39.0, 41.0, 43.0, 42.0, 47.0, 52.0, 51.0, 36.0, 50.0, 31.0, 22.0, 31.0, 23.0, 21.0, 21.0, 14.0, 20.0, 12.0, 12.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6253509521484375, -0.605194091796875, -0.5850372314453125, -0.56488037109375, -0.5447235107421875, -0.524566650390625, -0.5044097900390625, -0.4842529296875, -0.4640960693359375, -0.443939208984375, -0.4237823486328125, -0.40362548828125, -0.3834686279296875, -0.363311767578125, -0.3431549072265625, -0.322998046875, -0.3028411865234375, -0.282684326171875, -0.2625274658203125, -0.24237060546875, -0.2222137451171875, -0.202056884765625, -0.1819000244140625, -0.1617431640625, -0.1415863037109375, -0.121429443359375, -0.1012725830078125, -0.08111572265625, -0.0609588623046875, -0.040802001953125, -0.0206451416015625, -0.00048828125, 0.0196685791015625, 0.039825439453125, 0.0599822998046875, 0.08013916015625, 0.1002960205078125, 0.120452880859375, 0.1406097412109375, 0.1607666015625, 0.1809234619140625, 0.201080322265625, 0.2212371826171875, 0.24139404296875, 0.2615509033203125, 0.281707763671875, 0.3018646240234375, 0.322021484375, 0.3421783447265625, 0.362335205078125, 0.3824920654296875, 0.40264892578125, 0.4228057861328125, 0.442962646484375, 0.4631195068359375, 0.4832763671875, 0.5034332275390625, 0.523590087890625, 0.5437469482421875, 0.56390380859375, 0.5840606689453125, 0.604217529296875, 0.6243743896484375, 0.64453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 12.0, 9.0, 20.0, 36.0, 54.0, 105.0, 224.0, 492.0, 1322.0, 4079.0, 19936.0, 2712602.0, 1433149.0, 16507.0, 3620.0, 1200.0, 433.0, 194.0, 110.0, 70.0, 46.0, 19.0, 11.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.90234375, -3.783935546875, -3.66552734375, -3.547119140625, -3.4287109375, -3.310302734375, -3.19189453125, -3.073486328125, -2.955078125, -2.836669921875, -2.71826171875, -2.599853515625, -2.4814453125, -2.363037109375, -2.24462890625, -2.126220703125, -2.0078125, -1.889404296875, -1.77099609375, -1.652587890625, -1.5341796875, -1.415771484375, -1.29736328125, -1.178955078125, -1.060546875, -0.942138671875, -0.82373046875, -0.705322265625, -0.5869140625, -0.468505859375, -0.35009765625, -0.231689453125, -0.11328125, 0.005126953125, 0.12353515625, 0.241943359375, 0.3603515625, 0.478759765625, 0.59716796875, 0.715576171875, 0.833984375, 0.952392578125, 1.07080078125, 1.189208984375, 1.3076171875, 1.426025390625, 1.54443359375, 1.662841796875, 1.78125, 1.899658203125, 2.01806640625, 2.136474609375, 2.2548828125, 2.373291015625, 2.49169921875, 2.610107421875, 2.728515625, 2.846923828125, 2.96533203125, 3.083740234375, 3.2021484375, 3.320556640625, 3.43896484375, 3.557373046875, 3.67578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 12.0, 11.0, 16.0, 24.0, 37.0, 82.0, 229.0, 572.0, 1186.0, 1030.0, 458.0, 194.0, 82.0, 45.0, 35.0, 12.0, 17.0, 9.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9296875, -2.840545654296875, -2.75140380859375, -2.662261962890625, -2.5731201171875, -2.483978271484375, -2.39483642578125, -2.305694580078125, -2.216552734375, -2.127410888671875, -2.03826904296875, -1.949127197265625, -1.8599853515625, -1.770843505859375, -1.68170166015625, -1.592559814453125, -1.50341796875, -1.414276123046875, -1.32513427734375, -1.235992431640625, -1.1468505859375, -1.057708740234375, -0.96856689453125, -0.879425048828125, -0.790283203125, -0.701141357421875, -0.61199951171875, -0.522857666015625, -0.4337158203125, -0.344573974609375, -0.25543212890625, -0.166290283203125, -0.0771484375, 0.011993408203125, 0.10113525390625, 0.190277099609375, 0.2794189453125, 0.368560791015625, 0.45770263671875, 0.546844482421875, 0.635986328125, 0.725128173828125, 0.81427001953125, 0.903411865234375, 0.9925537109375, 1.081695556640625, 1.17083740234375, 1.259979248046875, 1.34912109375, 1.438262939453125, 1.52740478515625, 1.616546630859375, 1.7056884765625, 1.794830322265625, 1.88397216796875, 1.973114013671875, 2.062255859375, 2.151397705078125, 2.24053955078125, 2.329681396484375, 2.4188232421875, 2.507965087890625, 2.59710693359375, 2.686248779296875, 2.775390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 11.0, 24.0, 78.0, 175.0, 342.0, 239.0, 81.0, 31.0, 12.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.909996032714844, -16.993131637573242, -16.07626724243164, -15.159402847290039, -14.242537498474121, -13.32567310333252, -12.408808708190918, -11.491943359375, -10.575078964233398, -9.658214569091797, -8.741350173950195, -7.8244853019714355, -6.907620429992676, -5.990756034851074, -5.073891639709473, -4.157026767730713, -3.2401628494262695, -2.323298215866089, -1.4064337015151978, -0.48956918716430664, 0.427295446395874, 1.3441600799560547, 2.2610244750976562, 3.177889347076416, 4.094753742218018, 5.011618137359619, 5.928483009338379, 6.8453474044799805, 7.762211799621582, 8.6790771484375, 9.595941543579102, 10.512805938720703, 11.429670333862305, 12.346534729003906, 13.263399124145508, 14.18026351928711, 15.097128868103027, 16.013992309570312, 16.930858612060547, 17.84772300720215, 18.76458740234375, 19.68145179748535, 20.598316192626953, 21.515180587768555, 22.432044982910156, 23.34891128540039, 24.26577377319336, 25.182640075683594, 26.099502563476562, 27.016366958618164, 27.933231353759766, 28.850095748901367, 29.76696014404297, 30.683826446533203, 31.600688934326172, 32.517555236816406, 33.43442153930664, 34.351287841796875, 35.268150329589844, 36.18501663208008, 37.10187911987305, 38.01874542236328, 38.93560791015625, 39.852474212646484, 40.76933670043945]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 2.0, 11.0, 9.0, 15.0, 19.0, 12.0, 23.0, 30.0, 29.0, 39.0, 39.0, 55.0, 52.0, 53.0, 48.0, 44.0, 54.0, 53.0, 54.0, 56.0, 49.0, 45.0, 39.0, 30.0, 16.0, 25.0, 18.0, 25.0, 16.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.685941219329834, -7.404282569885254, -7.122623443603516, -6.8409647941589355, -6.559305667877197, -6.277647018432617, -5.995987892150879, -5.714329242706299, -5.432670593261719, -5.151011943817139, -4.8693528175354, -4.58769416809082, -4.306035041809082, -4.024376392364502, -3.7427175045013428, -3.4610586166381836, -3.1793994903564453, -2.897740602493286, -2.616081714630127, -2.334423065185547, -2.0527639389038086, -1.771105170249939, -1.4894464015960693, -1.2077875137329102, -0.926128625869751, -0.6444697380065918, -0.3628109097480774, -0.08115208148956299, 0.2005068063735962, 0.48216569423675537, 0.763824462890625, 1.0454833507537842, 1.3271417617797852, 1.6088006496429443, 1.8904595375061035, 2.1721181869506836, 2.453777313232422, 2.735435962677002, 3.017094850540161, 3.2987537384033203, 3.5804126262664795, 3.8620715141296387, 4.143730163574219, 4.425389289855957, 4.707047939300537, 4.988707065582275, 5.2703657150268555, 5.552024841308594, 5.833683490753174, 6.115342140197754, 6.397001266479492, 6.678659915924072, 6.9603190422058105, 7.241977691650391, 7.523636817932129, 7.805295467376709, 8.086954116821289, 8.368613243103027, 8.65027141571045, 8.931930541992188, 9.213589668273926, 9.495248794555664, 9.776906967163086, 10.058566093444824, 10.340225219726562]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 5.0, 17.0, 19.0, 26.0, 43.0, 52.0, 70.0, 102.0, 155.0, 205.0, 250.0, 415.0, 558.0, 841.0, 1276.0, 1765.0, 2864.0, 4353.0, 7880.0, 14986.0, 34817.0, 110175.0, 470647.0, 277479.0, 66550.0, 24326.0, 11421.0, 6128.0, 3708.0, 2391.0, 1533.0, 1074.0, 700.0, 494.0, 360.0, 238.0, 184.0, 123.0, 87.0, 58.0, 41.0, 33.0, 22.0, 29.0, 15.0, 6.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.23046875, -1.190521240234375, -1.15057373046875, -1.110626220703125, -1.0706787109375, -1.030731201171875, -0.99078369140625, -0.950836181640625, -0.910888671875, -0.870941162109375, -0.83099365234375, -0.791046142578125, -0.7510986328125, -0.711151123046875, -0.67120361328125, -0.631256103515625, -0.59130859375, -0.551361083984375, -0.51141357421875, -0.471466064453125, -0.4315185546875, -0.391571044921875, -0.35162353515625, -0.311676025390625, -0.271728515625, -0.231781005859375, -0.19183349609375, -0.151885986328125, -0.1119384765625, -0.071990966796875, -0.03204345703125, 0.007904052734375, 0.0478515625, 0.087799072265625, 0.12774658203125, 0.167694091796875, 0.2076416015625, 0.247589111328125, 0.28753662109375, 0.327484130859375, 0.367431640625, 0.407379150390625, 0.44732666015625, 0.487274169921875, 0.5272216796875, 0.567169189453125, 0.60711669921875, 0.647064208984375, 0.68701171875, 0.726959228515625, 0.76690673828125, 0.806854248046875, 0.8468017578125, 0.886749267578125, 0.92669677734375, 0.966644287109375, 1.006591796875, 1.046539306640625, 1.08648681640625, 1.126434326171875, 1.1663818359375, 1.206329345703125, 1.24627685546875, 1.286224365234375, 1.326171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 15.0, 14.0, 29.0, 21.0, 18.0, 38.0, 38.0, 29.0, 43.0, 43.0, 49.0, 46.0, 45.0, 49.0, 60.0, 45.0, 58.0, 47.0, 38.0, 39.0, 29.0, 29.0, 28.0, 19.0, 22.0, 18.0, 18.0, 14.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8956375122070312, -0.8703765869140625, -0.8451156616210938, -0.819854736328125, -0.7945938110351562, -0.7693328857421875, -0.7440719604492188, -0.71881103515625, -0.6935501098632812, -0.6682891845703125, -0.6430282592773438, -0.617767333984375, -0.5925064086914062, -0.5672454833984375, -0.5419845581054688, -0.5167236328125, -0.49146270751953125, -0.4662017822265625, -0.44094085693359375, -0.415679931640625, -0.39041900634765625, -0.3651580810546875, -0.33989715576171875, -0.31463623046875, -0.28937530517578125, -0.2641143798828125, -0.23885345458984375, -0.213592529296875, -0.18833160400390625, -0.1630706787109375, -0.13780975341796875, -0.112548828125, -0.08728790283203125, -0.0620269775390625, -0.03676605224609375, -0.011505126953125, 0.01375579833984375, 0.0390167236328125, 0.06427764892578125, 0.08953857421875, 0.11479949951171875, 0.1400604248046875, 0.16532135009765625, 0.190582275390625, 0.21584320068359375, 0.2411041259765625, 0.26636505126953125, 0.2916259765625, 0.31688690185546875, 0.3421478271484375, 0.36740875244140625, 0.392669677734375, 0.41793060302734375, 0.4431915283203125, 0.46845245361328125, 0.49371337890625, 0.5189743041992188, 0.5442352294921875, 0.5694961547851562, 0.594757080078125, 0.6200180053710938, 0.6452789306640625, 0.6705398559570312, 0.69580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 16.0, 31.0, 40.0, 58.0, 105.0, 180.0, 294.0, 477.0, 951.0, 2177.0, 6707.0, 44580.0, 928121.0, 52937.0, 7406.0, 2290.0, 987.0, 463.0, 228.0, 174.0, 95.0, 79.0, 49.0, 24.0, 16.0, 12.0, 10.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.844696044921875, -3.72650146484375, -3.608306884765625, -3.4901123046875, -3.371917724609375, -3.25372314453125, -3.135528564453125, -3.017333984375, -2.899139404296875, -2.78094482421875, -2.662750244140625, -2.5445556640625, -2.426361083984375, -2.30816650390625, -2.189971923828125, -2.07177734375, -1.953582763671875, -1.83538818359375, -1.717193603515625, -1.5989990234375, -1.480804443359375, -1.36260986328125, -1.244415283203125, -1.126220703125, -1.008026123046875, -0.88983154296875, -0.771636962890625, -0.6534423828125, -0.535247802734375, -0.41705322265625, -0.298858642578125, -0.1806640625, -0.062469482421875, 0.05572509765625, 0.173919677734375, 0.2921142578125, 0.410308837890625, 0.52850341796875, 0.646697998046875, 0.764892578125, 0.883087158203125, 1.00128173828125, 1.119476318359375, 1.2376708984375, 1.355865478515625, 1.47406005859375, 1.592254638671875, 1.71044921875, 1.828643798828125, 1.94683837890625, 2.065032958984375, 2.1832275390625, 2.301422119140625, 2.41961669921875, 2.537811279296875, 2.656005859375, 2.774200439453125, 2.89239501953125, 3.010589599609375, 3.1287841796875, 3.246978759765625, 3.36517333984375, 3.483367919921875, 3.6015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 5.0, 1.0, 7.0, 12.0, 11.0, 14.0, 11.0, 16.0, 17.0, 25.0, 24.0, 41.0, 23.0, 38.0, 49.0, 48.0, 56.0, 59.0, 57.0, 55.0, 55.0, 48.0, 44.0, 39.0, 40.0, 25.0, 32.0, 24.0, 24.0, 21.0, 10.0, 12.0, 14.0, 10.0, 3.0, 7.0, 4.0, 8.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.68359375, -3.585052490234375, -3.48651123046875, -3.387969970703125, -3.2894287109375, -3.190887451171875, -3.09234619140625, -2.993804931640625, -2.895263671875, -2.796722412109375, -2.69818115234375, -2.599639892578125, -2.5010986328125, -2.402557373046875, -2.30401611328125, -2.205474853515625, -2.10693359375, -2.008392333984375, -1.90985107421875, -1.811309814453125, -1.7127685546875, -1.614227294921875, -1.51568603515625, -1.417144775390625, -1.318603515625, -1.220062255859375, -1.12152099609375, -1.022979736328125, -0.9244384765625, -0.825897216796875, -0.72735595703125, -0.628814697265625, -0.5302734375, -0.431732177734375, -0.33319091796875, -0.234649658203125, -0.1361083984375, -0.037567138671875, 0.06097412109375, 0.159515380859375, 0.258056640625, 0.356597900390625, 0.45513916015625, 0.553680419921875, 0.6522216796875, 0.750762939453125, 0.84930419921875, 0.947845458984375, 1.04638671875, 1.144927978515625, 1.24346923828125, 1.342010498046875, 1.4405517578125, 1.539093017578125, 1.63763427734375, 1.736175537109375, 1.834716796875, 1.933258056640625, 2.03179931640625, 2.130340576171875, 2.2288818359375, 2.327423095703125, 2.42596435546875, 2.524505615234375, 2.623046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 15.0, 12.0, 34.0, 37.0, 57.0, 67.0, 129.0, 225.0, 434.0, 1080.0, 3145.0, 12439.0, 93318.0, 867260.0, 56721.0, 9241.0, 2453.0, 936.0, 400.0, 147.0, 103.0, 72.0, 51.0, 37.0, 21.0, 20.0, 15.0, 14.0, 10.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9813613891601562, -0.9519805908203125, -0.9225997924804688, -0.893218994140625, -0.8638381958007812, -0.8344573974609375, -0.8050765991210938, -0.77569580078125, -0.7463150024414062, -0.7169342041015625, -0.6875534057617188, -0.658172607421875, -0.6287918090820312, -0.5994110107421875, -0.5700302124023438, -0.5406494140625, -0.5112686157226562, -0.4818878173828125, -0.45250701904296875, -0.423126220703125, -0.39374542236328125, -0.3643646240234375, -0.33498382568359375, -0.30560302734375, -0.27622222900390625, -0.2468414306640625, -0.21746063232421875, -0.188079833984375, -0.15869903564453125, -0.1293182373046875, -0.09993743896484375, -0.070556640625, -0.04117584228515625, -0.0117950439453125, 0.01758575439453125, 0.046966552734375, 0.07634735107421875, 0.1057281494140625, 0.13510894775390625, 0.16448974609375, 0.19387054443359375, 0.2232513427734375, 0.25263214111328125, 0.282012939453125, 0.31139373779296875, 0.3407745361328125, 0.37015533447265625, 0.3995361328125, 0.42891693115234375, 0.4582977294921875, 0.48767852783203125, 0.517059326171875, 0.5464401245117188, 0.5758209228515625, 0.6052017211914062, 0.63458251953125, 0.6639633178710938, 0.6933441162109375, 0.7227249145507812, 0.752105712890625, 0.7814865112304688, 0.8108673095703125, 0.8402481079101562, 0.86962890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 4.0, 2.0, 10.0, 4.0, 6.0, 8.0, 13.0, 23.0, 25.0, 39.0, 45.0, 72.0, 114.0, 139.0, 154.0, 94.0, 62.0, 49.0, 34.0, 15.0, 21.0, 13.0, 10.0, 12.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017523765563964844, -0.00016895122826099396, -0.00016266480088233948, -0.000156378373503685, -0.00015009194612503052, -0.00014380551874637604, -0.00013751909136772156, -0.00013123266398906708, -0.0001249462366104126, -0.00011865980923175812, -0.00011237338185310364, -0.00010608695447444916, -9.980052709579468e-05, -9.35140997171402e-05, -8.722767233848572e-05, -8.094124495983124e-05, -7.465481758117676e-05, -6.836839020252228e-05, -6.20819628238678e-05, -5.579553544521332e-05, -4.950910806655884e-05, -4.322268068790436e-05, -3.693625330924988e-05, -3.06498259305954e-05, -2.4363398551940918e-05, -1.8076971173286438e-05, -1.1790543794631958e-05, -5.504116415977478e-06, 7.82310962677002e-07, 7.068738341331482e-06, 1.3355165719985962e-05, 1.9641593098640442e-05, 2.5928020477294922e-05, 3.22144478559494e-05, 3.850087523460388e-05, 4.478730261325836e-05, 5.107372999191284e-05, 5.736015737056732e-05, 6.36465847492218e-05, 6.993301212787628e-05, 7.621943950653076e-05, 8.250586688518524e-05, 8.879229426383972e-05, 9.50787216424942e-05, 0.00010136514902114868, 0.00010765157639980316, 0.00011393800377845764, 0.00012022443115711212, 0.0001265108585357666, 0.00013279728591442108, 0.00013908371329307556, 0.00014537014067173004, 0.00015165656805038452, 0.000157942995429039, 0.00016422942280769348, 0.00017051585018634796, 0.00017680227756500244, 0.00018308870494365692, 0.0001893751323223114, 0.00019566155970096588, 0.00020194798707962036, 0.00020823441445827484, 0.00021452084183692932, 0.0002208072692155838, 0.00022709369659423828]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 10.0, 8.0, 15.0, 30.0, 49.0, 48.0, 85.0, 100.0, 156.0, 241.0, 344.0, 585.0, 1013.0, 1806.0, 3882.0, 9003.0, 26742.0, 120374.0, 736172.0, 106719.0, 24593.0, 8512.0, 3759.0, 1758.0, 958.0, 549.0, 326.0, 232.0, 146.0, 97.0, 67.0, 55.0, 28.0, 24.0, 15.0, 7.0, 9.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5143661499023438, -0.4974822998046875, -0.48059844970703125, -0.463714599609375, -0.44683074951171875, -0.4299468994140625, -0.41306304931640625, -0.39617919921875, -0.37929534912109375, -0.3624114990234375, -0.34552764892578125, -0.328643798828125, -0.31175994873046875, -0.2948760986328125, -0.27799224853515625, -0.2611083984375, -0.24422454833984375, -0.2273406982421875, -0.21045684814453125, -0.193572998046875, -0.17668914794921875, -0.1598052978515625, -0.14292144775390625, -0.12603759765625, -0.10915374755859375, -0.0922698974609375, -0.07538604736328125, -0.058502197265625, -0.04161834716796875, -0.0247344970703125, -0.00785064697265625, 0.009033203125, 0.02591705322265625, 0.0428009033203125, 0.05968475341796875, 0.076568603515625, 0.09345245361328125, 0.1103363037109375, 0.12722015380859375, 0.14410400390625, 0.16098785400390625, 0.1778717041015625, 0.19475555419921875, 0.211639404296875, 0.22852325439453125, 0.2454071044921875, 0.26229095458984375, 0.2791748046875, 0.29605865478515625, 0.3129425048828125, 0.32982635498046875, 0.346710205078125, 0.36359405517578125, 0.3804779052734375, 0.39736175537109375, 0.41424560546875, 0.43112945556640625, 0.4480133056640625, 0.46489715576171875, 0.481781005859375, 0.49866485595703125, 0.5155487060546875, 0.5324325561523438, 0.54931640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 10.0, 6.0, 11.0, 8.0, 15.0, 16.0, 17.0, 37.0, 33.0, 32.0, 51.0, 58.0, 85.0, 87.0, 96.0, 82.0, 64.0, 73.0, 28.0, 36.0, 20.0, 24.0, 19.0, 13.0, 18.0, 5.0, 10.0, 4.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44824981689453125, -0.4321441650390625, -0.41603851318359375, -0.399932861328125, -0.38382720947265625, -0.3677215576171875, -0.35161590576171875, -0.33551025390625, -0.31940460205078125, -0.3032989501953125, -0.28719329833984375, -0.271087646484375, -0.25498199462890625, -0.2388763427734375, -0.22277069091796875, -0.2066650390625, -0.19055938720703125, -0.1744537353515625, -0.15834808349609375, -0.142242431640625, -0.12613677978515625, -0.1100311279296875, -0.09392547607421875, -0.07781982421875, -0.06171417236328125, -0.0456085205078125, -0.02950286865234375, -0.013397216796875, 0.00270843505859375, 0.0188140869140625, 0.03491973876953125, 0.051025390625, 0.06713104248046875, 0.0832366943359375, 0.09934234619140625, 0.115447998046875, 0.13155364990234375, 0.1476593017578125, 0.16376495361328125, 0.17987060546875, 0.19597625732421875, 0.2120819091796875, 0.22818756103515625, 0.244293212890625, 0.26039886474609375, 0.2765045166015625, 0.29261016845703125, 0.3087158203125, 0.32482147216796875, 0.3409271240234375, 0.35703277587890625, 0.373138427734375, 0.38924407958984375, 0.4053497314453125, 0.42145538330078125, 0.43756103515625, 0.45366668701171875, 0.4697723388671875, 0.48587799072265625, 0.501983642578125, 0.5180892944335938, 0.5341949462890625, 0.5503005981445312, 0.56640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 13.0, 43.0, 147.0, 549.0, 159.0, 50.0, 19.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.531171798706055, -20.42557716369629, -19.319982528686523, -18.214385986328125, -17.10879135131836, -16.003196716308594, -14.897602081298828, -13.792007446289062, -12.68641185760498, -11.580817222595215, -10.475221633911133, -9.369626998901367, -8.264032363891602, -7.1584367752075195, -6.052842140197754, -4.94724702835083, -3.8416519165039062, -2.7360568046569824, -1.6304619312286377, -0.524867057800293, 0.5807280540466309, 1.6863231658935547, 2.7919178009033203, 3.897512912750244, 5.003108024597168, 6.108703136444092, 7.214298248291016, 8.319892883300781, 9.425487518310547, 10.531083106994629, 11.636677742004395, 12.742273330688477, 13.84786605834961, 14.953460693359375, 16.05905532836914, 17.164649963378906, 18.270246505737305, 19.37584114074707, 20.481435775756836, 21.5870304107666, 22.692626953125, 23.798221588134766, 24.90381622314453, 26.009410858154297, 27.115007400512695, 28.22060203552246, 29.326196670532227, 30.431791305541992, 31.537385940551758, 32.642982482910156, 33.74857711791992, 34.85417175292969, 35.95976638793945, 37.06536102294922, 38.170955657958984, 39.27655029296875, 40.382144927978516, 41.48773956298828, 42.59333419799805, 43.69892883300781, 44.80452346801758, 45.910118103027344, 47.015716552734375, 48.12131118774414, 49.226905822753906]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 19.0, 18.0, 23.0, 13.0, 23.0, 31.0, 35.0, 44.0, 74.0, 145.0, 124.0, 50.0, 41.0, 36.0, 27.0, 27.0, 25.0, 18.0, 26.0, 18.0, 19.0, 13.0, 16.0, 12.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.020453453063965, -11.640933990478516, -11.261414527893066, -10.881895065307617, -10.502376556396484, -10.122857093811035, -9.743337631225586, -9.363818168640137, -8.984298706054688, -8.604779243469238, -8.225259780883789, -7.845740795135498, -7.466221809387207, -7.086702346801758, -6.707182884216309, -6.327663421630859, -5.948144912719727, -5.568625450134277, -5.189106464385986, -4.809587001800537, -4.430068016052246, -4.050548553466797, -3.6710290908813477, -3.2915098667144775, -2.9119906425476074, -2.5324714183807373, -2.152952194213867, -1.773432731628418, -1.3939135074615479, -1.0143942832946777, -0.6348748207092285, -0.2553555965423584, 0.12416362762451172, 0.5036829113960266, 0.8832021951675415, 1.2627215385437012, 1.6422407627105713, 2.0217599868774414, 2.4012794494628906, 2.7807986736297607, 3.160317897796631, 3.539837121963501, 3.919356346130371, 4.29887580871582, 4.6783952713012695, 5.0579142570495605, 5.43743371963501, 5.816952705383301, 6.19647216796875, 6.575991630554199, 6.95551061630249, 7.3350300788879395, 7.7145490646362305, 8.09406852722168, 8.473587989807129, 8.853107452392578, 9.232625961303711, 9.61214542388916, 9.99166488647461, 10.371183395385742, 10.750702857971191, 11.13022232055664, 11.50974178314209, 11.889261245727539, 12.268780708312988]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 11.0, 14.0, 15.0, 24.0, 25.0, 31.0, 53.0, 73.0, 96.0, 160.0, 203.0, 292.0, 417.0, 664.0, 1071.0, 1892.0, 3433.0, 7462.0, 21765.0, 128961.0, 1266178.0, 2334491.0, 357582.0, 45384.0, 12408.0, 5116.0, 2551.0, 1344.0, 860.0, 532.0, 350.0, 249.0, 176.0, 104.0, 80.0, 57.0, 40.0, 29.0, 22.0, 14.0, 7.0, 9.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.541015625, -1.490020751953125, -1.43902587890625, -1.388031005859375, -1.3370361328125, -1.286041259765625, -1.23504638671875, -1.184051513671875, -1.133056640625, -1.082061767578125, -1.03106689453125, -0.980072021484375, -0.9290771484375, -0.878082275390625, -0.82708740234375, -0.776092529296875, -0.72509765625, -0.674102783203125, -0.62310791015625, -0.572113037109375, -0.5211181640625, -0.470123291015625, -0.41912841796875, -0.368133544921875, -0.317138671875, -0.266143798828125, -0.21514892578125, -0.164154052734375, -0.1131591796875, -0.062164306640625, -0.01116943359375, 0.039825439453125, 0.0908203125, 0.141815185546875, 0.19281005859375, 0.243804931640625, 0.2947998046875, 0.345794677734375, 0.39678955078125, 0.447784423828125, 0.498779296875, 0.549774169921875, 0.60076904296875, 0.651763916015625, 0.7027587890625, 0.753753662109375, 0.80474853515625, 0.855743408203125, 0.90673828125, 0.957733154296875, 1.00872802734375, 1.059722900390625, 1.1107177734375, 1.161712646484375, 1.21270751953125, 1.263702392578125, 1.314697265625, 1.365692138671875, 1.41668701171875, 1.467681884765625, 1.5186767578125, 1.569671630859375, 1.62066650390625, 1.671661376953125, 1.72265625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 6.0, 13.0, 20.0, 11.0, 20.0, 35.0, 25.0, 38.0, 28.0, 37.0, 37.0, 35.0, 54.0, 36.0, 44.0, 48.0, 48.0, 45.0, 44.0, 62.0, 37.0, 48.0, 41.0, 28.0, 25.0, 23.0, 18.0, 19.0, 20.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.9111328125, -0.8868637084960938, -0.8625946044921875, -0.8383255004882812, -0.814056396484375, -0.7897872924804688, -0.7655181884765625, -0.7412490844726562, -0.71697998046875, -0.6927108764648438, -0.6684417724609375, -0.6441726684570312, -0.619903564453125, -0.5956344604492188, -0.5713653564453125, -0.5470962524414062, -0.5228271484375, -0.49855804443359375, -0.4742889404296875, -0.45001983642578125, -0.425750732421875, -0.40148162841796875, -0.3772125244140625, -0.35294342041015625, -0.32867431640625, -0.30440521240234375, -0.2801361083984375, -0.25586700439453125, -0.231597900390625, -0.20732879638671875, -0.1830596923828125, -0.15879058837890625, -0.134521484375, -0.11025238037109375, -0.0859832763671875, -0.06171417236328125, -0.037445068359375, -0.01317596435546875, 0.0110931396484375, 0.03536224365234375, 0.05963134765625, 0.08390045166015625, 0.1081695556640625, 0.13243865966796875, 0.156707763671875, 0.18097686767578125, 0.2052459716796875, 0.22951507568359375, 0.2537841796875, 0.27805328369140625, 0.3023223876953125, 0.32659149169921875, 0.350860595703125, 0.37512969970703125, 0.3993988037109375, 0.42366790771484375, 0.44793701171875, 0.47220611572265625, 0.4964752197265625, 0.5207443237304688, 0.545013427734375, 0.5692825317382812, 0.5935516357421875, 0.6178207397460938, 0.64208984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 11.0, 14.0, 22.0, 28.0, 37.0, 53.0, 83.0, 98.0, 220.0, 359.0, 890.0, 2379.0, 9807.0, 135672.0, 3989086.0, 46973.0, 5657.0, 1536.0, 619.0, 254.0, 158.0, 77.0, 64.0, 41.0, 33.0, 22.0, 13.0, 14.0, 12.0, 15.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.76171875, -4.59381103515625, -4.4259033203125, -4.25799560546875, -4.090087890625, -3.92218017578125, -3.7542724609375, -3.58636474609375, -3.41845703125, -3.25054931640625, -3.0826416015625, -2.91473388671875, -2.746826171875, -2.57891845703125, -2.4110107421875, -2.24310302734375, -2.0751953125, -1.90728759765625, -1.7393798828125, -1.57147216796875, -1.403564453125, -1.23565673828125, -1.0677490234375, -0.89984130859375, -0.73193359375, -0.56402587890625, -0.3961181640625, -0.22821044921875, -0.060302734375, 0.10760498046875, 0.2755126953125, 0.44342041015625, 0.611328125, 0.77923583984375, 0.9471435546875, 1.11505126953125, 1.282958984375, 1.45086669921875, 1.6187744140625, 1.78668212890625, 1.95458984375, 2.12249755859375, 2.2904052734375, 2.45831298828125, 2.626220703125, 2.79412841796875, 2.9620361328125, 3.12994384765625, 3.2978515625, 3.46575927734375, 3.6336669921875, 3.80157470703125, 3.969482421875, 4.13739013671875, 4.3052978515625, 4.47320556640625, 4.64111328125, 4.80902099609375, 4.9769287109375, 5.14483642578125, 5.312744140625, 5.48065185546875, 5.6485595703125, 5.81646728515625, 5.984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 10.0, 13.0, 21.0, 28.0, 26.0, 52.0, 81.0, 137.0, 220.0, 350.0, 646.0, 876.0, 653.0, 386.0, 225.0, 116.0, 82.0, 50.0, 30.0, 14.0, 19.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.345977783203125, -3.23687744140625, -3.127777099609375, -3.0186767578125, -2.909576416015625, -2.80047607421875, -2.691375732421875, -2.582275390625, -2.473175048828125, -2.36407470703125, -2.254974365234375, -2.1458740234375, -2.036773681640625, -1.92767333984375, -1.818572998046875, -1.70947265625, -1.600372314453125, -1.49127197265625, -1.382171630859375, -1.2730712890625, -1.163970947265625, -1.05487060546875, -0.945770263671875, -0.836669921875, -0.727569580078125, -0.61846923828125, -0.509368896484375, -0.4002685546875, -0.291168212890625, -0.18206787109375, -0.072967529296875, 0.0361328125, 0.145233154296875, 0.25433349609375, 0.363433837890625, 0.4725341796875, 0.581634521484375, 0.69073486328125, 0.799835205078125, 0.908935546875, 1.018035888671875, 1.12713623046875, 1.236236572265625, 1.3453369140625, 1.454437255859375, 1.56353759765625, 1.672637939453125, 1.78173828125, 1.890838623046875, 1.99993896484375, 2.109039306640625, 2.2181396484375, 2.327239990234375, 2.43634033203125, 2.545440673828125, 2.654541015625, 2.763641357421875, 2.87274169921875, 2.981842041015625, 3.0909423828125, 3.200042724609375, 3.30914306640625, 3.418243408203125, 3.52734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 23.0, 39.0, 90.0, 186.0, 274.0, 197.0, 96.0, 37.0, 17.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.7006950378418, -49.388797760009766, -48.076904296875, -46.76500701904297, -45.45310974121094, -44.14121627807617, -42.82931900024414, -41.517425537109375, -40.205528259277344, -38.89363098144531, -37.58173751831055, -36.269840240478516, -34.95794677734375, -33.64604949951172, -32.33415222167969, -31.02225685119629, -29.71036148071289, -28.398466110229492, -27.086570739746094, -25.774673461914062, -24.462778091430664, -23.150882720947266, -21.838985443115234, -20.527090072631836, -19.215194702148438, -17.90329933166504, -16.59140396118164, -15.27950668334961, -13.967611312866211, -12.655715942382812, -11.343819618225098, -10.031923294067383, -8.720024108886719, -7.408128261566162, -6.0962324142456055, -4.784336566925049, -3.472440719604492, -2.1605448722839355, -0.8486490249633789, 0.46324729919433594, 1.7751426696777344, 3.087038516998291, 4.398934364318848, 5.710830211639404, 7.022726058959961, 8.33462142944336, 9.646517753601074, 10.958414077758789, 12.270309448242188, 13.582204818725586, 14.8941011428833, 16.205997467041016, 17.517892837524414, 18.829788208007812, 20.141685485839844, 21.453580856323242, 22.76547622680664, 24.07737159729004, 25.389266967773438, 26.70116424560547, 28.013059616088867, 29.324954986572266, 30.636852264404297, 31.948747634887695, 33.260643005371094]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 3.0, 8.0, 11.0, 10.0, 10.0, 19.0, 24.0, 25.0, 39.0, 33.0, 40.0, 35.0, 48.0, 64.0, 64.0, 66.0, 48.0, 53.0, 52.0, 55.0, 42.0, 33.0, 37.0, 23.0, 37.0, 16.0, 32.0, 10.0, 10.0, 9.0, 11.0, 3.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.228525161743164, -16.702938079833984, -16.177352905273438, -15.651765823364258, -15.126178741455078, -14.600592613220215, -14.075006484985352, -13.549419403076172, -13.023833274841309, -12.498247146606445, -11.972660064697266, -11.447073936462402, -10.921487808227539, -10.39590072631836, -9.870314598083496, -9.344728469848633, -8.819141387939453, -8.29355525970459, -7.76796817779541, -7.242382049560547, -6.716795444488525, -6.191208839416504, -5.665622711181641, -5.140036106109619, -4.614449501037598, -4.088862895965576, -3.563276529312134, -3.0376901626586914, -2.51210355758667, -1.9865169525146484, -1.460930585861206, -0.9353442192077637, -0.409759521484375, 0.11582696437835693, 0.6414134502410889, 1.1669999361038208, 1.6925864219665527, 2.218173027038574, 2.7437593936920166, 3.269345760345459, 3.7949323654174805, 4.320518970489502, 4.846105575561523, 5.371691703796387, 5.897278308868408, 6.42286491394043, 6.948451042175293, 7.4740376472473145, 7.999624252319336, 8.5252103805542, 9.050797462463379, 9.576383590698242, 10.101970672607422, 10.627556800842285, 11.153142929077148, 11.678730010986328, 12.204316139221191, 12.729902267456055, 13.255489349365234, 13.781075477600098, 14.306661605834961, 14.83224868774414, 15.357834815979004, 15.883420944213867, 16.409008026123047]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 10.0, 10.0, 15.0, 24.0, 46.0, 66.0, 83.0, 177.0, 364.0, 802.0, 1951.0, 6153.0, 27789.0, 434704.0, 535577.0, 30654.0, 6439.0, 2006.0, 841.0, 392.0, 182.0, 101.0, 60.0, 29.0, 23.0, 12.0, 8.0, 10.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.201171875, -2.130218505859375, -2.05926513671875, -1.988311767578125, -1.9173583984375, -1.846405029296875, -1.77545166015625, -1.704498291015625, -1.633544921875, -1.562591552734375, -1.49163818359375, -1.420684814453125, -1.3497314453125, -1.278778076171875, -1.20782470703125, -1.136871337890625, -1.06591796875, -0.994964599609375, -0.92401123046875, -0.853057861328125, -0.7821044921875, -0.711151123046875, -0.64019775390625, -0.569244384765625, -0.498291015625, -0.427337646484375, -0.35638427734375, -0.285430908203125, -0.2144775390625, -0.143524169921875, -0.07257080078125, -0.001617431640625, 0.0693359375, 0.140289306640625, 0.21124267578125, 0.282196044921875, 0.3531494140625, 0.424102783203125, 0.49505615234375, 0.566009521484375, 0.636962890625, 0.707916259765625, 0.77886962890625, 0.849822998046875, 0.9207763671875, 0.991729736328125, 1.06268310546875, 1.133636474609375, 1.20458984375, 1.275543212890625, 1.34649658203125, 1.417449951171875, 1.4884033203125, 1.559356689453125, 1.63031005859375, 1.701263427734375, 1.772216796875, 1.843170166015625, 1.91412353515625, 1.985076904296875, 2.0560302734375, 2.126983642578125, 2.19793701171875, 2.268890380859375, 2.33984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 15.0, 27.0, 32.0, 46.0, 55.0, 74.0, 88.0, 106.0, 85.0, 106.0, 95.0, 65.0, 60.0, 45.0, 26.0, 22.0, 17.0, 11.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.783203125, -1.7263946533203125, -1.669586181640625, -1.6127777099609375, -1.55596923828125, -1.4991607666015625, -1.442352294921875, -1.3855438232421875, -1.3287353515625, -1.2719268798828125, -1.215118408203125, -1.1583099365234375, -1.10150146484375, -1.0446929931640625, -0.987884521484375, -0.9310760498046875, -0.874267578125, -0.8174591064453125, -0.760650634765625, -0.7038421630859375, -0.64703369140625, -0.5902252197265625, -0.533416748046875, -0.4766082763671875, -0.4197998046875, -0.3629913330078125, -0.306182861328125, -0.2493743896484375, -0.19256591796875, -0.1357574462890625, -0.078948974609375, -0.0221405029296875, 0.03466796875, 0.0914764404296875, 0.148284912109375, 0.2050933837890625, 0.26190185546875, 0.3187103271484375, 0.375518798828125, 0.4323272705078125, 0.4891357421875, 0.5459442138671875, 0.602752685546875, 0.6595611572265625, 0.71636962890625, 0.7731781005859375, 0.829986572265625, 0.8867950439453125, 0.943603515625, 1.0004119873046875, 1.057220458984375, 1.1140289306640625, 1.17083740234375, 1.2276458740234375, 1.284454345703125, 1.3412628173828125, 1.3980712890625, 1.4548797607421875, 1.511688232421875, 1.5684967041015625, 1.62530517578125, 1.6821136474609375, 1.738922119140625, 1.7957305908203125, 1.8525390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 5.0, 10.0, 17.0, 12.0, 17.0, 22.0, 49.0, 59.0, 108.0, 165.0, 271.0, 616.0, 1411.0, 4898.0, 39122.0, 953376.0, 40355.0, 5212.0, 1453.0, 581.0, 273.0, 180.0, 121.0, 56.0, 52.0, 28.0, 23.0, 21.0, 9.0, 11.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.400177001953125, -2.31597900390625, -2.231781005859375, -2.1475830078125, -2.063385009765625, -1.97918701171875, -1.894989013671875, -1.810791015625, -1.726593017578125, -1.64239501953125, -1.558197021484375, -1.4739990234375, -1.389801025390625, -1.30560302734375, -1.221405029296875, -1.13720703125, -1.053009033203125, -0.96881103515625, -0.884613037109375, -0.8004150390625, -0.716217041015625, -0.63201904296875, -0.547821044921875, -0.463623046875, -0.379425048828125, -0.29522705078125, -0.211029052734375, -0.1268310546875, -0.042633056640625, 0.04156494140625, 0.125762939453125, 0.2099609375, 0.294158935546875, 0.37835693359375, 0.462554931640625, 0.5467529296875, 0.630950927734375, 0.71514892578125, 0.799346923828125, 0.883544921875, 0.967742919921875, 1.05194091796875, 1.136138916015625, 1.2203369140625, 1.304534912109375, 1.38873291015625, 1.472930908203125, 1.55712890625, 1.641326904296875, 1.72552490234375, 1.809722900390625, 1.8939208984375, 1.978118896484375, 2.06231689453125, 2.146514892578125, 2.230712890625, 2.314910888671875, 2.39910888671875, 2.483306884765625, 2.5675048828125, 2.651702880859375, 2.73590087890625, 2.820098876953125, 2.904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 7.0, 13.0, 8.0, 11.0, 23.0, 25.0, 29.0, 35.0, 44.0, 68.0, 69.0, 100.0, 95.0, 94.0, 65.0, 49.0, 31.0, 40.0, 32.0, 19.0, 22.0, 17.0, 20.0, 13.0, 10.0, 9.0, 6.0, 11.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.55206298828125, -4.3970947265625, -4.24212646484375, -4.087158203125, -3.93218994140625, -3.7772216796875, -3.62225341796875, -3.46728515625, -3.31231689453125, -3.1573486328125, -3.00238037109375, -2.847412109375, -2.69244384765625, -2.5374755859375, -2.38250732421875, -2.2275390625, -2.07257080078125, -1.9176025390625, -1.76263427734375, -1.607666015625, -1.45269775390625, -1.2977294921875, -1.14276123046875, -0.98779296875, -0.83282470703125, -0.6778564453125, -0.52288818359375, -0.367919921875, -0.21295166015625, -0.0579833984375, 0.09698486328125, 0.251953125, 0.40692138671875, 0.5618896484375, 0.71685791015625, 0.871826171875, 1.02679443359375, 1.1817626953125, 1.33673095703125, 1.49169921875, 1.64666748046875, 1.8016357421875, 1.95660400390625, 2.111572265625, 2.26654052734375, 2.4215087890625, 2.57647705078125, 2.7314453125, 2.88641357421875, 3.0413818359375, 3.19635009765625, 3.351318359375, 3.50628662109375, 3.6612548828125, 3.81622314453125, 3.97119140625, 4.12615966796875, 4.2811279296875, 4.43609619140625, 4.591064453125, 4.74603271484375, 4.9010009765625, 5.05596923828125, 5.2109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 9.0, 5.0, 10.0, 21.0, 19.0, 34.0, 41.0, 54.0, 83.0, 88.0, 116.0, 150.0, 230.0, 305.0, 448.0, 620.0, 1026.0, 1607.0, 2860.0, 5453.0, 12410.0, 41001.0, 816593.0, 125048.0, 21789.0, 8337.0, 3973.0, 2182.0, 1355.0, 767.0, 556.0, 368.0, 247.0, 176.0, 133.0, 88.0, 75.0, 53.0, 39.0, 40.0, 29.0, 24.0, 24.0, 18.0, 9.0, 6.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.283935546875, -0.2747077941894531, -0.26548004150390625, -0.2562522888183594, -0.2470245361328125, -0.23779678344726562, -0.22856903076171875, -0.21934127807617188, -0.210113525390625, -0.20088577270507812, -0.19165802001953125, -0.18243026733398438, -0.1732025146484375, -0.16397476196289062, -0.15474700927734375, -0.14551925659179688, -0.13629150390625, -0.12706375122070312, -0.11783599853515625, -0.10860824584960938, -0.0993804931640625, -0.09015274047851562, -0.08092498779296875, -0.07169723510742188, -0.062469482421875, -0.053241729736328125, -0.04401397705078125, -0.034786224365234375, -0.0255584716796875, -0.016330718994140625, -0.00710296630859375, 0.002124786376953125, 0.0113525390625, 0.020580291748046875, 0.02980804443359375, 0.039035797119140625, 0.0482635498046875, 0.057491302490234375, 0.06671905517578125, 0.07594680786132812, 0.085174560546875, 0.09440231323242188, 0.10363006591796875, 0.11285781860351562, 0.1220855712890625, 0.13131332397460938, 0.14054107666015625, 0.14976882934570312, 0.15899658203125, 0.16822433471679688, 0.17745208740234375, 0.18667984008789062, 0.1959075927734375, 0.20513534545898438, 0.21436309814453125, 0.22359085083007812, 0.232818603515625, 0.24204635620117188, 0.25127410888671875, 0.2605018615722656, 0.2697296142578125, 0.2789573669433594, 0.28818511962890625, 0.2974128723144531, 0.306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0, 8.0, 11.0, 17.0, 21.0, 37.0, 64.0, 143.0, 324.0, 175.0, 79.0, 35.0, 24.0, 16.0, 11.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020551681518554688, -0.00019777566194534302, -0.00019003450870513916, -0.0001822933554649353, -0.00017455220222473145, -0.0001668110489845276, -0.00015906989574432373, -0.00015132874250411987, -0.00014358758926391602, -0.00013584643602371216, -0.0001281052827835083, -0.00012036412954330444, -0.00011262297630310059, -0.00010488182306289673, -9.714066982269287e-05, -8.939951658248901e-05, -8.165836334228516e-05, -7.39172101020813e-05, -6.617605686187744e-05, -5.8434903621673584e-05, -5.0693750381469727e-05, -4.295259714126587e-05, -3.521144390106201e-05, -2.7470290660858154e-05, -1.9729137420654297e-05, -1.198798418045044e-05, -4.246830940246582e-06, 3.4943222999572754e-06, 1.1235475540161133e-05, 1.897662878036499e-05, 2.6717782020568848e-05, 3.4458935260772705e-05, 4.220008850097656e-05, 4.994124174118042e-05, 5.768239498138428e-05, 6.542354822158813e-05, 7.316470146179199e-05, 8.090585470199585e-05, 8.864700794219971e-05, 9.638816118240356e-05, 0.00010412931442260742, 0.00011187046766281128, 0.00011961162090301514, 0.000127352774143219, 0.00013509392738342285, 0.0001428350806236267, 0.00015057623386383057, 0.00015831738710403442, 0.00016605854034423828, 0.00017379969358444214, 0.000181540846824646, 0.00018928200006484985, 0.0001970231533050537, 0.00020476430654525757, 0.00021250545978546143, 0.00022024661302566528, 0.00022798776626586914, 0.000235728919506073, 0.00024347007274627686, 0.0002512112259864807, 0.00025895237922668457, 0.00026669353246688843, 0.0002744346857070923, 0.00028217583894729614, 0.0002899169921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 13.0, 30.0, 24.0, 33.0, 43.0, 59.0, 92.0, 150.0, 215.0, 288.0, 491.0, 709.0, 1186.0, 2083.0, 4201.0, 8900.0, 24586.0, 136122.0, 796186.0, 46793.0, 13635.0, 5687.0, 2818.0, 1629.0, 866.0, 567.0, 374.0, 239.0, 153.0, 100.0, 94.0, 57.0, 24.0, 25.0, 15.0, 9.0, 8.0, 8.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.263671875, -0.2546501159667969, -0.24562835693359375, -0.23660659790039062, -0.2275848388671875, -0.21856307983398438, -0.20954132080078125, -0.20051956176757812, -0.191497802734375, -0.18247604370117188, -0.17345428466796875, -0.16443252563476562, -0.1554107666015625, -0.14638900756835938, -0.13736724853515625, -0.12834548950195312, -0.11932373046875, -0.11030197143554688, -0.10128021240234375, -0.09225845336914062, -0.0832366943359375, -0.07421493530273438, -0.06519317626953125, -0.056171417236328125, -0.047149658203125, -0.038127899169921875, -0.02910614013671875, -0.020084381103515625, -0.0110626220703125, -0.002040863037109375, 0.00698089599609375, 0.016002655029296875, 0.0250244140625, 0.034046173095703125, 0.04306793212890625, 0.052089691162109375, 0.0611114501953125, 0.07013320922851562, 0.07915496826171875, 0.08817672729492188, 0.097198486328125, 0.10622024536132812, 0.11524200439453125, 0.12426376342773438, 0.1332855224609375, 0.14230728149414062, 0.15132904052734375, 0.16035079956054688, 0.16937255859375, 0.17839431762695312, 0.18741607666015625, 0.19643783569335938, 0.2054595947265625, 0.21448135375976562, 0.22350311279296875, 0.23252487182617188, 0.241546630859375, 0.2505683898925781, 0.25959014892578125, 0.2686119079589844, 0.2776336669921875, 0.2866554260253906, 0.29567718505859375, 0.3046989440917969, 0.313720703125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 8.0, 12.0, 5.0, 5.0, 5.0, 10.0, 10.0, 20.0, 26.0, 38.0, 102.0, 125.0, 203.0, 156.0, 82.0, 45.0, 18.0, 23.0, 14.0, 14.0, 11.0, 9.0, 11.0, 4.0, 4.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5181045532226562, -0.5005645751953125, -0.48302459716796875, -0.465484619140625, -0.44794464111328125, -0.4304046630859375, -0.41286468505859375, -0.39532470703125, -0.37778472900390625, -0.3602447509765625, -0.34270477294921875, -0.325164794921875, -0.30762481689453125, -0.2900848388671875, -0.27254486083984375, -0.2550048828125, -0.23746490478515625, -0.2199249267578125, -0.20238494873046875, -0.184844970703125, -0.16730499267578125, -0.1497650146484375, -0.13222503662109375, -0.11468505859375, -0.09714508056640625, -0.0796051025390625, -0.06206512451171875, -0.044525146484375, -0.02698516845703125, -0.0094451904296875, 0.00809478759765625, 0.025634765625, 0.04317474365234375, 0.0607147216796875, 0.07825469970703125, 0.095794677734375, 0.11333465576171875, 0.1308746337890625, 0.14841461181640625, 0.16595458984375, 0.18349456787109375, 0.2010345458984375, 0.21857452392578125, 0.236114501953125, 0.25365447998046875, 0.2711944580078125, 0.28873443603515625, 0.3062744140625, 0.32381439208984375, 0.3413543701171875, 0.35889434814453125, 0.376434326171875, 0.39397430419921875, 0.4115142822265625, 0.42905426025390625, 0.44659423828125, 0.46413421630859375, 0.4816741943359375, 0.49921417236328125, 0.516754150390625, 0.5342941284179688, 0.5518341064453125, 0.5693740844726562, 0.5869140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 15.0, 27.0, 56.0, 90.0, 567.0, 127.0, 50.0, 33.0, 11.0, 13.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.343408584594727, -28.584228515625, -27.825048446655273, -27.065868377685547, -26.306690216064453, -25.547510147094727, -24.788330078125, -24.029150009155273, -23.269969940185547, -22.51078987121582, -21.751609802246094, -20.992431640625, -20.233251571655273, -19.474071502685547, -18.71489143371582, -17.955711364746094, -17.196533203125, -16.437353134155273, -15.678174018859863, -14.918993949890137, -14.159814834594727, -13.400634765625, -12.641454696655273, -11.882274627685547, -11.123095512390137, -10.36391544342041, -9.604736328125, -8.845556259155273, -8.086376190185547, -7.327197074890137, -6.56801700592041, -5.808837413787842, -5.049655914306641, -4.290476322174072, -3.531296491622925, -2.7721166610717773, -2.012937068939209, -1.2537574768066406, -0.49457740783691406, 0.2646021842956543, 1.0237817764282227, 1.7829614877700806, 2.5421411991119385, 3.301321029663086, 4.060500621795654, 4.819680213928223, 5.578860282897949, 6.338039875030518, 7.097219467163086, 7.856399059295654, 8.615578651428223, 9.37475872039795, 10.13393783569336, 10.893117904663086, 11.652297973632812, 12.411478042602539, 13.17065715789795, 13.929837226867676, 14.689016342163086, 15.448196411132812, 16.20737648010254, 16.966556549072266, 17.72573471069336, 18.484914779663086, 19.244094848632812]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 18.0, 14.0, 18.0, 7.0, 18.0, 23.0, 21.0, 28.0, 35.0, 37.0, 56.0, 283.0, 216.0, 46.0, 27.0, 33.0, 21.0, 17.0, 10.0, 16.0, 15.0, 8.0, 7.0, 3.0, 7.0, 4.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.077590942382812, -21.524276733398438, -20.970964431762695, -20.41765022277832, -19.864336013793945, -19.311023712158203, -18.757709503173828, -18.204395294189453, -17.651081085205078, -17.097766876220703, -16.54445457458496, -15.991140365600586, -15.437826156616211, -14.884512901306152, -14.331199645996094, -13.777885437011719, -13.224573135375977, -12.671259880065918, -12.117945671081543, -11.564632415771484, -11.01131820678711, -10.45800495147705, -9.904691696166992, -9.351377487182617, -8.798064231872559, -8.2447509765625, -7.691436767578125, -7.138123512268066, -6.58480978012085, -6.031496047973633, -5.478182792663574, -4.924869060516357, -4.371553421020508, -3.818239688873291, -3.2649261951446533, -2.7116127014160156, -2.158298969268799, -1.604985237121582, -1.0516717433929443, -0.49835824966430664, 0.054955482482910156, 0.6082690954208374, 1.1615827083587646, 1.714896321296692, 2.268209934234619, 2.821523666381836, 3.3748371601104736, 3.9281506538391113, 4.481464385986328, 5.034778118133545, 5.588091850280762, 6.14140510559082, 6.694718837738037, 7.248032569885254, 7.8013458251953125, 8.354660034179688, 8.907973289489746, 9.461286544799805, 10.01460075378418, 10.567914009094238, 11.121227264404297, 11.674541473388672, 12.22785472869873, 12.781167984008789, 13.334482192993164]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 4.0, 5.0, 7.0, 5.0, 9.0, 6.0, 11.0, 10.0, 13.0, 10.0, 18.0, 26.0, 20.0, 21.0, 27.0, 27.0, 44.0, 51.0, 80.0, 213.0, 100.0, 41.0, 46.0, 15.0, 31.0, 25.0, 16.0, 17.0, 19.0, 20.0, 15.0, 12.0, 10.0, 8.0, 5.0, 0.0, 3.0, 4.0, 1.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.9716796875, -0.9464340209960938, -0.9211883544921875, -0.8959426879882812, -0.870697021484375, -0.8454513549804688, -0.8202056884765625, -0.7949600219726562, -0.76971435546875, -0.7444686889648438, -0.7192230224609375, -0.6939773559570312, -0.668731689453125, -0.6434860229492188, -0.6182403564453125, -0.5929946899414062, -0.5677490234375, -0.5425033569335938, -0.5172576904296875, -0.49201202392578125, -0.466766357421875, -0.44152069091796875, -0.4162750244140625, -0.39102935791015625, -0.36578369140625, -0.34053802490234375, -0.3152923583984375, -0.29004669189453125, -0.264801025390625, -0.23955535888671875, -0.2143096923828125, -0.18906402587890625, -0.163818359375, -0.13857269287109375, -0.1133270263671875, -0.08808135986328125, -0.062835693359375, -0.03759002685546875, -0.0123443603515625, 0.01290130615234375, 0.03814697265625, 0.06339263916015625, 0.0886383056640625, 0.11388397216796875, 0.139129638671875, 0.16437530517578125, 0.1896209716796875, 0.21486663818359375, 0.2401123046875, 0.26535797119140625, 0.2906036376953125, 0.31584930419921875, 0.341094970703125, 0.36634063720703125, 0.3915863037109375, 0.41683197021484375, 0.44207763671875, 0.46732330322265625, 0.4925689697265625, 0.5178146362304688, 0.543060302734375, 0.5683059692382812, 0.5935516357421875, 0.6187973022460938, 0.64404296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0, 11.0, 9.0, 7.0, 13.0, 11.0, 32.0, 37.0, 67.0, 107.0, 184.0, 363.0, 812.0, 2454.0, 10997.0, 8336661.0, 30420.0, 4010.0, 1253.0, 501.0, 239.0, 122.0, 71.0, 57.0, 40.0, 25.0, 12.0, 10.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.116008758544922, -7.867669105529785, -7.619329929351807, -7.37099027633667, -7.122651100158691, -6.874311447143555, -6.625971794128418, -6.3776326179504395, -6.129293441772461, -5.880953788757324, -5.632614612579346, -5.384274959564209, -5.1359357833862305, -4.887596130371094, -4.639256477355957, -4.3909173011779785, -4.142577648162842, -3.894238233566284, -3.6458988189697266, -3.39755916595459, -3.1492199897766113, -2.9008803367614746, -2.652540922164917, -2.4042015075683594, -2.1558620929718018, -1.9075226783752441, -1.6591832637786865, -1.4108437299728394, -1.1625043153762817, -0.9141649007797241, -0.665825366973877, -0.41748595237731934, -0.16914606094360352, 0.07919338345527649, 0.3275328278541565, 0.5758723020553589, 0.8242117166519165, 1.0725511312484741, 1.3208906650543213, 1.569230079650879, 1.8175694942474365, 2.065908908843994, 2.3142483234405518, 2.5625877380371094, 2.810927391052246, 3.0592665672302246, 3.3076062202453613, 3.555945634841919, 3.8042850494384766, 4.052624702453613, 4.300963878631592, 4.5493035316467285, 4.797642707824707, 5.045982360839844, 5.2943220138549805, 5.542661190032959, 5.7910003662109375, 6.039340019226074, 6.287679195404053, 6.5360188484191895, 6.784358024597168, 7.032697677612305, 7.281037330627441, 7.52937650680542, 7.777716159820557]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 7.0, 8.0, 3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.90190601348877, -13.522135734558105, -13.142365455627441, -12.762595176696777, -12.382824897766113, -12.00305461883545, -11.623283386230469, -11.243513107299805, -10.86374282836914, -10.483972549438477, -10.104202270507812, -9.724431991577148, -9.344661712646484, -8.96489143371582, -8.585121154785156, -8.205350875854492, -7.825580596923828, -7.445810317993164, -7.0660400390625, -6.686269760131836, -6.306499481201172, -5.926729202270508, -5.5469584465026855, -5.1671881675720215, -4.787417888641357, -4.407647609710693, -4.027877330780029, -3.648106813430786, -3.268336534500122, -2.888566255569458, -2.508795738220215, -2.129025459289551, -1.7492551803588867, -1.3694849014282227, -0.989714503288269, -0.6099441051483154, -0.23017382621765137, 0.1495964527130127, 0.5293669700622559, 0.9091372489929199, 1.288907527923584, 1.668677806854248, 2.048448085784912, 2.4282186031341553, 2.8079888820648193, 3.1877591609954834, 3.5675296783447266, 3.9472999572753906, 4.327070236206055, 4.706840515136719, 5.086610794067383, 5.466381072998047, 5.846151351928711, 6.225921630859375, 6.605692386627197, 6.985462665557861, 7.365232944488525, 7.7450032234191895, 8.124773979187012, 8.504544258117676, 8.88431453704834, 9.264084815979004, 9.643855094909668, 10.023625373840332, 10.403395652770996]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 12.0, 22.0, 36.0, 45.0, 72.0, 101.0, 129.0, 148.0, 127.0, 105.0, 72.0, 41.0, 24.0, 20.0, 11.0, 15.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5066299438476562, -0.4839630126953125, -0.46129608154296875, -0.438629150390625, -0.41596221923828125, -0.3932952880859375, -0.37062835693359375, -0.34796142578125, -0.32529449462890625, -0.3026275634765625, -0.27996063232421875, -0.257293701171875, -0.23462677001953125, -0.2119598388671875, -0.18929290771484375, -0.1666259765625, -0.14395904541015625, -0.1212921142578125, -0.09862518310546875, -0.075958251953125, -0.05329132080078125, -0.0306243896484375, -0.00795745849609375, 0.01470947265625, 0.03737640380859375, 0.0600433349609375, 0.08271026611328125, 0.105377197265625, 0.12804412841796875, 0.1507110595703125, 0.17337799072265625, 0.196044921875, 0.21871185302734375, 0.2413787841796875, 0.26404571533203125, 0.286712646484375, 0.30937957763671875, 0.3320465087890625, 0.35471343994140625, 0.37738037109375, 0.40004730224609375, 0.4227142333984375, 0.44538116455078125, 0.468048095703125, 0.49071502685546875, 0.5133819580078125, 0.5360488891601562, 0.5587158203125, 0.5813827514648438, 0.6040496826171875, 0.6267166137695312, 0.649383544921875, 0.6720504760742188, 0.6947174072265625, 0.7173843383789062, 0.74005126953125, 0.7627182006835938, 0.7853851318359375, 0.8080520629882812, 0.830718994140625, 0.8533859252929688, 0.8760528564453125, 0.8987197875976562, 0.92138671875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 15.0, 27.0, 49.0, 63.0, 116.0, 205.0, 327.0, 639.0, 1480.0, 3851.0, 13019.0, 57324.0, 248632.0, 154718.0, 31062.0, 7796.0, 2573.0, 1010.0, 556.0, 279.0, 163.0, 104.0, 72.0, 39.0, 42.0, 27.0, 15.0, 16.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.40625, -8.1143798828125, -7.822509765625, -7.5306396484375, -7.23876953125, -6.9468994140625, -6.655029296875, -6.3631591796875, -6.0712890625, -5.7794189453125, -5.487548828125, -5.1956787109375, -4.90380859375, -4.6119384765625, -4.320068359375, -4.0281982421875, -3.736328125, -3.4444580078125, -3.152587890625, -2.8607177734375, -2.56884765625, -2.2769775390625, -1.985107421875, -1.6932373046875, -1.4013671875, -1.1094970703125, -0.817626953125, -0.5257568359375, -0.23388671875, 0.0579833984375, 0.349853515625, 0.6417236328125, 0.93359375, 1.2254638671875, 1.517333984375, 1.8092041015625, 2.10107421875, 2.3929443359375, 2.684814453125, 2.9766845703125, 3.2685546875, 3.5604248046875, 3.852294921875, 4.1441650390625, 4.43603515625, 4.7279052734375, 5.019775390625, 5.3116455078125, 5.603515625, 5.8953857421875, 6.187255859375, 6.4791259765625, 6.77099609375, 7.0628662109375, 7.354736328125, 7.6466064453125, 7.9384765625, 8.2303466796875, 8.522216796875, 8.8140869140625, 9.10595703125, 9.3978271484375, 9.689697265625, 9.9815673828125, 10.2734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 10.0, 14.0, 15.0, 22.0, 18.0, 46.0, 46.0, 45.0, 61.0, 66.0, 77.0, 70.0, 96.0, 78.0, 60.0, 57.0, 51.0, 38.0, 34.0, 16.0, 18.0, 10.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9661712646484375, -0.926483154296875, -0.8867950439453125, -0.84710693359375, -0.8074188232421875, -0.767730712890625, -0.7280426025390625, -0.6883544921875, -0.6486663818359375, -0.608978271484375, -0.5692901611328125, -0.52960205078125, -0.4899139404296875, -0.450225830078125, -0.4105377197265625, -0.370849609375, -0.3311614990234375, -0.291473388671875, -0.2517852783203125, -0.21209716796875, -0.1724090576171875, -0.132720947265625, -0.0930328369140625, -0.0533447265625, -0.0136566162109375, 0.026031494140625, 0.0657196044921875, 0.10540771484375, 0.1450958251953125, 0.184783935546875, 0.2244720458984375, 0.26416015625, 0.3038482666015625, 0.343536376953125, 0.3832244873046875, 0.42291259765625, 0.4626007080078125, 0.502288818359375, 0.5419769287109375, 0.5816650390625, 0.6213531494140625, 0.661041259765625, 0.7007293701171875, 0.74041748046875, 0.7801055908203125, 0.819793701171875, 0.8594818115234375, 0.899169921875, 0.9388580322265625, 0.978546142578125, 1.0182342529296875, 1.05792236328125, 1.0976104736328125, 1.137298583984375, 1.1769866943359375, 1.2166748046875, 1.2563629150390625, 1.296051025390625, 1.3357391357421875, 1.37542724609375, 1.4151153564453125, 1.454803466796875, 1.4944915771484375, 1.5341796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 13.0, 31.0, 38.0, 72.0, 84.0, 75.0, 69.0, 25.0, 24.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.710701942443848, -6.456543922424316, -6.202386379241943, -5.94822883605957, -5.694070816040039, -5.439912796020508, -5.185755252838135, -4.931597709655762, -4.6774396896362305, -4.423281669616699, -4.169124126434326, -3.914966344833374, -3.660808563232422, -3.4066507816314697, -3.1524930000305176, -2.8983352184295654, -2.6441774368286133, -2.390019655227661, -2.135861873626709, -1.8817040920257568, -1.6275463104248047, -1.3733885288238525, -1.1192307472229004, -0.8650729656219482, -0.6109151840209961, -0.35675740242004395, -0.1025996208190918, 0.15155816078186035, 0.4057159423828125, 0.6598737239837646, 0.9140315055847168, 1.168189287185669, 1.4223461151123047, 1.6765038967132568, 1.930661678314209, 2.184819459915161, 2.4389772415161133, 2.6931350231170654, 2.9472928047180176, 3.2014505863189697, 3.455608367919922, 3.709766149520874, 3.963923931121826, 4.218081474304199, 4.4722394943237305, 4.726397514343262, 4.980555057525635, 5.234712600708008, 5.488870620727539, 5.74302864074707, 5.997186183929443, 6.251343727111816, 6.505501747131348, 6.759659767150879, 7.013817310333252, 7.267974853515625, 7.522132873535156, 7.7762908935546875, 8.030448913574219, 8.284605979919434, 8.538763999938965, 8.792922019958496, 9.047079086303711, 9.301237106323242, 9.555395126342773]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 14.0, 27.0, 25.0, 44.0, 51.0, 81.0, 64.0, 26.0, 30.0, 28.0, 13.0, 10.0, 5.0, 5.0, 5.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8963820934295654, -3.7414605617523193, -3.5865390300750732, -3.431617498397827, -3.27669620513916, -3.121774673461914, -2.966853141784668, -2.811931610107422, -2.657010078430176, -2.5020885467529297, -2.3471670150756836, -2.1922454833984375, -2.0373239517211914, -1.8824025392532349, -1.7274811267852783, -1.5725595951080322, -1.4176380634307861, -1.26271653175354, -1.107795000076294, -0.9528735876083374, -0.7979520559310913, -0.6430305242538452, -0.4881090521812439, -0.3331875801086426, -0.17826604843139648, -0.02334454655647278, 0.13157695531845093, 0.28649845719337463, 0.44141995906829834, 0.5963414907455444, 0.7512629628181458, 0.9061844348907471, 1.061105728149414, 1.2160272598266602, 1.3709487915039062, 1.5258702039718628, 1.6807917356491089, 1.835713267326355, 1.9906346797943115, 2.1455562114715576, 2.3004777431488037, 2.45539927482605, 2.610320806503296, 2.765242338180542, 2.920163631439209, 3.075085163116455, 3.230006694793701, 3.3849282264709473, 3.5398497581481934, 3.6947712898254395, 3.8496928215026855, 4.004614353179932, 4.159535884857178, 4.314457416534424, 4.46937894821167, 4.624300003051758, 4.779221534729004, 4.93414306640625, 5.089064598083496, 5.243986129760742, 5.398907661437988, 5.553829193115234, 5.7087507247924805, 5.863672256469727, 6.018593788146973]}, "eval/loss": 4.259941577911377, "eval/wer": 1.0190995636652123, "eval/runtime": 524.0014, "eval/samples_per_second": 5.042, "eval/steps_per_second": 0.632, "train/train_runtime": 51677.5666, "train/train_samples_per_second": 5.522, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 4.09313003856505}