diff --git "a/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" --- "a/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" +++ "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.4525, "train/learning_rate": 2.7185915492957747e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 17953, "_timestamp": 1647962455, "_step": 3001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 14.0, 12.0, 15.0, 16.0, 23.0, 17.0, 19.0, 32.0, 35.0, 36.0, 39.0, 33.0, 39.0, 48.0, 45.0, 42.0, 53.0, 52.0, 45.0, 35.0, 35.0, 33.0, 34.0, 37.0, 39.0, 28.0, 24.0, 14.0, 22.0, 12.0, 7.0, 8.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.77167510986328, -28.803977966308594, -27.836280822753906, -26.86858367919922, -25.90088653564453, -24.933189392089844, -23.965492248535156, -22.99779510498047, -22.03009796142578, -21.062400817871094, -20.094703674316406, -19.12700653076172, -18.15930938720703, -17.191612243652344, -16.223915100097656, -15.256217956542969, -14.288521766662598, -13.32082462310791, -12.353127479553223, -11.385430335998535, -10.417733192443848, -9.450037002563477, -8.482339859008789, -7.514642238616943, -6.546945095062256, -5.579247951507568, -4.611550807952881, -3.6438539028167725, -2.676156759262085, -1.7084598541259766, -0.7407627105712891, 0.22693443298339844, 1.194631576538086, 2.1623287200927734, 3.130025863647461, 4.097723007202148, 5.065420150756836, 6.033116817474365, 7.000813961029053, 7.96851110458374, 8.936208724975586, 9.903905868530273, 10.871603012084961, 11.839300155639648, 12.806997299194336, 13.774694442749023, 14.742391586303711, 15.710088729858398, 16.677783966064453, 17.64548110961914, 18.613178253173828, 19.580875396728516, 20.548572540283203, 21.51626968383789, 22.483966827392578, 23.451663970947266, 24.419361114501953, 25.38705825805664, 26.354755401611328, 27.322452545166016, 28.290149688720703, 29.25784683227539, 30.225543975830078, 31.193241119384766, 32.16093826293945]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 6.0, 9.0, 11.0, 14.0, 15.0, 18.0, 20.0, 23.0, 16.0, 29.0, 33.0, 37.0, 24.0, 32.0, 27.0, 35.0, 32.0, 44.0, 49.0, 45.0, 31.0, 35.0, 45.0, 37.0, 35.0, 40.0, 25.0, 29.0, 18.0, 19.0, 23.0, 23.0, 18.0, 14.0, 16.0, 12.0, 8.0, 9.0, 8.0, 10.0, 2.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.996685028076172, -25.12548828125, -24.254291534423828, -23.383094787597656, -22.511898040771484, -21.640701293945312, -20.76950454711914, -19.898305892944336, -19.027109146118164, -18.155912399291992, -17.28471565246582, -16.41351890563965, -15.54232120513916, -14.671124458312988, -13.799927711486816, -12.928730010986328, -12.057534217834473, -11.1863374710083, -10.315140724182129, -9.44394302368164, -8.572746276855469, -7.701549530029297, -6.830352783203125, -5.959155559539795, -5.087958812713623, -4.216762065887451, -3.345564842224121, -2.474368095397949, -1.6031711101531982, -0.7319741249084473, 0.1392226219177246, 1.0104198455810547, 1.8816165924072266, 2.7528135776519775, 3.6240105628967285, 4.4952073097229, 5.3664045333862305, 6.237601280212402, 7.108798027038574, 7.979995250701904, 8.851192474365234, 9.722389221191406, 10.593585968017578, 11.46478271484375, 12.335980415344238, 13.20717716217041, 14.078373908996582, 14.94957160949707, 15.820767402648926, 16.691965103149414, 17.563161849975586, 18.434358596801758, 19.30555534362793, 20.1767520904541, 21.047948837280273, 21.919145584106445, 22.790342330932617, 23.66153907775879, 24.53273582458496, 25.403932571411133, 26.275129318237305, 27.14632797241211, 28.01752471923828, 28.888721466064453, 29.759918212890625]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 15.0, 11.0, 24.0, 32.0, 42.0, 69.0, 121.0, 236.0, 318.0, 556.0, 867.0, 1414.0, 2515.0, 4302.0, 7574.0, 13292.0, 24470.0, 44917.0, 83028.0, 154579.0, 276027.0, 451581.0, 633359.0, 718607.0, 644385.0, 470864.0, 295488.0, 166385.0, 90777.0, 49126.0, 26160.0, 14230.0, 8049.0, 4539.0, 2524.0, 1498.0, 882.0, 563.0, 312.0, 193.0, 134.0, 76.0, 52.0, 30.0, 20.0, 15.0, 13.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.21875, -21.556640625, -20.89453125, -20.232421875, -19.5703125, -18.908203125, -18.24609375, -17.583984375, -16.921875, -16.259765625, -15.59765625, -14.935546875, -14.2734375, -13.611328125, -12.94921875, -12.287109375, -11.625, -10.962890625, -10.30078125, -9.638671875, -8.9765625, -8.314453125, -7.65234375, -6.990234375, -6.328125, -5.666015625, -5.00390625, -4.341796875, -3.6796875, -3.017578125, -2.35546875, -1.693359375, -1.03125, -0.369140625, 0.29296875, 0.955078125, 1.6171875, 2.279296875, 2.94140625, 3.603515625, 4.265625, 4.927734375, 5.58984375, 6.251953125, 6.9140625, 7.576171875, 8.23828125, 8.900390625, 9.5625, 10.224609375, 10.88671875, 11.548828125, 12.2109375, 12.873046875, 13.53515625, 14.197265625, 14.859375, 15.521484375, 16.18359375, 16.845703125, 17.5078125, 18.169921875, 18.83203125, 19.494140625, 20.15625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 6.0, 5.0, 9.0, 7.0, 17.0, 9.0, 14.0, 12.0, 17.0, 14.0, 15.0, 22.0, 31.0, 17.0, 23.0, 30.0, 39.0, 30.0, 39.0, 29.0, 42.0, 31.0, 37.0, 39.0, 24.0, 37.0, 35.0, 35.0, 21.0, 26.0, 31.0, 33.0, 24.0, 37.0, 21.0, 19.0, 20.0, 11.0, 14.0, 21.0, 10.0, 4.0, 7.0, 8.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-19.640625, -19.005126953125, -18.36962890625, -17.734130859375, -17.0986328125, -16.463134765625, -15.82763671875, -15.192138671875, -14.556640625, -13.921142578125, -13.28564453125, -12.650146484375, -12.0146484375, -11.379150390625, -10.74365234375, -10.108154296875, -9.47265625, -8.837158203125, -8.20166015625, -7.566162109375, -6.9306640625, -6.295166015625, -5.65966796875, -5.024169921875, -4.388671875, -3.753173828125, -3.11767578125, -2.482177734375, -1.8466796875, -1.211181640625, -0.57568359375, 0.059814453125, 0.6953125, 1.330810546875, 1.96630859375, 2.601806640625, 3.2373046875, 3.872802734375, 4.50830078125, 5.143798828125, 5.779296875, 6.414794921875, 7.05029296875, 7.685791015625, 8.3212890625, 8.956787109375, 9.59228515625, 10.227783203125, 10.86328125, 11.498779296875, 12.13427734375, 12.769775390625, 13.4052734375, 14.040771484375, 14.67626953125, 15.311767578125, 15.947265625, 16.582763671875, 17.21826171875, 17.853759765625, 18.4892578125, 19.124755859375, 19.76025390625, 20.395751953125, 21.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 12.0, 10.0, 13.0, 15.0, 34.0, 48.0, 80.0, 120.0, 136.0, 261.0, 409.0, 593.0, 884.0, 1414.0, 2157.0, 3457.0, 5359.0, 8173.0, 12487.0, 19342.0, 29995.0, 45820.0, 69398.0, 103265.0, 151915.0, 218832.0, 303579.0, 404250.0, 499370.0, 534496.0, 481463.0, 383711.0, 287391.0, 203749.0, 141630.0, 96252.0, 63868.0, 42215.0, 27500.0, 17956.0, 11545.0, 7495.0, 4894.0, 3158.0, 1936.0, 1290.0, 795.0, 549.0, 338.0, 221.0, 142.0, 82.0, 63.0, 57.0, 26.0, 22.0, 7.0, 7.0, 6.0, 8.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.1083984375, -15.560546875, -15.0126953125, -14.46484375, -13.9169921875, -13.369140625, -12.8212890625, -12.2734375, -11.7255859375, -11.177734375, -10.6298828125, -10.08203125, -9.5341796875, -8.986328125, -8.4384765625, -7.890625, -7.3427734375, -6.794921875, -6.2470703125, -5.69921875, -5.1513671875, -4.603515625, -4.0556640625, -3.5078125, -2.9599609375, -2.412109375, -1.8642578125, -1.31640625, -0.7685546875, -0.220703125, 0.3271484375, 0.875, 1.4228515625, 1.970703125, 2.5185546875, 3.06640625, 3.6142578125, 4.162109375, 4.7099609375, 5.2578125, 5.8056640625, 6.353515625, 6.9013671875, 7.44921875, 7.9970703125, 8.544921875, 9.0927734375, 9.640625, 10.1884765625, 10.736328125, 11.2841796875, 11.83203125, 12.3798828125, 12.927734375, 13.4755859375, 14.0234375, 14.5712890625, 15.119140625, 15.6669921875, 16.21484375, 16.7626953125, 17.310546875, 17.8583984375, 18.40625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 2.0, 8.0, 13.0, 17.0, 22.0, 28.0, 35.0, 57.0, 58.0, 70.0, 63.0, 91.0, 118.0, 127.0, 161.0, 184.0, 237.0, 211.0, 236.0, 248.0, 249.0, 250.0, 258.0, 201.0, 175.0, 138.0, 141.0, 129.0, 98.0, 81.0, 59.0, 63.0, 46.0, 41.0, 27.0, 29.0, 22.0, 12.0, 13.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.00390625, -7.71875, -7.43359375, -7.1484375, -6.86328125, -6.578125, -6.29296875, -6.0078125, -5.72265625, -5.4375, -5.15234375, -4.8671875, -4.58203125, -4.296875, -4.01171875, -3.7265625, -3.44140625, -3.15625, -2.87109375, -2.5859375, -2.30078125, -2.015625, -1.73046875, -1.4453125, -1.16015625, -0.875, -0.58984375, -0.3046875, -0.01953125, 0.265625, 0.55078125, 0.8359375, 1.12109375, 1.40625, 1.69140625, 1.9765625, 2.26171875, 2.546875, 2.83203125, 3.1171875, 3.40234375, 3.6875, 3.97265625, 4.2578125, 4.54296875, 4.828125, 5.11328125, 5.3984375, 5.68359375, 5.96875, 6.25390625, 6.5390625, 6.82421875, 7.109375, 7.39453125, 7.6796875, 7.96484375, 8.25, 8.53515625, 8.8203125, 9.10546875, 9.390625, 9.67578125, 9.9609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 6.0, 15.0, 13.0, 16.0, 14.0, 32.0, 26.0, 26.0, 20.0, 38.0, 25.0, 27.0, 38.0, 38.0, 43.0, 44.0, 39.0, 41.0, 47.0, 43.0, 42.0, 33.0, 34.0, 37.0, 25.0, 33.0, 29.0, 20.0, 15.0, 18.0, 14.0, 20.0, 15.0, 8.0, 5.0, 6.0, 4.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.059850692749023, -20.349275588989258, -19.638700485229492, -18.928125381469727, -18.217548370361328, -17.506973266601562, -16.796398162841797, -16.08582305908203, -15.375247955322266, -14.6646728515625, -13.954097747802734, -13.243521690368652, -12.532946586608887, -11.822371482849121, -11.111795425415039, -10.401220321655273, -9.690645217895508, -8.980070114135742, -8.269495010375977, -7.5589189529418945, -6.848343849182129, -6.137768745422363, -5.4271931648254395, -4.716617584228516, -4.00604248046875, -3.2954671382904053, -2.5848917961120605, -1.8743164539337158, -1.163741111755371, -0.45316576957702637, 0.25740957260131836, 0.9679851531982422, 1.678558349609375, 2.3891336917877197, 3.0997090339660645, 3.810284376144409, 4.520859718322754, 5.2314348220825195, 5.942010402679443, 6.652585983276367, 7.363161087036133, 8.073736190795898, 8.784311294555664, 9.494887351989746, 10.205462455749512, 10.916037559509277, 11.62661361694336, 12.337188720703125, 13.04776382446289, 13.758338928222656, 14.468914031982422, 15.179490089416504, 15.89006519317627, 16.60064125061035, 17.311216354370117, 18.021791458129883, 18.73236656188965, 19.442941665649414, 20.15351676940918, 20.864091873168945, 21.574668884277344, 22.28524398803711, 22.995819091796875, 23.70639419555664, 24.416969299316406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 4.0, 17.0, 13.0, 11.0, 16.0, 14.0, 9.0, 18.0, 36.0, 29.0, 22.0, 42.0, 21.0, 44.0, 30.0, 28.0, 38.0, 37.0, 42.0, 36.0, 34.0, 46.0, 38.0, 32.0, 27.0, 34.0, 29.0, 28.0, 29.0, 25.0, 25.0, 22.0, 12.0, 14.0, 11.0, 8.0, 9.0, 4.0, 9.0, 12.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-22.522737503051758, -21.81505584716797, -21.10737419128418, -20.39969253540039, -19.6920108795166, -18.984329223632812, -18.276649475097656, -17.568967819213867, -16.861286163330078, -16.15360450744629, -15.4459228515625, -14.738241195678711, -14.030560493469238, -13.32287883758545, -12.61519718170166, -11.907516479492188, -11.199833869934082, -10.492152214050293, -9.784470558166504, -9.076789855957031, -8.369108200073242, -7.661426544189453, -6.953744888305664, -6.246063709259033, -5.538382053375244, -4.830700397491455, -4.123019218444824, -3.415337562561035, -2.707656145095825, -1.9999747276306152, -1.2922930717468262, -0.5846118927001953, 0.12306976318359375, 0.8307512402534485, 1.5384327173233032, 2.2461142539978027, 2.9537956714630127, 3.6614770889282227, 4.369158744812012, 5.076839923858643, 5.784521579742432, 6.492203235626221, 7.199884414672852, 7.907566070556641, 8.61524772644043, 9.322929382324219, 10.030611038208008, 10.73829174041748, 11.44597339630127, 12.153655052185059, 12.861336708068848, 13.56901741027832, 14.27669906616211, 14.984380722045898, 15.692062377929688, 16.399744033813477, 17.107425689697266, 17.815107345581055, 18.522789001464844, 19.230470657348633, 19.938152313232422, 20.645832061767578, 21.353515625, 22.061195373535156, 22.768877029418945]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 16.0, 20.0, 28.0, 45.0, 48.0, 74.0, 95.0, 165.0, 214.0, 377.0, 547.0, 762.0, 1239.0, 1817.0, 3017.0, 4966.0, 8138.0, 13982.0, 23896.0, 41118.0, 71847.0, 121867.0, 182671.0, 200374.0, 150262.0, 92502.0, 53442.0, 30278.0, 17718.0, 10470.0, 6186.0, 3694.0, 2253.0, 1529.0, 960.0, 655.0, 402.0, 250.0, 192.0, 131.0, 98.0, 64.0, 43.0, 26.0, 18.0, 9.0, 15.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.1953125, -10.8367919921875, -10.478271484375, -10.1197509765625, -9.76123046875, -9.4027099609375, -9.044189453125, -8.6856689453125, -8.3271484375, -7.9686279296875, -7.610107421875, -7.2515869140625, -6.89306640625, -6.5345458984375, -6.176025390625, -5.8175048828125, -5.458984375, -5.1004638671875, -4.741943359375, -4.3834228515625, -4.02490234375, -3.6663818359375, -3.307861328125, -2.9493408203125, -2.5908203125, -2.2322998046875, -1.873779296875, -1.5152587890625, -1.15673828125, -0.7982177734375, -0.439697265625, -0.0811767578125, 0.27734375, 0.6358642578125, 0.994384765625, 1.3529052734375, 1.71142578125, 2.0699462890625, 2.428466796875, 2.7869873046875, 3.1455078125, 3.5040283203125, 3.862548828125, 4.2210693359375, 4.57958984375, 4.9381103515625, 5.296630859375, 5.6551513671875, 6.013671875, 6.3721923828125, 6.730712890625, 7.0892333984375, 7.44775390625, 7.8062744140625, 8.164794921875, 8.5233154296875, 8.8818359375, 9.2403564453125, 9.598876953125, 9.9573974609375, 10.31591796875, 10.6744384765625, 11.032958984375, 11.3914794921875, 11.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 12.0, 14.0, 12.0, 14.0, 20.0, 16.0, 14.0, 18.0, 25.0, 42.0, 30.0, 37.0, 37.0, 33.0, 49.0, 39.0, 22.0, 38.0, 44.0, 36.0, 42.0, 40.0, 33.0, 27.0, 30.0, 34.0, 27.0, 35.0, 15.0, 18.0, 17.0, 14.0, 16.0, 13.0, 8.0, 6.0, 10.0, 10.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-23.65625, -22.94873046875, -22.2412109375, -21.53369140625, -20.826171875, -20.11865234375, -19.4111328125, -18.70361328125, -17.99609375, -17.28857421875, -16.5810546875, -15.87353515625, -15.166015625, -14.45849609375, -13.7509765625, -13.04345703125, -12.3359375, -11.62841796875, -10.9208984375, -10.21337890625, -9.505859375, -8.79833984375, -8.0908203125, -7.38330078125, -6.67578125, -5.96826171875, -5.2607421875, -4.55322265625, -3.845703125, -3.13818359375, -2.4306640625, -1.72314453125, -1.015625, -0.30810546875, 0.3994140625, 1.10693359375, 1.814453125, 2.52197265625, 3.2294921875, 3.93701171875, 4.64453125, 5.35205078125, 6.0595703125, 6.76708984375, 7.474609375, 8.18212890625, 8.8896484375, 9.59716796875, 10.3046875, 11.01220703125, 11.7197265625, 12.42724609375, 13.134765625, 13.84228515625, 14.5498046875, 15.25732421875, 15.96484375, 16.67236328125, 17.3798828125, 18.08740234375, 18.794921875, 19.50244140625, 20.2099609375, 20.91748046875, 21.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 15.0, 25.0, 35.0, 55.0, 79.0, 127.0, 195.0, 293.0, 513.0, 856.0, 1405.0, 2497.0, 4565.0, 8636.0, 17420.0, 36332.0, 78040.0, 159764.0, 255419.0, 232008.0, 129801.0, 61420.0, 28865.0, 13921.0, 7116.0, 3805.0, 2095.0, 1234.0, 737.0, 466.0, 308.0, 161.0, 122.0, 58.0, 51.0, 31.0, 22.0, 17.0, 9.0, 7.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.7161865234375, -9.401123046875, -9.0860595703125, -8.77099609375, -8.4559326171875, -8.140869140625, -7.8258056640625, -7.5107421875, -7.1956787109375, -6.880615234375, -6.5655517578125, -6.25048828125, -5.9354248046875, -5.620361328125, -5.3052978515625, -4.990234375, -4.6751708984375, -4.360107421875, -4.0450439453125, -3.72998046875, -3.4149169921875, -3.099853515625, -2.7847900390625, -2.4697265625, -2.1546630859375, -1.839599609375, -1.5245361328125, -1.20947265625, -0.8944091796875, -0.579345703125, -0.2642822265625, 0.05078125, 0.3658447265625, 0.680908203125, 0.9959716796875, 1.31103515625, 1.6260986328125, 1.941162109375, 2.2562255859375, 2.5712890625, 2.8863525390625, 3.201416015625, 3.5164794921875, 3.83154296875, 4.1466064453125, 4.461669921875, 4.7767333984375, 5.091796875, 5.4068603515625, 5.721923828125, 6.0369873046875, 6.35205078125, 6.6671142578125, 6.982177734375, 7.2972412109375, 7.6123046875, 7.9273681640625, 8.242431640625, 8.5574951171875, 8.87255859375, 9.1876220703125, 9.502685546875, 9.8177490234375, 10.1328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 7.0, 10.0, 8.0, 14.0, 15.0, 17.0, 19.0, 32.0, 25.0, 20.0, 39.0, 34.0, 46.0, 28.0, 33.0, 37.0, 37.0, 42.0, 48.0, 54.0, 37.0, 44.0, 28.0, 37.0, 48.0, 32.0, 33.0, 26.0, 22.0, 14.0, 18.0, 20.0, 11.0, 15.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.4267578125, -18.806640625, -18.1865234375, -17.56640625, -16.9462890625, -16.326171875, -15.7060546875, -15.0859375, -14.4658203125, -13.845703125, -13.2255859375, -12.60546875, -11.9853515625, -11.365234375, -10.7451171875, -10.125, -9.5048828125, -8.884765625, -8.2646484375, -7.64453125, -7.0244140625, -6.404296875, -5.7841796875, -5.1640625, -4.5439453125, -3.923828125, -3.3037109375, -2.68359375, -2.0634765625, -1.443359375, -0.8232421875, -0.203125, 0.4169921875, 1.037109375, 1.6572265625, 2.27734375, 2.8974609375, 3.517578125, 4.1376953125, 4.7578125, 5.3779296875, 5.998046875, 6.6181640625, 7.23828125, 7.8583984375, 8.478515625, 9.0986328125, 9.71875, 10.3388671875, 10.958984375, 11.5791015625, 12.19921875, 12.8193359375, 13.439453125, 14.0595703125, 14.6796875, 15.2998046875, 15.919921875, 16.5400390625, 17.16015625, 17.7802734375, 18.400390625, 19.0205078125, 19.640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 6.0, 1.0, 4.0, 8.0, 12.0, 13.0, 34.0, 35.0, 61.0, 110.0, 135.0, 172.0, 286.0, 431.0, 578.0, 818.0, 1198.0, 1778.0, 2580.0, 3860.0, 6522.0, 11365.0, 21195.0, 46306.0, 132379.0, 411957.0, 259734.0, 76535.0, 31378.0, 15469.0, 8580.0, 5063.0, 3174.0, 2117.0, 1400.0, 989.0, 681.0, 456.0, 393.0, 245.0, 167.0, 114.0, 75.0, 56.0, 36.0, 22.0, 14.0, 7.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.66796875, -4.52099609375, -4.3740234375, -4.22705078125, -4.080078125, -3.93310546875, -3.7861328125, -3.63916015625, -3.4921875, -3.34521484375, -3.1982421875, -3.05126953125, -2.904296875, -2.75732421875, -2.6103515625, -2.46337890625, -2.31640625, -2.16943359375, -2.0224609375, -1.87548828125, -1.728515625, -1.58154296875, -1.4345703125, -1.28759765625, -1.140625, -0.99365234375, -0.8466796875, -0.69970703125, -0.552734375, -0.40576171875, -0.2587890625, -0.11181640625, 0.03515625, 0.18212890625, 0.3291015625, 0.47607421875, 0.623046875, 0.77001953125, 0.9169921875, 1.06396484375, 1.2109375, 1.35791015625, 1.5048828125, 1.65185546875, 1.798828125, 1.94580078125, 2.0927734375, 2.23974609375, 2.38671875, 2.53369140625, 2.6806640625, 2.82763671875, 2.974609375, 3.12158203125, 3.2685546875, 3.41552734375, 3.5625, 3.70947265625, 3.8564453125, 4.00341796875, 4.150390625, 4.29736328125, 4.4443359375, 4.59130859375, 4.73828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 12.0, 16.0, 20.0, 26.0, 29.0, 51.0, 99.0, 119.0, 128.0, 128.0, 104.0, 69.0, 55.0, 32.0, 22.0, 17.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008611679077148438, -0.000834144651889801, -0.0008071213960647583, -0.0007800981402397156, -0.0007530748844146729, -0.0007260516285896301, -0.0006990283727645874, -0.0006720051169395447, -0.000644981861114502, -0.0006179586052894592, -0.0005909353494644165, -0.0005639120936393738, -0.0005368888378143311, -0.0005098655819892883, -0.0004828423261642456, -0.0004558190703392029, -0.00042879581451416016, -0.00040177255868911743, -0.0003747493028640747, -0.000347726047039032, -0.00032070279121398926, -0.00029367953538894653, -0.0002666562795639038, -0.00023963302373886108, -0.00021260976791381836, -0.00018558651208877563, -0.0001585632562637329, -0.00013154000043869019, -0.00010451674461364746, -7.749348878860474e-05, -5.047023296356201e-05, -2.3446977138519287e-05, 3.5762786865234375e-06, 3.059953451156616e-05, 5.762279033660889e-05, 8.464604616165161e-05, 0.00011166930198669434, 0.00013869255781173706, 0.00016571581363677979, 0.0001927390694618225, 0.00021976232528686523, 0.00024678558111190796, 0.0002738088369369507, 0.0003008320927619934, 0.00032785534858703613, 0.00035487860441207886, 0.0003819018602371216, 0.0004089251160621643, 0.00043594837188720703, 0.00046297162771224976, 0.0004899948835372925, 0.0005170181393623352, 0.0005440413951873779, 0.0005710646510124207, 0.0005980879068374634, 0.0006251111626625061, 0.0006521344184875488, 0.0006791576743125916, 0.0007061809301376343, 0.000733204185962677, 0.0007602274417877197, 0.0007872506976127625, 0.0008142739534378052, 0.0008412972092628479, 0.0008683204650878906]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 12.0, 16.0, 14.0, 34.0, 43.0, 72.0, 81.0, 144.0, 192.0, 319.0, 418.0, 666.0, 998.0, 1497.0, 2489.0, 4024.0, 6641.0, 11711.0, 21656.0, 43078.0, 86395.0, 171776.0, 270644.0, 205776.0, 106411.0, 52093.0, 26702.0, 14208.0, 7847.0, 4597.0, 2814.0, 1783.0, 1099.0, 745.0, 499.0, 338.0, 232.0, 153.0, 115.0, 80.0, 49.0, 27.0, 20.0, 17.0, 13.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.98284912109375, -3.8485107421875, -3.71417236328125, -3.579833984375, -3.44549560546875, -3.3111572265625, -3.17681884765625, -3.04248046875, -2.90814208984375, -2.7738037109375, -2.63946533203125, -2.505126953125, -2.37078857421875, -2.2364501953125, -2.10211181640625, -1.9677734375, -1.83343505859375, -1.6990966796875, -1.56475830078125, -1.430419921875, -1.29608154296875, -1.1617431640625, -1.02740478515625, -0.89306640625, -0.75872802734375, -0.6243896484375, -0.49005126953125, -0.355712890625, -0.22137451171875, -0.0870361328125, 0.04730224609375, 0.181640625, 0.31597900390625, 0.4503173828125, 0.58465576171875, 0.718994140625, 0.85333251953125, 0.9876708984375, 1.12200927734375, 1.25634765625, 1.39068603515625, 1.5250244140625, 1.65936279296875, 1.793701171875, 1.92803955078125, 2.0623779296875, 2.19671630859375, 2.3310546875, 2.46539306640625, 2.5997314453125, 2.73406982421875, 2.868408203125, 3.00274658203125, 3.1370849609375, 3.27142333984375, 3.40576171875, 3.54010009765625, 3.6744384765625, 3.80877685546875, 3.943115234375, 4.07745361328125, 4.2117919921875, 4.34613037109375, 4.48046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 2.0, 4.0, 6.0, 14.0, 8.0, 6.0, 14.0, 23.0, 21.0, 29.0, 48.0, 42.0, 63.0, 84.0, 96.0, 88.0, 76.0, 79.0, 56.0, 64.0, 30.0, 29.0, 21.0, 16.0, 13.0, 11.0, 9.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8544921875, -1.8017730712890625, -1.749053955078125, -1.6963348388671875, -1.64361572265625, -1.5908966064453125, -1.538177490234375, -1.4854583740234375, -1.4327392578125, -1.3800201416015625, -1.327301025390625, -1.2745819091796875, -1.22186279296875, -1.1691436767578125, -1.116424560546875, -1.0637054443359375, -1.010986328125, -0.9582672119140625, -0.905548095703125, -0.8528289794921875, -0.80010986328125, -0.7473907470703125, -0.694671630859375, -0.6419525146484375, -0.5892333984375, -0.5365142822265625, -0.483795166015625, -0.4310760498046875, -0.37835693359375, -0.3256378173828125, -0.272918701171875, -0.2201995849609375, -0.16748046875, -0.1147613525390625, -0.062042236328125, -0.0093231201171875, 0.04339599609375, 0.0961151123046875, 0.148834228515625, 0.2015533447265625, 0.2542724609375, 0.3069915771484375, 0.359710693359375, 0.4124298095703125, 0.46514892578125, 0.5178680419921875, 0.570587158203125, 0.6233062744140625, 0.676025390625, 0.7287445068359375, 0.781463623046875, 0.8341827392578125, 0.88690185546875, 0.9396209716796875, 0.992340087890625, 1.0450592041015625, 1.0977783203125, 1.1504974365234375, 1.203216552734375, 1.2559356689453125, 1.30865478515625, 1.3613739013671875, 1.414093017578125, 1.4668121337890625, 1.51953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 13.0, 9.0, 12.0, 11.0, 26.0, 32.0, 25.0, 24.0, 34.0, 32.0, 29.0, 29.0, 38.0, 43.0, 42.0, 61.0, 34.0, 45.0, 37.0, 52.0, 36.0, 37.0, 37.0, 33.0, 33.0, 25.0, 22.0, 20.0, 19.0, 16.0, 14.0, 15.0, 6.0, 7.0, 8.0, 6.0, 7.0, 5.0, 4.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.369163513183594, -19.670391082763672, -18.971620559692383, -18.27284812927246, -17.574077606201172, -16.87530517578125, -16.176532745361328, -15.477762222290039, -14.778990745544434, -14.080219268798828, -13.381447792053223, -12.682676315307617, -11.983903884887695, -11.285133361816406, -10.586360931396484, -9.887589454650879, -9.188817977905273, -8.490046501159668, -7.7912750244140625, -7.092503070831299, -6.393731594085693, -5.694960117340088, -4.996188163757324, -4.297416687011719, -3.5986452102661133, -2.899873733520508, -2.2011020183563232, -1.5023303031921387, -0.8035588264465332, -0.10478734970092773, 0.5939846038818359, 1.2927560806274414, 1.991525650024414, 2.6902971267700195, 3.389068841934204, 4.087840557098389, 4.786612033843994, 5.4853835105896, 6.184155464172363, 6.882926940917969, 7.581698417663574, 8.28046989440918, 8.979241371154785, 9.67801284790039, 10.376785278320312, 11.075555801391602, 11.774328231811523, 12.473099708557129, 13.171871185302734, 13.87064266204834, 14.569414138793945, 15.268186569213867, 15.966957092285156, 16.665729522705078, 17.364501953125, 18.06327247619629, 18.762042999267578, 19.4608154296875, 20.15958595275879, 20.85835838317871, 21.55712890625, 22.255901336669922, 22.954673767089844, 23.653444290161133, 24.352216720581055]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 5.0, 3.0, 8.0, 5.0, 11.0, 8.0, 13.0, 10.0, 16.0, 14.0, 20.0, 15.0, 33.0, 29.0, 26.0, 26.0, 34.0, 33.0, 40.0, 31.0, 31.0, 32.0, 40.0, 44.0, 34.0, 36.0, 37.0, 35.0, 29.0, 34.0, 28.0, 30.0, 24.0, 28.0, 27.0, 20.0, 19.0, 10.0, 9.0, 8.0, 6.0, 9.0, 8.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-20.63979721069336, -19.99089813232422, -19.341999053955078, -18.69310188293457, -18.04420280456543, -17.39530372619629, -16.74640464782715, -16.097505569458008, -15.448607444763184, -14.799708366394043, -14.150810241699219, -13.501911163330078, -12.853012084960938, -12.204113960266113, -11.555214881896973, -10.906316757202148, -10.257417678833008, -9.608518600463867, -8.959620475769043, -8.310721397399902, -7.66182279586792, -7.0129241943359375, -6.364025115966797, -5.7151265144348145, -5.066227912902832, -4.41732931137085, -3.768430471420288, -3.1195316314697266, -2.470633029937744, -1.8217344284057617, -1.1728355884552002, -0.5239367485046387, 0.12496376037597656, 0.7738624811172485, 1.4227612018585205, 2.071660041809082, 2.7205586433410645, 3.369457244873047, 4.0183563232421875, 4.66725492477417, 5.316153526306152, 5.965052127838135, 6.613950729370117, 7.262849807739258, 7.91174840927124, 8.560647010803223, 9.209546089172363, 9.858444213867188, 10.507343292236328, 11.156242370605469, 11.805140495300293, 12.454039573669434, 13.102937698364258, 13.751836776733398, 14.400735855102539, 15.04963493347168, 15.698533058166504, 16.347431182861328, 16.99633026123047, 17.64522933959961, 18.29412841796875, 18.94302749633789, 19.5919246673584, 20.24082374572754, 20.88972282409668]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 12.0, 16.0, 18.0, 32.0, 51.0, 77.0, 147.0, 210.0, 328.0, 591.0, 1044.0, 1664.0, 2795.0, 4839.0, 8296.0, 14311.0, 23361.0, 38083.0, 59542.0, 85895.0, 113654.0, 133382.0, 137721.0, 124883.0, 100596.0, 72545.0, 48857.0, 30631.0, 18537.0, 10942.0, 6348.0, 3674.0, 2200.0, 1322.0, 732.0, 473.0, 277.0, 184.0, 109.0, 75.0, 42.0, 27.0, 18.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.308837890625, -18.64892578125, -17.989013671875, -17.3291015625, -16.669189453125, -16.00927734375, -15.349365234375, -14.689453125, -14.029541015625, -13.36962890625, -12.709716796875, -12.0498046875, -11.389892578125, -10.72998046875, -10.070068359375, -9.41015625, -8.750244140625, -8.09033203125, -7.430419921875, -6.7705078125, -6.110595703125, -5.45068359375, -4.790771484375, -4.130859375, -3.470947265625, -2.81103515625, -2.151123046875, -1.4912109375, -0.831298828125, -0.17138671875, 0.488525390625, 1.1484375, 1.808349609375, 2.46826171875, 3.128173828125, 3.7880859375, 4.447998046875, 5.10791015625, 5.767822265625, 6.427734375, 7.087646484375, 7.74755859375, 8.407470703125, 9.0673828125, 9.727294921875, 10.38720703125, 11.047119140625, 11.70703125, 12.366943359375, 13.02685546875, 13.686767578125, 14.3466796875, 15.006591796875, 15.66650390625, 16.326416015625, 16.986328125, 17.646240234375, 18.30615234375, 18.966064453125, 19.6259765625, 20.285888671875, 20.94580078125, 21.605712890625, 22.265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 4.0, 7.0, 8.0, 4.0, 9.0, 10.0, 9.0, 22.0, 19.0, 17.0, 25.0, 25.0, 29.0, 37.0, 34.0, 32.0, 44.0, 33.0, 36.0, 42.0, 34.0, 40.0, 35.0, 47.0, 32.0, 36.0, 35.0, 36.0, 36.0, 40.0, 21.0, 14.0, 21.0, 17.0, 17.0, 13.0, 12.0, 11.0, 12.0, 9.0, 5.0, 5.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-22.546875, -21.88330078125, -21.2197265625, -20.55615234375, -19.892578125, -19.22900390625, -18.5654296875, -17.90185546875, -17.23828125, -16.57470703125, -15.9111328125, -15.24755859375, -14.583984375, -13.92041015625, -13.2568359375, -12.59326171875, -11.9296875, -11.26611328125, -10.6025390625, -9.93896484375, -9.275390625, -8.61181640625, -7.9482421875, -7.28466796875, -6.62109375, -5.95751953125, -5.2939453125, -4.63037109375, -3.966796875, -3.30322265625, -2.6396484375, -1.97607421875, -1.3125, -0.64892578125, 0.0146484375, 0.67822265625, 1.341796875, 2.00537109375, 2.6689453125, 3.33251953125, 3.99609375, 4.65966796875, 5.3232421875, 5.98681640625, 6.650390625, 7.31396484375, 7.9775390625, 8.64111328125, 9.3046875, 9.96826171875, 10.6318359375, 11.29541015625, 11.958984375, 12.62255859375, 13.2861328125, 13.94970703125, 14.61328125, 15.27685546875, 15.9404296875, 16.60400390625, 17.267578125, 17.93115234375, 18.5947265625, 19.25830078125, 19.921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 14.0, 22.0, 39.0, 31.0, 56.0, 102.0, 148.0, 309.0, 461.0, 717.0, 1130.0, 1743.0, 2802.0, 4355.0, 6649.0, 10375.0, 15408.0, 22760.0, 32659.0, 45653.0, 61364.0, 78227.0, 93059.0, 104137.0, 107137.0, 102113.0, 90238.0, 74437.0, 57166.0, 42782.0, 30390.0, 20939.0, 14483.0, 9598.0, 6225.0, 4001.0, 2453.0, 1630.0, 1059.0, 650.0, 407.0, 246.0, 159.0, 87.0, 55.0, 28.0, 21.0, 9.0, 13.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.5, -17.891357421875, -17.28271484375, -16.674072265625, -16.0654296875, -15.456787109375, -14.84814453125, -14.239501953125, -13.630859375, -13.022216796875, -12.41357421875, -11.804931640625, -11.1962890625, -10.587646484375, -9.97900390625, -9.370361328125, -8.76171875, -8.153076171875, -7.54443359375, -6.935791015625, -6.3271484375, -5.718505859375, -5.10986328125, -4.501220703125, -3.892578125, -3.283935546875, -2.67529296875, -2.066650390625, -1.4580078125, -0.849365234375, -0.24072265625, 0.367919921875, 0.9765625, 1.585205078125, 2.19384765625, 2.802490234375, 3.4111328125, 4.019775390625, 4.62841796875, 5.237060546875, 5.845703125, 6.454345703125, 7.06298828125, 7.671630859375, 8.2802734375, 8.888916015625, 9.49755859375, 10.106201171875, 10.71484375, 11.323486328125, 11.93212890625, 12.540771484375, 13.1494140625, 13.758056640625, 14.36669921875, 14.975341796875, 15.583984375, 16.192626953125, 16.80126953125, 17.409912109375, 18.0185546875, 18.627197265625, 19.23583984375, 19.844482421875, 20.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 10.0, 10.0, 18.0, 5.0, 14.0, 27.0, 19.0, 16.0, 18.0, 28.0, 36.0, 31.0, 25.0, 37.0, 42.0, 30.0, 43.0, 42.0, 39.0, 40.0, 38.0, 38.0, 32.0, 31.0, 37.0, 41.0, 27.0, 27.0, 26.0, 24.0, 23.0, 16.0, 19.0, 13.0, 6.0, 8.0, 10.0, 11.0, 5.0, 6.0, 3.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-13.9765625, -13.52734375, -13.078125, -12.62890625, -12.1796875, -11.73046875, -11.28125, -10.83203125, -10.3828125, -9.93359375, -9.484375, -9.03515625, -8.5859375, -8.13671875, -7.6875, -7.23828125, -6.7890625, -6.33984375, -5.890625, -5.44140625, -4.9921875, -4.54296875, -4.09375, -3.64453125, -3.1953125, -2.74609375, -2.296875, -1.84765625, -1.3984375, -0.94921875, -0.5, -0.05078125, 0.3984375, 0.84765625, 1.296875, 1.74609375, 2.1953125, 2.64453125, 3.09375, 3.54296875, 3.9921875, 4.44140625, 4.890625, 5.33984375, 5.7890625, 6.23828125, 6.6875, 7.13671875, 7.5859375, 8.03515625, 8.484375, 8.93359375, 9.3828125, 9.83203125, 10.28125, 10.73046875, 11.1796875, 11.62890625, 12.078125, 12.52734375, 12.9765625, 13.42578125, 13.875, 14.32421875, 14.7734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 2.0, 9.0, 7.0, 11.0, 21.0, 28.0, 48.0, 74.0, 127.0, 151.0, 262.0, 377.0, 633.0, 1034.0, 1738.0, 2727.0, 4662.0, 8005.0, 13841.0, 24036.0, 40053.0, 64442.0, 96362.0, 129017.0, 149970.0, 147479.0, 124033.0, 90094.0, 59827.0, 36882.0, 21777.0, 12620.0, 7377.0, 4172.0, 2597.0, 1521.0, 912.0, 578.0, 364.0, 235.0, 164.0, 102.0, 61.0, 34.0, 25.0, 20.0, 11.0, 8.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.01171875, -4.83837890625, -4.6650390625, -4.49169921875, -4.318359375, -4.14501953125, -3.9716796875, -3.79833984375, -3.625, -3.45166015625, -3.2783203125, -3.10498046875, -2.931640625, -2.75830078125, -2.5849609375, -2.41162109375, -2.23828125, -2.06494140625, -1.8916015625, -1.71826171875, -1.544921875, -1.37158203125, -1.1982421875, -1.02490234375, -0.8515625, -0.67822265625, -0.5048828125, -0.33154296875, -0.158203125, 0.01513671875, 0.1884765625, 0.36181640625, 0.53515625, 0.70849609375, 0.8818359375, 1.05517578125, 1.228515625, 1.40185546875, 1.5751953125, 1.74853515625, 1.921875, 2.09521484375, 2.2685546875, 2.44189453125, 2.615234375, 2.78857421875, 2.9619140625, 3.13525390625, 3.30859375, 3.48193359375, 3.6552734375, 3.82861328125, 4.001953125, 4.17529296875, 4.3486328125, 4.52197265625, 4.6953125, 4.86865234375, 5.0419921875, 5.21533203125, 5.388671875, 5.56201171875, 5.7353515625, 5.90869140625, 6.08203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 3.0, 5.0, 11.0, 10.0, 8.0, 9.0, 20.0, 26.0, 21.0, 28.0, 21.0, 28.0, 39.0, 48.0, 31.0, 55.0, 48.0, 46.0, 48.0, 53.0, 55.0, 46.0, 51.0, 37.0, 41.0, 36.0, 33.0, 27.0, 18.0, 14.0, 19.0, 10.0, 12.0, 12.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005631446838378906, -0.0005464404821395874, -0.0005297362804412842, -0.000513032078742981, -0.0004963278770446777, -0.0004796236753463745, -0.0004629194736480713, -0.00044621527194976807, -0.00042951107025146484, -0.0004128068685531616, -0.0003961026668548584, -0.0003793984651565552, -0.00036269426345825195, -0.00034599006175994873, -0.0003292858600616455, -0.0003125816583633423, -0.00029587745666503906, -0.00027917325496673584, -0.0002624690532684326, -0.0002457648515701294, -0.00022906064987182617, -0.00021235644817352295, -0.00019565224647521973, -0.0001789480447769165, -0.00016224384307861328, -0.00014553964138031006, -0.00012883543968200684, -0.00011213123798370361, -9.542703628540039e-05, -7.872283458709717e-05, -6.201863288879395e-05, -4.531443119049072e-05, -2.86102294921875e-05, -1.1906027793884277e-05, 4.798173904418945e-06, 2.1502375602722168e-05, 3.820657730102539e-05, 5.491077899932861e-05, 7.161498069763184e-05, 8.831918239593506e-05, 0.00010502338409423828, 0.0001217275857925415, 0.00013843178749084473, 0.00015513598918914795, 0.00017184019088745117, 0.0001885443925857544, 0.00020524859428405762, 0.00022195279598236084, 0.00023865699768066406, 0.0002553611993789673, 0.0002720654010772705, 0.00028876960277557373, 0.00030547380447387695, 0.0003221780061721802, 0.0003388822078704834, 0.0003555864095687866, 0.00037229061126708984, 0.00038899481296539307, 0.0004056990146636963, 0.0004224032163619995, 0.00043910741806030273, 0.00045581161975860596, 0.0004725158214569092, 0.0004892200231552124, 0.0005059242248535156]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 10.0, 11.0, 12.0, 20.0, 34.0, 74.0, 90.0, 152.0, 267.0, 420.0, 688.0, 1136.0, 1791.0, 2802.0, 4755.0, 7436.0, 12010.0, 19527.0, 30149.0, 44807.0, 64915.0, 86927.0, 107605.0, 121824.0, 124203.0, 112713.0, 92432.0, 70103.0, 49952.0, 33754.0, 21928.0, 13757.0, 8420.0, 5410.0, 3205.0, 1923.0, 1278.0, 758.0, 501.0, 281.0, 184.0, 99.0, 66.0, 50.0, 23.0, 24.0, 16.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.60284423828125, -4.4595947265625, -4.31634521484375, -4.173095703125, -4.02984619140625, -3.8865966796875, -3.74334716796875, -3.60009765625, -3.45684814453125, -3.3135986328125, -3.17034912109375, -3.027099609375, -2.88385009765625, -2.7406005859375, -2.59735107421875, -2.4541015625, -2.31085205078125, -2.1676025390625, -2.02435302734375, -1.881103515625, -1.73785400390625, -1.5946044921875, -1.45135498046875, -1.30810546875, -1.16485595703125, -1.0216064453125, -0.87835693359375, -0.735107421875, -0.59185791015625, -0.4486083984375, -0.30535888671875, -0.162109375, -0.01885986328125, 0.1243896484375, 0.26763916015625, 0.410888671875, 0.55413818359375, 0.6973876953125, 0.84063720703125, 0.98388671875, 1.12713623046875, 1.2703857421875, 1.41363525390625, 1.556884765625, 1.70013427734375, 1.8433837890625, 1.98663330078125, 2.1298828125, 2.27313232421875, 2.4163818359375, 2.55963134765625, 2.702880859375, 2.84613037109375, 2.9893798828125, 3.13262939453125, 3.27587890625, 3.41912841796875, 3.5623779296875, 3.70562744140625, 3.848876953125, 3.99212646484375, 4.1353759765625, 4.27862548828125, 4.421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 13.0, 18.0, 14.0, 30.0, 29.0, 25.0, 40.0, 39.0, 50.0, 54.0, 52.0, 73.0, 54.0, 68.0, 67.0, 46.0, 55.0, 39.0, 32.0, 30.0, 34.0, 27.0, 22.0, 20.0, 11.0, 8.0, 9.0, 9.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.9765625, -2.9020843505859375, -2.827606201171875, -2.7531280517578125, -2.67864990234375, -2.6041717529296875, -2.529693603515625, -2.4552154541015625, -2.3807373046875, -2.3062591552734375, -2.231781005859375, -2.1573028564453125, -2.08282470703125, -2.0083465576171875, -1.933868408203125, -1.8593902587890625, -1.784912109375, -1.7104339599609375, -1.635955810546875, -1.5614776611328125, -1.48699951171875, -1.4125213623046875, -1.338043212890625, -1.2635650634765625, -1.1890869140625, -1.1146087646484375, -1.040130615234375, -0.9656524658203125, -0.89117431640625, -0.8166961669921875, -0.742218017578125, -0.6677398681640625, -0.59326171875, -0.5187835693359375, -0.444305419921875, -0.3698272705078125, -0.29534912109375, -0.2208709716796875, -0.146392822265625, -0.0719146728515625, 0.0025634765625, 0.0770416259765625, 0.151519775390625, 0.2259979248046875, 0.30047607421875, 0.3749542236328125, 0.449432373046875, 0.5239105224609375, 0.598388671875, 0.6728668212890625, 0.747344970703125, 0.8218231201171875, 0.89630126953125, 0.9707794189453125, 1.045257568359375, 1.1197357177734375, 1.1942138671875, 1.2686920166015625, 1.343170166015625, 1.4176483154296875, 1.49212646484375, 1.5666046142578125, 1.641082763671875, 1.7155609130859375, 1.7900390625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 3.0, 12.0, 8.0, 17.0, 17.0, 19.0, 13.0, 19.0, 19.0, 19.0, 38.0, 24.0, 38.0, 37.0, 34.0, 48.0, 45.0, 42.0, 50.0, 46.0, 43.0, 40.0, 39.0, 39.0, 43.0, 33.0, 40.0, 27.0, 16.0, 19.0, 22.0, 17.0, 8.0, 8.0, 11.0, 14.0, 6.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.251632690429688, -20.585906982421875, -19.920183181762695, -19.254457473754883, -18.588733673095703, -17.92300796508789, -17.25728416442871, -16.5915584564209, -15.925833702087402, -15.260108947753906, -14.59438419342041, -13.928659439086914, -13.262933731079102, -12.597209930419922, -11.93148422241211, -11.265759468078613, -10.600034713745117, -9.934309959411621, -9.268585205078125, -8.602860450744629, -7.937135219573975, -7.2714104652404785, -6.605685234069824, -5.939960479736328, -5.274235725402832, -4.608510971069336, -3.9427859783172607, -3.2770609855651855, -2.6113362312316895, -1.9456114768981934, -1.2798864841461182, -0.614161491394043, 0.05156517028808594, 0.7172900438308716, 1.3830149173736572, 2.0487399101257324, 2.7144646644592285, 3.3801894187927246, 4.045914649963379, 4.711639404296875, 5.377364158630371, 6.043088912963867, 6.708813667297363, 7.374538898468018, 8.040264129638672, 8.705987930297852, 9.371713638305664, 10.03743839263916, 10.703163146972656, 11.368887901306152, 12.034612655639648, 12.700337409973145, 13.36606216430664, 14.031787872314453, 14.69751262664795, 15.363237380981445, 16.028961181640625, 16.694686889648438, 17.360410690307617, 18.02613639831543, 18.69186019897461, 19.357585906982422, 20.0233097076416, 20.689035415649414, 21.354761123657227]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 10.0, 10.0, 14.0, 10.0, 23.0, 24.0, 26.0, 19.0, 28.0, 36.0, 32.0, 40.0, 42.0, 40.0, 40.0, 31.0, 39.0, 36.0, 34.0, 42.0, 37.0, 41.0, 38.0, 41.0, 32.0, 25.0, 30.0, 18.0, 21.0, 14.0, 24.0, 10.0, 12.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.7653751373291, -24.02655601501465, -23.287736892700195, -22.548917770385742, -21.810096740722656, -21.071277618408203, -20.33245849609375, -19.593639373779297, -18.854820251464844, -18.11600112915039, -17.377182006835938, -16.638362884521484, -15.899542808532715, -15.160723686218262, -14.421903610229492, -13.683084487915039, -12.944265365600586, -12.205446243286133, -11.46662712097168, -10.72780704498291, -9.988987922668457, -9.250168800354004, -8.511348724365234, -7.772529602050781, -7.033710479736328, -6.294891357421875, -5.556071758270264, -4.817252159118652, -4.078433036804199, -3.339613676071167, -2.6007943153381348, -1.8619747161865234, -1.1231536865234375, -0.3843343257904053, 0.35448503494262695, 1.0933043956756592, 1.8321237564086914, 2.5709431171417236, 3.309762477874756, 4.048582077026367, 4.78740119934082, 5.526220321655273, 6.265039920806885, 7.003859519958496, 7.742678642272949, 8.481497764587402, 9.220317840576172, 9.959136962890625, 10.697956085205078, 11.436775207519531, 12.175594329833984, 12.914414405822754, 13.653233528137207, 14.39205265045166, 15.13087272644043, 15.869691848754883, 16.608510971069336, 17.34733009338379, 18.086149215698242, 18.824968338012695, 19.56378936767578, 20.302608489990234, 21.041427612304688, 21.78024673461914, 22.519065856933594]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 12.0, 15.0, 31.0, 52.0, 67.0, 153.0, 255.0, 355.0, 614.0, 1019.0, 1538.0, 2530.0, 4083.0, 6750.0, 10562.0, 17110.0, 27698.0, 43928.0, 71077.0, 110780.0, 170863.0, 253181.0, 349052.0, 444258.0, 509210.0, 515828.0, 466010.0, 376856.0, 278874.0, 191128.0, 126022.0, 81140.0, 50968.0, 31437.0, 19793.0, 11808.0, 7426.0, 4469.0, 2781.0, 1761.0, 1056.0, 661.0, 431.0, 219.0, 175.0, 97.0, 57.0, 40.0, 21.0, 14.0, 13.0, 3.0, 0.0, 4.0, 3.0, 1.0], "bins": [-15.0546875, -14.6004638671875, -14.146240234375, -13.6920166015625, -13.23779296875, -12.7835693359375, -12.329345703125, -11.8751220703125, -11.4208984375, -10.9666748046875, -10.512451171875, -10.0582275390625, -9.60400390625, -9.1497802734375, -8.695556640625, -8.2413330078125, -7.787109375, -7.3328857421875, -6.878662109375, -6.4244384765625, -5.97021484375, -5.5159912109375, -5.061767578125, -4.6075439453125, -4.1533203125, -3.6990966796875, -3.244873046875, -2.7906494140625, -2.33642578125, -1.8822021484375, -1.427978515625, -0.9737548828125, -0.51953125, -0.0653076171875, 0.388916015625, 0.8431396484375, 1.29736328125, 1.7515869140625, 2.205810546875, 2.6600341796875, 3.1142578125, 3.5684814453125, 4.022705078125, 4.4769287109375, 4.93115234375, 5.3853759765625, 5.839599609375, 6.2938232421875, 6.748046875, 7.2022705078125, 7.656494140625, 8.1107177734375, 8.56494140625, 9.0191650390625, 9.473388671875, 9.9276123046875, 10.3818359375, 10.8360595703125, 11.290283203125, 11.7445068359375, 12.19873046875, 12.6529541015625, 13.107177734375, 13.5614013671875, 14.015625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 2.0, 3.0, 11.0, 5.0, 8.0, 7.0, 4.0, 13.0, 21.0, 13.0, 21.0, 21.0, 24.0, 26.0, 23.0, 26.0, 29.0, 40.0, 49.0, 43.0, 34.0, 36.0, 40.0, 33.0, 39.0, 42.0, 37.0, 34.0, 41.0, 40.0, 30.0, 28.0, 21.0, 31.0, 12.0, 20.0, 12.0, 13.0, 13.0, 14.0, 8.0, 5.0, 7.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.0, -17.450927734375, -16.90185546875, -16.352783203125, -15.8037109375, -15.254638671875, -14.70556640625, -14.156494140625, -13.607421875, -13.058349609375, -12.50927734375, -11.960205078125, -11.4111328125, -10.862060546875, -10.31298828125, -9.763916015625, -9.21484375, -8.665771484375, -8.11669921875, -7.567626953125, -7.0185546875, -6.469482421875, -5.92041015625, -5.371337890625, -4.822265625, -4.273193359375, -3.72412109375, -3.175048828125, -2.6259765625, -2.076904296875, -1.52783203125, -0.978759765625, -0.4296875, 0.119384765625, 0.66845703125, 1.217529296875, 1.7666015625, 2.315673828125, 2.86474609375, 3.413818359375, 3.962890625, 4.511962890625, 5.06103515625, 5.610107421875, 6.1591796875, 6.708251953125, 7.25732421875, 7.806396484375, 8.35546875, 8.904541015625, 9.45361328125, 10.002685546875, 10.5517578125, 11.100830078125, 11.64990234375, 12.198974609375, 12.748046875, 13.297119140625, 13.84619140625, 14.395263671875, 14.9443359375, 15.493408203125, 16.04248046875, 16.591552734375, 17.140625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 19.0, 44.0, 59.0, 104.0, 161.0, 251.0, 413.0, 728.0, 1290.0, 2318.0, 3802.0, 6410.0, 10924.0, 18424.0, 29631.0, 49008.0, 77156.0, 119453.0, 178615.0, 255114.0, 344095.0, 426808.0, 486279.0, 494435.0, 452859.0, 373803.0, 284768.0, 203380.0, 137911.0, 89778.0, 56996.0, 35715.0, 21517.0, 13334.0, 7812.0, 4494.0, 2575.0, 1570.0, 868.0, 567.0, 331.0, 200.0, 96.0, 69.0, 39.0, 28.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-16.03125, -15.5479736328125, -15.064697265625, -14.5814208984375, -14.09814453125, -13.6148681640625, -13.131591796875, -12.6483154296875, -12.1650390625, -11.6817626953125, -11.198486328125, -10.7152099609375, -10.23193359375, -9.7486572265625, -9.265380859375, -8.7821044921875, -8.298828125, -7.8155517578125, -7.332275390625, -6.8489990234375, -6.36572265625, -5.8824462890625, -5.399169921875, -4.9158935546875, -4.4326171875, -3.9493408203125, -3.466064453125, -2.9827880859375, -2.49951171875, -2.0162353515625, -1.532958984375, -1.0496826171875, -0.56640625, -0.0831298828125, 0.400146484375, 0.8834228515625, 1.36669921875, 1.8499755859375, 2.333251953125, 2.8165283203125, 3.2998046875, 3.7830810546875, 4.266357421875, 4.7496337890625, 5.23291015625, 5.7161865234375, 6.199462890625, 6.6827392578125, 7.166015625, 7.6492919921875, 8.132568359375, 8.6158447265625, 9.09912109375, 9.5823974609375, 10.065673828125, 10.5489501953125, 11.0322265625, 11.5155029296875, 11.998779296875, 12.4820556640625, 12.96533203125, 13.4486083984375, 13.931884765625, 14.4151611328125, 14.8984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 8.0, 3.0, 13.0, 13.0, 18.0, 21.0, 30.0, 36.0, 46.0, 50.0, 66.0, 86.0, 85.0, 130.0, 123.0, 155.0, 164.0, 184.0, 197.0, 228.0, 203.0, 252.0, 213.0, 225.0, 215.0, 167.0, 161.0, 168.0, 128.0, 115.0, 114.0, 80.0, 76.0, 70.0, 53.0, 47.0, 35.0, 19.0, 16.0, 16.0, 14.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-8.171875, -7.9261474609375, -7.680419921875, -7.4346923828125, -7.18896484375, -6.9432373046875, -6.697509765625, -6.4517822265625, -6.2060546875, -5.9603271484375, -5.714599609375, -5.4688720703125, -5.22314453125, -4.9774169921875, -4.731689453125, -4.4859619140625, -4.240234375, -3.9945068359375, -3.748779296875, -3.5030517578125, -3.25732421875, -3.0115966796875, -2.765869140625, -2.5201416015625, -2.2744140625, -2.0286865234375, -1.782958984375, -1.5372314453125, -1.29150390625, -1.0457763671875, -0.800048828125, -0.5543212890625, -0.30859375, -0.0628662109375, 0.182861328125, 0.4285888671875, 0.67431640625, 0.9200439453125, 1.165771484375, 1.4114990234375, 1.6572265625, 1.9029541015625, 2.148681640625, 2.3944091796875, 2.64013671875, 2.8858642578125, 3.131591796875, 3.3773193359375, 3.623046875, 3.8687744140625, 4.114501953125, 4.3602294921875, 4.60595703125, 4.8516845703125, 5.097412109375, 5.3431396484375, 5.5888671875, 5.8345947265625, 6.080322265625, 6.3260498046875, 6.57177734375, 6.8175048828125, 7.063232421875, 7.3089599609375, 7.5546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 13.0, 10.0, 10.0, 11.0, 14.0, 19.0, 16.0, 23.0, 20.0, 25.0, 29.0, 23.0, 36.0, 41.0, 33.0, 28.0, 42.0, 46.0, 32.0, 35.0, 39.0, 47.0, 31.0, 35.0, 30.0, 20.0, 26.0, 33.0, 28.0, 24.0, 21.0, 15.0, 20.0, 22.0, 8.0, 7.0, 5.0, 8.0, 11.0, 9.0, 2.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 7.0, 2.0, 2.0], "bins": [-16.19312858581543, -15.700928688049316, -15.208728790283203, -14.71652889251709, -14.224328994750977, -13.732129096984863, -13.23992919921875, -12.747729301452637, -12.255529403686523, -11.76332950592041, -11.271129608154297, -10.778929710388184, -10.28672981262207, -9.794529914855957, -9.302330017089844, -8.81013011932373, -8.317930221557617, -7.825730323791504, -7.333530426025391, -6.841330528259277, -6.349130630493164, -5.856930732727051, -5.3647308349609375, -4.872530937194824, -4.380331039428711, -3.8881311416625977, -3.3959312438964844, -2.903731346130371, -2.411531448364258, -1.9193315505981445, -1.4271316528320312, -0.934931755065918, -0.4427328109741211, 0.04946708679199219, 0.5416669845581055, 1.0338668823242188, 1.526066780090332, 2.0182666778564453, 2.5104665756225586, 3.002666473388672, 3.494866371154785, 3.9870662689208984, 4.479266166687012, 4.971466064453125, 5.463665962219238, 5.955865859985352, 6.448065757751465, 6.940265655517578, 7.432465553283691, 7.924665451049805, 8.416865348815918, 8.909065246582031, 9.401265144348145, 9.893465042114258, 10.385664939880371, 10.877864837646484, 11.370064735412598, 11.862264633178711, 12.354464530944824, 12.846664428710938, 13.33886432647705, 13.831064224243164, 14.323264122009277, 14.81546401977539, 15.307663917541504]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 0.0, 2.0, 10.0, 5.0, 6.0, 7.0, 5.0, 8.0, 10.0, 18.0, 14.0, 23.0, 16.0, 20.0, 23.0, 31.0, 22.0, 28.0, 32.0, 34.0, 43.0, 21.0, 37.0, 50.0, 32.0, 35.0, 40.0, 42.0, 33.0, 40.0, 33.0, 33.0, 26.0, 29.0, 25.0, 33.0, 21.0, 20.0, 16.0, 11.0, 12.0, 13.0, 11.0, 9.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-19.54261589050293, -18.945056915283203, -18.347496032714844, -17.749937057495117, -17.15237808227539, -16.55481719970703, -15.957258224487305, -15.359699249267578, -14.762139320373535, -14.164579391479492, -13.567020416259766, -12.969460487365723, -12.37190055847168, -11.774341583251953, -11.17678165435791, -10.579221725463867, -9.98166275024414, -9.384102821350098, -8.786543846130371, -8.188983917236328, -7.591424465179443, -6.993865013122559, -6.396305084228516, -5.798745632171631, -5.201186180114746, -4.603626728057861, -4.006067276000977, -3.4085073471069336, -2.810947895050049, -2.213388442993164, -1.6158287525177002, -1.0182690620422363, -0.4207115173339844, 0.17684805393218994, 0.7744076251983643, 1.3719671964645386, 1.969526767730713, 2.5670862197875977, 3.1646459102630615, 3.7622056007385254, 4.35976505279541, 4.957324504852295, 5.55488395690918, 6.152443885803223, 6.750003337860107, 7.347562789916992, 7.945122718811035, 8.542682647705078, 9.140241622924805, 9.737801551818848, 10.335360527038574, 10.932920455932617, 11.530479431152344, 12.128039360046387, 12.72559928894043, 13.323158264160156, 13.9207181930542, 14.518278121948242, 15.115837097167969, 15.713397026062012, 16.310956954956055, 16.90851593017578, 17.506074905395508, 18.103635787963867, 18.701194763183594]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 26.0, 19.0, 30.0, 54.0, 67.0, 93.0, 126.0, 198.0, 282.0, 440.0, 636.0, 977.0, 1537.0, 2483.0, 4162.0, 7036.0, 12238.0, 22190.0, 40413.0, 73920.0, 128360.0, 191655.0, 206083.0, 151071.0, 90521.0, 50024.0, 27316.0, 15030.0, 8399.0, 4974.0, 2906.0, 1824.0, 1094.0, 791.0, 491.0, 319.0, 223.0, 167.0, 110.0, 74.0, 54.0, 45.0, 20.0, 21.0, 16.0, 6.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.883544921875, -9.53271484375, -9.181884765625, -8.8310546875, -8.480224609375, -8.12939453125, -7.778564453125, -7.427734375, -7.076904296875, -6.72607421875, -6.375244140625, -6.0244140625, -5.673583984375, -5.32275390625, -4.971923828125, -4.62109375, -4.270263671875, -3.91943359375, -3.568603515625, -3.2177734375, -2.866943359375, -2.51611328125, -2.165283203125, -1.814453125, -1.463623046875, -1.11279296875, -0.761962890625, -0.4111328125, -0.060302734375, 0.29052734375, 0.641357421875, 0.9921875, 1.343017578125, 1.69384765625, 2.044677734375, 2.3955078125, 2.746337890625, 3.09716796875, 3.447998046875, 3.798828125, 4.149658203125, 4.50048828125, 4.851318359375, 5.2021484375, 5.552978515625, 5.90380859375, 6.254638671875, 6.60546875, 6.956298828125, 7.30712890625, 7.657958984375, 8.0087890625, 8.359619140625, 8.71044921875, 9.061279296875, 9.412109375, 9.762939453125, 10.11376953125, 10.464599609375, 10.8154296875, 11.166259765625, 11.51708984375, 11.867919921875, 12.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 7.0, 9.0, 7.0, 12.0, 11.0, 15.0, 24.0, 19.0, 23.0, 24.0, 26.0, 24.0, 34.0, 33.0, 37.0, 30.0, 33.0, 44.0, 35.0, 40.0, 58.0, 41.0, 34.0, 46.0, 35.0, 36.0, 28.0, 32.0, 25.0, 29.0, 21.0, 16.0, 18.0, 20.0, 10.0, 11.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.885009765625, -19.25439453125, -18.623779296875, -17.9931640625, -17.362548828125, -16.73193359375, -16.101318359375, -15.470703125, -14.840087890625, -14.20947265625, -13.578857421875, -12.9482421875, -12.317626953125, -11.68701171875, -11.056396484375, -10.42578125, -9.795166015625, -9.16455078125, -8.533935546875, -7.9033203125, -7.272705078125, -6.64208984375, -6.011474609375, -5.380859375, -4.750244140625, -4.11962890625, -3.489013671875, -2.8583984375, -2.227783203125, -1.59716796875, -0.966552734375, -0.3359375, 0.294677734375, 0.92529296875, 1.555908203125, 2.1865234375, 2.817138671875, 3.44775390625, 4.078369140625, 4.708984375, 5.339599609375, 5.97021484375, 6.600830078125, 7.2314453125, 7.862060546875, 8.49267578125, 9.123291015625, 9.75390625, 10.384521484375, 11.01513671875, 11.645751953125, 12.2763671875, 12.906982421875, 13.53759765625, 14.168212890625, 14.798828125, 15.429443359375, 16.06005859375, 16.690673828125, 17.3212890625, 17.951904296875, 18.58251953125, 19.213134765625, 19.84375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 4.0, 9.0, 8.0, 13.0, 14.0, 37.0, 30.0, 53.0, 81.0, 113.0, 180.0, 225.0, 375.0, 556.0, 904.0, 1525.0, 2741.0, 5482.0, 12152.0, 33178.0, 100862.0, 276421.0, 356530.0, 167130.0, 54593.0, 18797.0, 7632.0, 3653.0, 1950.0, 1162.0, 689.0, 479.0, 294.0, 212.0, 144.0, 100.0, 69.0, 47.0, 31.0, 23.0, 21.0, 11.0, 10.0, 5.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.671875, -12.29052734375, -11.9091796875, -11.52783203125, -11.146484375, -10.76513671875, -10.3837890625, -10.00244140625, -9.62109375, -9.23974609375, -8.8583984375, -8.47705078125, -8.095703125, -7.71435546875, -7.3330078125, -6.95166015625, -6.5703125, -6.18896484375, -5.8076171875, -5.42626953125, -5.044921875, -4.66357421875, -4.2822265625, -3.90087890625, -3.51953125, -3.13818359375, -2.7568359375, -2.37548828125, -1.994140625, -1.61279296875, -1.2314453125, -0.85009765625, -0.46875, -0.08740234375, 0.2939453125, 0.67529296875, 1.056640625, 1.43798828125, 1.8193359375, 2.20068359375, 2.58203125, 2.96337890625, 3.3447265625, 3.72607421875, 4.107421875, 4.48876953125, 4.8701171875, 5.25146484375, 5.6328125, 6.01416015625, 6.3955078125, 6.77685546875, 7.158203125, 7.53955078125, 7.9208984375, 8.30224609375, 8.68359375, 9.06494140625, 9.4462890625, 9.82763671875, 10.208984375, 10.59033203125, 10.9716796875, 11.35302734375, 11.734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 4.0, 8.0, 13.0, 12.0, 11.0, 16.0, 23.0, 26.0, 33.0, 24.0, 28.0, 36.0, 32.0, 42.0, 41.0, 35.0, 51.0, 50.0, 49.0, 37.0, 41.0, 35.0, 37.0, 27.0, 31.0, 36.0, 36.0, 29.0, 24.0, 20.0, 18.0, 8.0, 15.0, 18.0, 9.0, 7.0, 10.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5703125, -14.0848388671875, -13.599365234375, -13.1138916015625, -12.62841796875, -12.1429443359375, -11.657470703125, -11.1719970703125, -10.6865234375, -10.2010498046875, -9.715576171875, -9.2301025390625, -8.74462890625, -8.2591552734375, -7.773681640625, -7.2882080078125, -6.802734375, -6.3172607421875, -5.831787109375, -5.3463134765625, -4.86083984375, -4.3753662109375, -3.889892578125, -3.4044189453125, -2.9189453125, -2.4334716796875, -1.947998046875, -1.4625244140625, -0.97705078125, -0.4915771484375, -0.006103515625, 0.4793701171875, 0.96484375, 1.4503173828125, 1.935791015625, 2.4212646484375, 2.90673828125, 3.3922119140625, 3.877685546875, 4.3631591796875, 4.8486328125, 5.3341064453125, 5.819580078125, 6.3050537109375, 6.79052734375, 7.2760009765625, 7.761474609375, 8.2469482421875, 8.732421875, 9.2178955078125, 9.703369140625, 10.1888427734375, 10.67431640625, 11.1597900390625, 11.645263671875, 12.1307373046875, 12.6162109375, 13.1016845703125, 13.587158203125, 14.0726318359375, 14.55810546875, 15.0435791015625, 15.529052734375, 16.0145263671875, 16.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 14.0, 14.0, 27.0, 31.0, 45.0, 66.0, 77.0, 120.0, 162.0, 244.0, 407.0, 660.0, 1070.0, 1776.0, 3260.0, 6447.0, 14348.0, 37689.0, 124540.0, 457610.0, 282364.0, 71732.0, 24660.0, 10176.0, 4865.0, 2427.0, 1372.0, 750.0, 502.0, 314.0, 199.0, 139.0, 101.0, 69.0, 61.0, 56.0, 42.0, 31.0, 24.0, 14.0, 12.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.33074951171875, -5.1575927734375, -4.98443603515625, -4.811279296875, -4.63812255859375, -4.4649658203125, -4.29180908203125, -4.11865234375, -3.94549560546875, -3.7723388671875, -3.59918212890625, -3.426025390625, -3.25286865234375, -3.0797119140625, -2.90655517578125, -2.7333984375, -2.56024169921875, -2.3870849609375, -2.21392822265625, -2.040771484375, -1.86761474609375, -1.6944580078125, -1.52130126953125, -1.34814453125, -1.17498779296875, -1.0018310546875, -0.82867431640625, -0.655517578125, -0.48236083984375, -0.3092041015625, -0.13604736328125, 0.037109375, 0.21026611328125, 0.3834228515625, 0.55657958984375, 0.729736328125, 0.90289306640625, 1.0760498046875, 1.24920654296875, 1.42236328125, 1.59552001953125, 1.7686767578125, 1.94183349609375, 2.114990234375, 2.28814697265625, 2.4613037109375, 2.63446044921875, 2.8076171875, 2.98077392578125, 3.1539306640625, 3.32708740234375, 3.500244140625, 3.67340087890625, 3.8465576171875, 4.01971435546875, 4.19287109375, 4.36602783203125, 4.5391845703125, 4.71234130859375, 4.885498046875, 5.05865478515625, 5.2318115234375, 5.40496826171875, 5.578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 8.0, 8.0, 9.0, 19.0, 17.0, 24.0, 29.0, 27.0, 29.0, 53.0, 67.0, 93.0, 95.0, 77.0, 77.0, 59.0, 61.0, 46.0, 33.0, 30.0, 21.0, 20.0, 17.0, 10.0, 7.0, 13.0, 9.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007414817810058594, -0.0007174909114837646, -0.0006935000419616699, -0.0006695091724395752, -0.0006455183029174805, -0.0006215274333953857, -0.000597536563873291, -0.0005735456943511963, -0.0005495548248291016, -0.0005255639553070068, -0.0005015730857849121, -0.0004775822162628174, -0.00045359134674072266, -0.00042960047721862793, -0.0004056096076965332, -0.0003816187381744385, -0.00035762786865234375, -0.000333636999130249, -0.0003096461296081543, -0.00028565526008605957, -0.00026166439056396484, -0.00023767352104187012, -0.0002136826515197754, -0.00018969178199768066, -0.00016570091247558594, -0.0001417100429534912, -0.00011771917343139648, -9.372830390930176e-05, -6.973743438720703e-05, -4.5746564865112305e-05, -2.1755695343017578e-05, 2.2351741790771484e-06, 2.6226043701171875e-05, 5.02169132232666e-05, 7.420778274536133e-05, 9.819865226745605e-05, 0.00012218952178955078, 0.0001461803913116455, 0.00017017126083374023, 0.00019416213035583496, 0.0002181529998779297, 0.00024214386940002441, 0.00026613473892211914, 0.00029012560844421387, 0.0003141164779663086, 0.0003381073474884033, 0.00036209821701049805, 0.0003860890865325928, 0.0004100799560546875, 0.0004340708255767822, 0.00045806169509887695, 0.0004820525646209717, 0.0005060434341430664, 0.0005300343036651611, 0.0005540251731872559, 0.0005780160427093506, 0.0006020069122314453, 0.00062599778175354, 0.0006499886512756348, 0.0006739795207977295, 0.0006979703903198242, 0.0007219612598419189, 0.0007459521293640137, 0.0007699429988861084, 0.0007939338684082031]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 10.0, 7.0, 14.0, 21.0, 13.0, 37.0, 46.0, 75.0, 119.0, 152.0, 220.0, 352.0, 561.0, 910.0, 1584.0, 2749.0, 4867.0, 10047.0, 20338.0, 43204.0, 96357.0, 219802.0, 324894.0, 176550.0, 76519.0, 34800.0, 16373.0, 8038.0, 4128.0, 2259.0, 1267.0, 798.0, 502.0, 305.0, 201.0, 140.0, 76.0, 60.0, 46.0, 33.0, 25.0, 14.0, 5.0, 13.0, 9.0, 8.0, 2.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.578125, -5.358154296875, -5.13818359375, -4.918212890625, -4.6982421875, -4.478271484375, -4.25830078125, -4.038330078125, -3.818359375, -3.598388671875, -3.37841796875, -3.158447265625, -2.9384765625, -2.718505859375, -2.49853515625, -2.278564453125, -2.05859375, -1.838623046875, -1.61865234375, -1.398681640625, -1.1787109375, -0.958740234375, -0.73876953125, -0.518798828125, -0.298828125, -0.078857421875, 0.14111328125, 0.361083984375, 0.5810546875, 0.801025390625, 1.02099609375, 1.240966796875, 1.4609375, 1.680908203125, 1.90087890625, 2.120849609375, 2.3408203125, 2.560791015625, 2.78076171875, 3.000732421875, 3.220703125, 3.440673828125, 3.66064453125, 3.880615234375, 4.1005859375, 4.320556640625, 4.54052734375, 4.760498046875, 4.98046875, 5.200439453125, 5.42041015625, 5.640380859375, 5.8603515625, 6.080322265625, 6.30029296875, 6.520263671875, 6.740234375, 6.960205078125, 7.18017578125, 7.400146484375, 7.6201171875, 7.840087890625, 8.06005859375, 8.280029296875, 8.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 10.0, 7.0, 14.0, 17.0, 25.0, 16.0, 27.0, 27.0, 28.0, 51.0, 51.0, 54.0, 62.0, 73.0, 60.0, 63.0, 51.0, 68.0, 67.0, 41.0, 43.0, 22.0, 23.0, 23.0, 18.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.391754150390625, -1.33233642578125, -1.272918701171875, -1.2135009765625, -1.154083251953125, -1.09466552734375, -1.035247802734375, -0.975830078125, -0.916412353515625, -0.85699462890625, -0.797576904296875, -0.7381591796875, -0.678741455078125, -0.61932373046875, -0.559906005859375, -0.50048828125, -0.441070556640625, -0.38165283203125, -0.322235107421875, -0.2628173828125, -0.203399658203125, -0.14398193359375, -0.084564208984375, -0.025146484375, 0.034271240234375, 0.09368896484375, 0.153106689453125, 0.2125244140625, 0.271942138671875, 0.33135986328125, 0.390777587890625, 0.4501953125, 0.509613037109375, 0.56903076171875, 0.628448486328125, 0.6878662109375, 0.747283935546875, 0.80670166015625, 0.866119384765625, 0.925537109375, 0.984954833984375, 1.04437255859375, 1.103790283203125, 1.1632080078125, 1.222625732421875, 1.28204345703125, 1.341461181640625, 1.40087890625, 1.460296630859375, 1.51971435546875, 1.579132080078125, 1.6385498046875, 1.697967529296875, 1.75738525390625, 1.816802978515625, 1.876220703125, 1.935638427734375, 1.99505615234375, 2.054473876953125, 2.1138916015625, 2.173309326171875, 2.23272705078125, 2.292144775390625, 2.3515625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 14.0, 10.0, 16.0, 17.0, 22.0, 16.0, 28.0, 24.0, 21.0, 32.0, 34.0, 35.0, 42.0, 40.0, 43.0, 48.0, 43.0, 42.0, 34.0, 23.0, 49.0, 34.0, 30.0, 29.0, 39.0, 28.0, 19.0, 21.0, 20.0, 15.0, 10.0, 17.0, 9.0, 7.0, 7.0, 10.0, 4.0, 5.0, 6.0, 4.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.254413604736328, -15.745338439941406, -15.236262321472168, -14.727187156677246, -14.218111991882324, -13.709035873413086, -13.199960708618164, -12.690885543823242, -12.18181037902832, -11.672735214233398, -11.16365909576416, -10.654583930969238, -10.145508766174316, -9.636432647705078, -9.127357482910156, -8.618282318115234, -8.109206199645996, -7.600130558013916, -7.091055393218994, -6.581979751586914, -6.072904586791992, -5.563828945159912, -5.054753303527832, -4.54567813873291, -4.03660249710083, -3.527527093887329, -3.018451690673828, -2.509376049041748, -2.000300645828247, -1.491225242614746, -0.982149600982666, -0.47307419776916504, 0.03600120544433594, 0.5450766682624817, 1.0541521310806274, 1.563227653503418, 2.072303056716919, 2.58137845993042, 3.0904541015625, 3.599529504776001, 4.108604907989502, 4.617680549621582, 5.126755714416504, 5.635831356048584, 6.144906997680664, 6.653982162475586, 7.163057804107666, 7.672133445739746, 8.181208610534668, 8.69028377532959, 9.199359893798828, 9.70843505859375, 10.217510223388672, 10.726585388183594, 11.235661506652832, 11.744736671447754, 12.253812789916992, 12.762887954711914, 13.271964073181152, 13.781039237976074, 14.290114402770996, 14.799190521240234, 15.308265686035156, 15.817340850830078, 16.326416015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 4.0, 2.0, 1.0, 7.0, 9.0, 3.0, 8.0, 6.0, 8.0, 9.0, 11.0, 13.0, 24.0, 16.0, 23.0, 20.0, 23.0, 21.0, 37.0, 23.0, 25.0, 47.0, 26.0, 39.0, 41.0, 40.0, 32.0, 37.0, 38.0, 31.0, 37.0, 29.0, 37.0, 37.0, 17.0, 30.0, 33.0, 26.0, 20.0, 13.0, 21.0, 11.0, 17.0, 7.0, 13.0, 7.0, 6.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-18.023099899291992, -17.46468734741211, -16.90627670288086, -16.347864151000977, -15.789453506469727, -15.231040954589844, -14.672629356384277, -14.114217758178711, -13.555806159973145, -12.997394561767578, -12.438982963562012, -11.880571365356445, -11.322158813476562, -10.763748168945312, -10.20533561706543, -9.646924018859863, -9.088512420654297, -8.53010082244873, -7.971689224243164, -7.4132771492004395, -6.854865550994873, -6.296453952789307, -5.738041877746582, -5.179630279541016, -4.621218681335449, -4.062807083129883, -3.5043952465057373, -2.945983409881592, -2.3875718116760254, -1.829160213470459, -1.2707483768463135, -0.712336540222168, -0.15392303466796875, 0.4044886827468872, 0.9629004001617432, 1.5213121175765991, 2.079723834991455, 2.6381354331970215, 3.196547269821167, 3.7549591064453125, 4.313370704650879, 4.871782302856445, 5.430193901062012, 5.988605976104736, 6.547017574310303, 7.105429172515869, 7.663841247558594, 8.22225284576416, 8.780664443969727, 9.339076042175293, 9.89748764038086, 10.455899238586426, 11.014310836791992, 11.572723388671875, 12.131134986877441, 12.689546585083008, 13.247958183288574, 13.80636978149414, 14.364781379699707, 14.923192977905273, 15.481605529785156, 16.040016174316406, 16.59842872619629, 17.156841278076172, 17.715251922607422]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 13.0, 12.0, 25.0, 28.0, 38.0, 68.0, 93.0, 161.0, 203.0, 336.0, 482.0, 785.0, 1142.0, 1689.0, 2632.0, 3669.0, 5444.0, 8058.0, 11409.0, 16397.0, 22710.0, 30831.0, 41287.0, 52788.0, 64949.0, 76636.0, 86695.0, 91736.0, 91483.0, 86891.0, 77615.0, 66313.0, 53829.0, 42144.0, 31857.0, 23496.0, 16870.0, 11938.0, 8260.0, 5632.0, 3901.0, 2647.0, 1835.0, 1198.0, 791.0, 530.0, 351.0, 205.0, 169.0, 118.0, 63.0, 29.0, 32.0, 24.0, 10.0, 13.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.9921875, -10.6263427734375, -10.260498046875, -9.8946533203125, -9.52880859375, -9.1629638671875, -8.797119140625, -8.4312744140625, -8.0654296875, -7.6995849609375, -7.333740234375, -6.9678955078125, -6.60205078125, -6.2362060546875, -5.870361328125, -5.5045166015625, -5.138671875, -4.7728271484375, -4.406982421875, -4.0411376953125, -3.67529296875, -3.3094482421875, -2.943603515625, -2.5777587890625, -2.2119140625, -1.8460693359375, -1.480224609375, -1.1143798828125, -0.74853515625, -0.3826904296875, -0.016845703125, 0.3489990234375, 0.71484375, 1.0806884765625, 1.446533203125, 1.8123779296875, 2.17822265625, 2.5440673828125, 2.909912109375, 3.2757568359375, 3.6416015625, 4.0074462890625, 4.373291015625, 4.7391357421875, 5.10498046875, 5.4708251953125, 5.836669921875, 6.2025146484375, 6.568359375, 6.9342041015625, 7.300048828125, 7.6658935546875, 8.03173828125, 8.3975830078125, 8.763427734375, 9.1292724609375, 9.4951171875, 9.8609619140625, 10.226806640625, 10.5926513671875, 10.95849609375, 11.3243408203125, 11.690185546875, 12.0560302734375, 12.421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 5.0, 4.0, 11.0, 8.0, 12.0, 7.0, 9.0, 13.0, 13.0, 14.0, 18.0, 22.0, 24.0, 24.0, 29.0, 41.0, 28.0, 27.0, 36.0, 34.0, 35.0, 42.0, 42.0, 47.0, 32.0, 31.0, 30.0, 31.0, 34.0, 40.0, 31.0, 38.0, 16.0, 19.0, 23.0, 17.0, 14.0, 16.0, 12.0, 11.0, 15.0, 10.0, 4.0, 7.0, 6.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.5625, -17.0107421875, -16.458984375, -15.9072265625, -15.35546875, -14.8037109375, -14.251953125, -13.7001953125, -13.1484375, -12.5966796875, -12.044921875, -11.4931640625, -10.94140625, -10.3896484375, -9.837890625, -9.2861328125, -8.734375, -8.1826171875, -7.630859375, -7.0791015625, -6.52734375, -5.9755859375, -5.423828125, -4.8720703125, -4.3203125, -3.7685546875, -3.216796875, -2.6650390625, -2.11328125, -1.5615234375, -1.009765625, -0.4580078125, 0.09375, 0.6455078125, 1.197265625, 1.7490234375, 2.30078125, 2.8525390625, 3.404296875, 3.9560546875, 4.5078125, 5.0595703125, 5.611328125, 6.1630859375, 6.71484375, 7.2666015625, 7.818359375, 8.3701171875, 8.921875, 9.4736328125, 10.025390625, 10.5771484375, 11.12890625, 11.6806640625, 12.232421875, 12.7841796875, 13.3359375, 13.8876953125, 14.439453125, 14.9912109375, 15.54296875, 16.0947265625, 16.646484375, 17.1982421875, 17.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 9.0, 30.0, 27.0, 59.0, 90.0, 132.0, 203.0, 349.0, 546.0, 830.0, 1332.0, 2156.0, 3304.0, 5241.0, 8106.0, 12514.0, 18827.0, 28025.0, 40125.0, 55617.0, 73233.0, 90695.0, 104478.0, 111087.0, 108531.0, 96725.0, 80446.0, 62988.0, 45932.0, 32790.0, 22266.0, 14991.0, 9693.0, 6216.0, 4094.0, 2480.0, 1573.0, 1016.0, 643.0, 429.0, 276.0, 142.0, 102.0, 66.0, 56.0, 31.0, 12.0, 14.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-16.59375, -16.1014404296875, -15.609130859375, -15.1168212890625, -14.62451171875, -14.1322021484375, -13.639892578125, -13.1475830078125, -12.6552734375, -12.1629638671875, -11.670654296875, -11.1783447265625, -10.68603515625, -10.1937255859375, -9.701416015625, -9.2091064453125, -8.716796875, -8.2244873046875, -7.732177734375, -7.2398681640625, -6.74755859375, -6.2552490234375, -5.762939453125, -5.2706298828125, -4.7783203125, -4.2860107421875, -3.793701171875, -3.3013916015625, -2.80908203125, -2.3167724609375, -1.824462890625, -1.3321533203125, -0.83984375, -0.3475341796875, 0.144775390625, 0.6370849609375, 1.12939453125, 1.6217041015625, 2.114013671875, 2.6063232421875, 3.0986328125, 3.5909423828125, 4.083251953125, 4.5755615234375, 5.06787109375, 5.5601806640625, 6.052490234375, 6.5447998046875, 7.037109375, 7.5294189453125, 8.021728515625, 8.5140380859375, 9.00634765625, 9.4986572265625, 9.990966796875, 10.4832763671875, 10.9755859375, 11.4678955078125, 11.960205078125, 12.4525146484375, 12.94482421875, 13.4371337890625, 13.929443359375, 14.4217529296875, 14.9140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 12.0, 12.0, 9.0, 9.0, 16.0, 29.0, 20.0, 24.0, 29.0, 31.0, 36.0, 25.0, 35.0, 42.0, 35.0, 48.0, 44.0, 38.0, 56.0, 33.0, 37.0, 39.0, 33.0, 41.0, 30.0, 26.0, 38.0, 31.0, 20.0, 21.0, 16.0, 19.0, 16.0, 2.0, 6.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.322998046875, -10.89599609375, -10.468994140625, -10.0419921875, -9.614990234375, -9.18798828125, -8.760986328125, -8.333984375, -7.906982421875, -7.47998046875, -7.052978515625, -6.6259765625, -6.198974609375, -5.77197265625, -5.344970703125, -4.91796875, -4.490966796875, -4.06396484375, -3.636962890625, -3.2099609375, -2.782958984375, -2.35595703125, -1.928955078125, -1.501953125, -1.074951171875, -0.64794921875, -0.220947265625, 0.2060546875, 0.633056640625, 1.06005859375, 1.487060546875, 1.9140625, 2.341064453125, 2.76806640625, 3.195068359375, 3.6220703125, 4.049072265625, 4.47607421875, 4.903076171875, 5.330078125, 5.757080078125, 6.18408203125, 6.611083984375, 7.0380859375, 7.465087890625, 7.89208984375, 8.319091796875, 8.74609375, 9.173095703125, 9.60009765625, 10.027099609375, 10.4541015625, 10.881103515625, 11.30810546875, 11.735107421875, 12.162109375, 12.589111328125, 13.01611328125, 13.443115234375, 13.8701171875, 14.297119140625, 14.72412109375, 15.151123046875, 15.578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 10.0, 3.0, 4.0, 6.0, 20.0, 23.0, 32.0, 49.0, 89.0, 119.0, 183.0, 299.0, 421.0, 657.0, 1008.0, 1638.0, 2721.0, 4690.0, 7942.0, 13619.0, 23264.0, 39727.0, 65676.0, 99924.0, 134706.0, 155722.0, 151254.0, 122685.0, 86842.0, 55147.0, 33095.0, 19196.0, 11162.0, 6535.0, 3862.0, 2239.0, 1450.0, 875.0, 566.0, 364.0, 247.0, 179.0, 101.0, 73.0, 47.0, 35.0, 25.0, 12.0, 11.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.45147705078125, -5.2623291015625, -5.07318115234375, -4.884033203125, -4.69488525390625, -4.5057373046875, -4.31658935546875, -4.12744140625, -3.93829345703125, -3.7491455078125, -3.55999755859375, -3.370849609375, -3.18170166015625, -2.9925537109375, -2.80340576171875, -2.6142578125, -2.42510986328125, -2.2359619140625, -2.04681396484375, -1.857666015625, -1.66851806640625, -1.4793701171875, -1.29022216796875, -1.10107421875, -0.91192626953125, -0.7227783203125, -0.53363037109375, -0.344482421875, -0.15533447265625, 0.0338134765625, 0.22296142578125, 0.412109375, 0.60125732421875, 0.7904052734375, 0.97955322265625, 1.168701171875, 1.35784912109375, 1.5469970703125, 1.73614501953125, 1.92529296875, 2.11444091796875, 2.3035888671875, 2.49273681640625, 2.681884765625, 2.87103271484375, 3.0601806640625, 3.24932861328125, 3.4384765625, 3.62762451171875, 3.8167724609375, 4.00592041015625, 4.195068359375, 4.38421630859375, 4.5733642578125, 4.76251220703125, 4.95166015625, 5.14080810546875, 5.3299560546875, 5.51910400390625, 5.708251953125, 5.89739990234375, 6.0865478515625, 6.27569580078125, 6.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 18.0, 13.0, 14.0, 13.0, 17.0, 25.0, 25.0, 30.0, 27.0, 54.0, 44.0, 30.0, 53.0, 43.0, 47.0, 46.0, 37.0, 53.0, 43.0, 51.0, 39.0, 35.0, 29.0, 33.0, 24.0, 19.0, 25.0, 16.0, 20.0, 9.0, 12.0, 8.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005345344543457031, -0.0005172118544578552, -0.0004998892545700073, -0.0004825666546821594, -0.0004652440547943115, -0.0004479214549064636, -0.0004305988550186157, -0.0004132762551307678, -0.0003959536552429199, -0.000378631055355072, -0.0003613084554672241, -0.0003439858555793762, -0.0003266632556915283, -0.0003093406558036804, -0.0002920180559158325, -0.0002746954560279846, -0.0002573728561401367, -0.00024005025625228882, -0.00022272765636444092, -0.00020540505647659302, -0.00018808245658874512, -0.00017075985670089722, -0.00015343725681304932, -0.00013611465692520142, -0.00011879205703735352, -0.00010146945714950562, -8.414685726165771e-05, -6.682425737380981e-05, -4.9501657485961914e-05, -3.2179057598114014e-05, -1.4856457710266113e-05, 2.466142177581787e-06, 1.9788742065429688e-05, 3.711134195327759e-05, 5.443394184112549e-05, 7.175654172897339e-05, 8.907914161682129e-05, 0.00010640174150466919, 0.0001237243413925171, 0.000141046941280365, 0.0001583695411682129, 0.0001756921410560608, 0.0001930147409439087, 0.0002103373408317566, 0.0002276599407196045, 0.0002449825406074524, 0.0002623051404953003, 0.0002796277403831482, 0.0002969503402709961, 0.000314272940158844, 0.0003315955400466919, 0.0003489181399345398, 0.0003662407398223877, 0.0003835633397102356, 0.0004008859395980835, 0.0004182085394859314, 0.0004355311393737793, 0.0004528537392616272, 0.0004701763391494751, 0.000487498939037323, 0.0005048215389251709, 0.0005221441388130188, 0.0005394667387008667, 0.0005567893385887146, 0.0005741119384765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 24.0, 29.0, 58.0, 114.0, 196.0, 388.0, 683.0, 1407.0, 2685.0, 5292.0, 10330.0, 19820.0, 37460.0, 65606.0, 105353.0, 146545.0, 169817.0, 161828.0, 127273.0, 85165.0, 50311.0, 28059.0, 14584.0, 7540.0, 3886.0, 1922.0, 1015.0, 509.0, 295.0, 175.0, 80.0, 52.0, 21.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.919189453125, -5.71337890625, -5.507568359375, -5.3017578125, -5.095947265625, -4.89013671875, -4.684326171875, -4.478515625, -4.272705078125, -4.06689453125, -3.861083984375, -3.6552734375, -3.449462890625, -3.24365234375, -3.037841796875, -2.83203125, -2.626220703125, -2.42041015625, -2.214599609375, -2.0087890625, -1.802978515625, -1.59716796875, -1.391357421875, -1.185546875, -0.979736328125, -0.77392578125, -0.568115234375, -0.3623046875, -0.156494140625, 0.04931640625, 0.255126953125, 0.4609375, 0.666748046875, 0.87255859375, 1.078369140625, 1.2841796875, 1.489990234375, 1.69580078125, 1.901611328125, 2.107421875, 2.313232421875, 2.51904296875, 2.724853515625, 2.9306640625, 3.136474609375, 3.34228515625, 3.548095703125, 3.75390625, 3.959716796875, 4.16552734375, 4.371337890625, 4.5771484375, 4.782958984375, 4.98876953125, 5.194580078125, 5.400390625, 5.606201171875, 5.81201171875, 6.017822265625, 6.2236328125, 6.429443359375, 6.63525390625, 6.841064453125, 7.046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 14.0, 20.0, 21.0, 21.0, 21.0, 23.0, 29.0, 27.0, 33.0, 34.0, 33.0, 52.0, 46.0, 37.0, 50.0, 29.0, 50.0, 45.0, 34.0, 39.0, 41.0, 33.0, 36.0, 27.0, 20.0, 23.0, 23.0, 19.0, 13.0, 15.0, 7.0, 7.0, 10.0, 6.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8115234375, -1.75238037109375, -1.6932373046875, -1.63409423828125, -1.574951171875, -1.51580810546875, -1.4566650390625, -1.39752197265625, -1.33837890625, -1.27923583984375, -1.2200927734375, -1.16094970703125, -1.101806640625, -1.04266357421875, -0.9835205078125, -0.92437744140625, -0.865234375, -0.80609130859375, -0.7469482421875, -0.68780517578125, -0.628662109375, -0.56951904296875, -0.5103759765625, -0.45123291015625, -0.39208984375, -0.33294677734375, -0.2738037109375, -0.21466064453125, -0.155517578125, -0.09637451171875, -0.0372314453125, 0.02191162109375, 0.0810546875, 0.14019775390625, 0.1993408203125, 0.25848388671875, 0.317626953125, 0.37677001953125, 0.4359130859375, 0.49505615234375, 0.55419921875, 0.61334228515625, 0.6724853515625, 0.73162841796875, 0.790771484375, 0.84991455078125, 0.9090576171875, 0.96820068359375, 1.02734375, 1.08648681640625, 1.1456298828125, 1.20477294921875, 1.263916015625, 1.32305908203125, 1.3822021484375, 1.44134521484375, 1.50048828125, 1.55963134765625, 1.6187744140625, 1.67791748046875, 1.737060546875, 1.79620361328125, 1.8553466796875, 1.91448974609375, 1.9736328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 6.0, 5.0, 2.0, 8.0, 7.0, 13.0, 12.0, 13.0, 15.0, 12.0, 20.0, 21.0, 31.0, 24.0, 40.0, 31.0, 29.0, 37.0, 32.0, 37.0, 34.0, 36.0, 49.0, 39.0, 41.0, 34.0, 33.0, 30.0, 30.0, 44.0, 29.0, 35.0, 24.0, 27.0, 20.0, 16.0, 14.0, 12.0, 6.0, 7.0, 9.0, 11.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.05389976501465, -15.5481595993042, -15.042420387268066, -14.536680221557617, -14.030940055847168, -13.525199890136719, -13.019460678100586, -12.513720512390137, -12.007980346679688, -11.502240180969238, -10.996500968933105, -10.490760803222656, -9.985020637512207, -9.479280471801758, -8.973541259765625, -8.467801094055176, -7.962061882019043, -7.456322193145752, -6.950582027435303, -6.444842338562012, -5.9391021728515625, -5.4333624839782715, -4.9276227951049805, -4.421882629394531, -3.9161429405212402, -3.41040301322937, -2.9046630859375, -2.398923397064209, -1.8931834697723389, -1.3874435424804688, -0.8817038536071777, -0.3759639263153076, 0.1297760009765625, 0.6355158686637878, 1.1412557363510132, 1.6469955444335938, 2.152735471725464, 2.658475399017334, 3.164215087890625, 3.669955015182495, 4.175694942474365, 4.681434631347656, 5.1871747970581055, 5.6929144859313965, 6.1986541748046875, 6.704394340515137, 7.210134029388428, 7.715873718261719, 8.221613883972168, 8.727354049682617, 9.23309326171875, 9.7388334274292, 10.244573593139648, 10.750312805175781, 11.25605297088623, 11.76179313659668, 12.267532348632812, 12.773272514343262, 13.279011726379395, 13.784751892089844, 14.290492057800293, 14.796232223510742, 15.301971435546875, 15.807711601257324, 16.313451766967773]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 5.0, 7.0, 12.0, 10.0, 13.0, 17.0, 21.0, 23.0, 29.0, 34.0, 23.0, 38.0, 44.0, 38.0, 29.0, 35.0, 44.0, 51.0, 30.0, 49.0, 50.0, 43.0, 41.0, 37.0, 38.0, 34.0, 35.0, 29.0, 25.0, 16.0, 21.0, 12.0, 10.0, 10.0, 4.0, 5.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.502573013305664, -22.80191421508789, -22.101255416870117, -21.400596618652344, -20.69993782043457, -19.999279022216797, -19.298622131347656, -18.597963333129883, -17.89730453491211, -17.196645736694336, -16.495986938476562, -15.795328140258789, -15.094670295715332, -14.394011497497559, -13.693352699279785, -12.992694854736328, -12.292035102844238, -11.591376304626465, -10.890717506408691, -10.190059661865234, -9.489400863647461, -8.788742065429688, -8.088083267211914, -7.387424945831299, -6.686766147613525, -5.986107349395752, -5.285449028015137, -4.584790229797363, -3.884131669998169, -3.1834731101989746, -2.482814311981201, -1.782155990600586, -1.0814971923828125, -0.3808385729789734, 0.3198200464248657, 1.0204787254333496, 1.721137285232544, 2.4217958450317383, 3.1224546432495117, 3.823112964630127, 4.5237717628479, 5.224430561065674, 5.925088882446289, 6.6257476806640625, 7.326406478881836, 8.02706527709961, 8.727724075317383, 9.42838191986084, 10.129040718078613, 10.829699516296387, 11.53035831451416, 12.231016159057617, 12.93167495727539, 13.632333755493164, 14.332992553710938, 15.033651351928711, 15.734310150146484, 16.434968948364258, 17.13562774658203, 17.836286544799805, 18.536945343017578, 19.23760223388672, 19.938262939453125, 20.638919830322266, 21.33957862854004]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 7.0, 5.0, 10.0, 15.0, 25.0, 44.0, 93.0, 136.0, 224.0, 419.0, 667.0, 1155.0, 1975.0, 3418.0, 6007.0, 10591.0, 18634.0, 33088.0, 57899.0, 98267.0, 164404.0, 258805.0, 377733.0, 502103.0, 580568.0, 576183.0, 494413.0, 373236.0, 251456.0, 158074.0, 95210.0, 55161.0, 31918.0, 18138.0, 10345.0, 5913.0, 3354.0, 1984.0, 1101.0, 599.0, 373.0, 233.0, 120.0, 87.0, 52.0, 26.0, 12.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.7708740234375, -11.299560546875, -10.8282470703125, -10.35693359375, -9.8856201171875, -9.414306640625, -8.9429931640625, -8.4716796875, -8.0003662109375, -7.529052734375, -7.0577392578125, -6.58642578125, -6.1151123046875, -5.643798828125, -5.1724853515625, -4.701171875, -4.2298583984375, -3.758544921875, -3.2872314453125, -2.81591796875, -2.3446044921875, -1.873291015625, -1.4019775390625, -0.9306640625, -0.4593505859375, 0.011962890625, 0.4832763671875, 0.95458984375, 1.4259033203125, 1.897216796875, 2.3685302734375, 2.83984375, 3.3111572265625, 3.782470703125, 4.2537841796875, 4.72509765625, 5.1964111328125, 5.667724609375, 6.1390380859375, 6.6103515625, 7.0816650390625, 7.552978515625, 8.0242919921875, 8.49560546875, 8.9669189453125, 9.438232421875, 9.9095458984375, 10.380859375, 10.8521728515625, 11.323486328125, 11.7947998046875, 12.26611328125, 12.7374267578125, 13.208740234375, 13.6800537109375, 14.1513671875, 14.6226806640625, 15.093994140625, 15.5653076171875, 16.03662109375, 16.5079345703125, 16.979248046875, 17.4505615234375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 7.0, 3.0, 7.0, 13.0, 12.0, 10.0, 15.0, 16.0, 23.0, 32.0, 39.0, 32.0, 26.0, 36.0, 39.0, 41.0, 34.0, 36.0, 44.0, 44.0, 45.0, 40.0, 43.0, 45.0, 47.0, 29.0, 35.0, 36.0, 29.0, 20.0, 20.0, 20.0, 15.0, 11.0, 4.0, 8.0, 9.0, 11.0, 1.0, 3.0, 8.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.46875, -15.94384765625, -15.4189453125, -14.89404296875, -14.369140625, -13.84423828125, -13.3193359375, -12.79443359375, -12.26953125, -11.74462890625, -11.2197265625, -10.69482421875, -10.169921875, -9.64501953125, -9.1201171875, -8.59521484375, -8.0703125, -7.54541015625, -7.0205078125, -6.49560546875, -5.970703125, -5.44580078125, -4.9208984375, -4.39599609375, -3.87109375, -3.34619140625, -2.8212890625, -2.29638671875, -1.771484375, -1.24658203125, -0.7216796875, -0.19677734375, 0.328125, 0.85302734375, 1.3779296875, 1.90283203125, 2.427734375, 2.95263671875, 3.4775390625, 4.00244140625, 4.52734375, 5.05224609375, 5.5771484375, 6.10205078125, 6.626953125, 7.15185546875, 7.6767578125, 8.20166015625, 8.7265625, 9.25146484375, 9.7763671875, 10.30126953125, 10.826171875, 11.35107421875, 11.8759765625, 12.40087890625, 12.92578125, 13.45068359375, 13.9755859375, 14.50048828125, 15.025390625, 15.55029296875, 16.0751953125, 16.60009765625, 17.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 6.0, 9.0, 18.0, 28.0, 52.0, 84.0, 133.0, 215.0, 338.0, 531.0, 908.0, 1436.0, 2322.0, 3866.0, 6293.0, 9839.0, 15447.0, 24708.0, 37810.0, 57524.0, 85382.0, 122883.0, 169961.0, 228593.0, 289490.0, 349700.0, 393859.0, 415865.0, 406973.0, 370429.0, 316246.0, 253666.0, 193719.0, 142663.0, 99520.0, 68293.0, 44891.0, 29700.0, 19234.0, 11973.0, 7445.0, 4755.0, 2889.0, 1723.0, 1106.0, 691.0, 378.0, 269.0, 180.0, 108.0, 47.0, 32.0, 22.0, 15.0, 10.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.171875, -10.80810546875, -10.4443359375, -10.08056640625, -9.716796875, -9.35302734375, -8.9892578125, -8.62548828125, -8.26171875, -7.89794921875, -7.5341796875, -7.17041015625, -6.806640625, -6.44287109375, -6.0791015625, -5.71533203125, -5.3515625, -4.98779296875, -4.6240234375, -4.26025390625, -3.896484375, -3.53271484375, -3.1689453125, -2.80517578125, -2.44140625, -2.07763671875, -1.7138671875, -1.35009765625, -0.986328125, -0.62255859375, -0.2587890625, 0.10498046875, 0.46875, 0.83251953125, 1.1962890625, 1.56005859375, 1.923828125, 2.28759765625, 2.6513671875, 3.01513671875, 3.37890625, 3.74267578125, 4.1064453125, 4.47021484375, 4.833984375, 5.19775390625, 5.5615234375, 5.92529296875, 6.2890625, 6.65283203125, 7.0166015625, 7.38037109375, 7.744140625, 8.10791015625, 8.4716796875, 8.83544921875, 9.19921875, 9.56298828125, 9.9267578125, 10.29052734375, 10.654296875, 11.01806640625, 11.3818359375, 11.74560546875, 12.109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 15.0, 22.0, 27.0, 31.0, 35.0, 38.0, 69.0, 73.0, 71.0, 99.0, 116.0, 118.0, 155.0, 170.0, 219.0, 187.0, 210.0, 218.0, 214.0, 182.0, 217.0, 196.0, 168.0, 166.0, 137.0, 164.0, 118.0, 114.0, 95.0, 77.0, 57.0, 56.0, 40.0, 30.0, 33.0, 17.0, 16.0, 30.0, 9.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.207763671875, -5.98974609375, -5.771728515625, -5.5537109375, -5.335693359375, -5.11767578125, -4.899658203125, -4.681640625, -4.463623046875, -4.24560546875, -4.027587890625, -3.8095703125, -3.591552734375, -3.37353515625, -3.155517578125, -2.9375, -2.719482421875, -2.50146484375, -2.283447265625, -2.0654296875, -1.847412109375, -1.62939453125, -1.411376953125, -1.193359375, -0.975341796875, -0.75732421875, -0.539306640625, -0.3212890625, -0.103271484375, 0.11474609375, 0.332763671875, 0.55078125, 0.768798828125, 0.98681640625, 1.204833984375, 1.4228515625, 1.640869140625, 1.85888671875, 2.076904296875, 2.294921875, 2.512939453125, 2.73095703125, 2.948974609375, 3.1669921875, 3.385009765625, 3.60302734375, 3.821044921875, 4.0390625, 4.257080078125, 4.47509765625, 4.693115234375, 4.9111328125, 5.129150390625, 5.34716796875, 5.565185546875, 5.783203125, 6.001220703125, 6.21923828125, 6.437255859375, 6.6552734375, 6.873291015625, 7.09130859375, 7.309326171875, 7.52734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 7.0, 6.0, 10.0, 10.0, 13.0, 12.0, 23.0, 24.0, 23.0, 15.0, 22.0, 26.0, 23.0, 40.0, 35.0, 41.0, 38.0, 34.0, 45.0, 36.0, 42.0, 47.0, 35.0, 46.0, 40.0, 23.0, 34.0, 25.0, 40.0, 32.0, 24.0, 17.0, 11.0, 14.0, 14.0, 10.0, 13.0, 9.0, 8.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.987288475036621, -15.524848937988281, -15.062409400939941, -14.599970817565918, -14.137531280517578, -13.675091743469238, -13.212652206420898, -12.750213623046875, -12.287774085998535, -11.825334548950195, -11.362895011901855, -10.900456428527832, -10.438016891479492, -9.975577354431152, -9.513137817382812, -9.050699234008789, -8.588258743286133, -8.125819206237793, -7.663380146026611, -7.2009406089782715, -6.73850154876709, -6.27606201171875, -5.81362247467041, -5.3511834144592285, -4.888744354248047, -4.426304817199707, -3.9638657569885254, -3.5014262199401855, -3.038987159729004, -2.576547622680664, -2.1141083240509033, -1.6516690254211426, -1.189229965209961, -0.7267906665802002, -0.2643513083457947, 0.19808804988861084, 0.6605273485183716, 1.1229667663574219, 1.5854060649871826, 2.0478453636169434, 2.510284662246704, 2.972723960876465, 3.4351632595062256, 3.8976025581359863, 4.360042095184326, 4.822481155395508, 5.284920692443848, 5.7473602294921875, 6.209799289703369, 6.672238826751709, 7.134677886962891, 7.5971174240112305, 8.05955696105957, 8.521995544433594, 8.984435081481934, 9.446874618530273, 9.909314155578613, 10.371753692626953, 10.834193229675293, 11.296631813049316, 11.759071350097656, 12.221510887145996, 12.683950424194336, 13.14638900756836, 13.6088285446167]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 7.0, 4.0, 16.0, 7.0, 13.0, 15.0, 12.0, 14.0, 30.0, 39.0, 25.0, 35.0, 31.0, 38.0, 43.0, 48.0, 49.0, 41.0, 51.0, 52.0, 40.0, 47.0, 43.0, 36.0, 41.0, 32.0, 43.0, 24.0, 20.0, 28.0, 17.0, 7.0, 14.0, 7.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.085586547851562, -19.4284610748291, -18.771333694458008, -18.114208221435547, -17.457080841064453, -16.799955368041992, -16.14282989501953, -15.485703468322754, -14.828577041625977, -14.1714506149292, -13.514324188232422, -12.857198715209961, -12.200072288513184, -11.542945861816406, -10.885820388793945, -10.228693962097168, -9.57156753540039, -8.914441108703613, -8.257314682006836, -7.600189208984375, -6.943062782287598, -6.28593635559082, -5.628810405731201, -4.971684455871582, -4.314558029174805, -3.6574318408966064, -3.000305652618408, -2.34317946434021, -1.6860532760620117, -1.0289270877838135, -0.37180089950561523, 0.2853250503540039, 0.9424514770507812, 1.5995776653289795, 2.2567038536071777, 2.913830041885376, 3.570956230163574, 4.228082656860352, 4.885208606719971, 5.54233455657959, 6.199460983276367, 6.8565874099731445, 7.513713359832764, 8.170839309692383, 8.82796573638916, 9.485092163085938, 10.142217636108398, 10.799344062805176, 11.456470489501953, 12.11359691619873, 12.770723342895508, 13.427848815917969, 14.084975242614746, 14.742101669311523, 15.399227142333984, 16.056354522705078, 16.71347999572754, 17.37060546875, 18.027732849121094, 18.684858322143555, 19.341983795166016, 19.99911117553711, 20.65623664855957, 21.31336212158203, 21.970489501953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 5.0, 17.0, 21.0, 26.0, 34.0, 45.0, 87.0, 145.0, 202.0, 282.0, 436.0, 648.0, 1006.0, 1520.0, 2395.0, 3618.0, 5207.0, 8039.0, 12272.0, 18178.0, 27188.0, 40536.0, 57474.0, 78683.0, 103685.0, 123861.0, 129326.0, 117023.0, 93311.0, 70036.0, 49966.0, 34137.0, 23374.0, 15452.0, 10296.0, 6639.0, 4568.0, 3001.0, 1982.0, 1337.0, 850.0, 560.0, 356.0, 253.0, 157.0, 112.0, 74.0, 52.0, 25.0, 22.0, 13.0, 15.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.296875, -4.15020751953125, -4.0035400390625, -3.85687255859375, -3.710205078125, -3.56353759765625, -3.4168701171875, -3.27020263671875, -3.12353515625, -2.97686767578125, -2.8302001953125, -2.68353271484375, -2.536865234375, -2.39019775390625, -2.2435302734375, -2.09686279296875, -1.9501953125, -1.80352783203125, -1.6568603515625, -1.51019287109375, -1.363525390625, -1.21685791015625, -1.0701904296875, -0.92352294921875, -0.77685546875, -0.63018798828125, -0.4835205078125, -0.33685302734375, -0.190185546875, -0.04351806640625, 0.1031494140625, 0.24981689453125, 0.396484375, 0.54315185546875, 0.6898193359375, 0.83648681640625, 0.983154296875, 1.12982177734375, 1.2764892578125, 1.42315673828125, 1.56982421875, 1.71649169921875, 1.8631591796875, 2.00982666015625, 2.156494140625, 2.30316162109375, 2.4498291015625, 2.59649658203125, 2.7431640625, 2.88983154296875, 3.0364990234375, 3.18316650390625, 3.329833984375, 3.47650146484375, 3.6231689453125, 3.76983642578125, 3.91650390625, 4.06317138671875, 4.2098388671875, 4.35650634765625, 4.503173828125, 4.64984130859375, 4.7965087890625, 4.94317626953125, 5.08984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 14.0, 20.0, 11.0, 17.0, 19.0, 23.0, 34.0, 32.0, 27.0, 28.0, 53.0, 46.0, 43.0, 43.0, 45.0, 36.0, 43.0, 43.0, 56.0, 40.0, 38.0, 36.0, 23.0, 33.0, 34.0, 22.0, 23.0, 20.0, 12.0, 12.0, 6.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.249267578125, -18.60791015625, -17.966552734375, -17.3251953125, -16.683837890625, -16.04248046875, -15.401123046875, -14.759765625, -14.118408203125, -13.47705078125, -12.835693359375, -12.1943359375, -11.552978515625, -10.91162109375, -10.270263671875, -9.62890625, -8.987548828125, -8.34619140625, -7.704833984375, -7.0634765625, -6.422119140625, -5.78076171875, -5.139404296875, -4.498046875, -3.856689453125, -3.21533203125, -2.573974609375, -1.9326171875, -1.291259765625, -0.64990234375, -0.008544921875, 0.6328125, 1.274169921875, 1.91552734375, 2.556884765625, 3.1982421875, 3.839599609375, 4.48095703125, 5.122314453125, 5.763671875, 6.405029296875, 7.04638671875, 7.687744140625, 8.3291015625, 8.970458984375, 9.61181640625, 10.253173828125, 10.89453125, 11.535888671875, 12.17724609375, 12.818603515625, 13.4599609375, 14.101318359375, 14.74267578125, 15.384033203125, 16.025390625, 16.666748046875, 17.30810546875, 17.949462890625, 18.5908203125, 19.232177734375, 19.87353515625, 20.514892578125, 21.15625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 4.0, 12.0, 16.0, 28.0, 36.0, 46.0, 85.0, 79.0, 149.0, 195.0, 335.0, 472.0, 711.0, 1097.0, 1613.0, 2543.0, 4244.0, 6885.0, 11722.0, 20632.0, 36185.0, 62497.0, 103488.0, 152846.0, 184081.0, 166551.0, 117134.0, 72828.0, 42529.0, 24279.0, 13857.0, 8139.0, 4813.0, 2928.0, 1919.0, 1188.0, 780.0, 503.0, 330.0, 250.0, 174.0, 103.0, 85.0, 58.0, 34.0, 19.0, 12.0, 12.0, 11.0, 6.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.66796875, -4.52044677734375, -4.3729248046875, -4.22540283203125, -4.077880859375, -3.93035888671875, -3.7828369140625, -3.63531494140625, -3.48779296875, -3.34027099609375, -3.1927490234375, -3.04522705078125, -2.897705078125, -2.75018310546875, -2.6026611328125, -2.45513916015625, -2.3076171875, -2.16009521484375, -2.0125732421875, -1.86505126953125, -1.717529296875, -1.57000732421875, -1.4224853515625, -1.27496337890625, -1.12744140625, -0.97991943359375, -0.8323974609375, -0.68487548828125, -0.537353515625, -0.38983154296875, -0.2423095703125, -0.09478759765625, 0.052734375, 0.20025634765625, 0.3477783203125, 0.49530029296875, 0.642822265625, 0.79034423828125, 0.9378662109375, 1.08538818359375, 1.23291015625, 1.38043212890625, 1.5279541015625, 1.67547607421875, 1.822998046875, 1.97052001953125, 2.1180419921875, 2.26556396484375, 2.4130859375, 2.56060791015625, 2.7081298828125, 2.85565185546875, 3.003173828125, 3.15069580078125, 3.2982177734375, 3.44573974609375, 3.59326171875, 3.74078369140625, 3.8883056640625, 4.03582763671875, 4.183349609375, 4.33087158203125, 4.4783935546875, 4.62591552734375, 4.7734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 13.0, 16.0, 18.0, 10.0, 13.0, 26.0, 28.0, 24.0, 29.0, 26.0, 32.0, 41.0, 35.0, 37.0, 42.0, 36.0, 46.0, 41.0, 38.0, 39.0, 43.0, 29.0, 30.0, 29.0, 34.0, 21.0, 32.0, 30.0, 23.0, 22.0, 12.0, 18.0, 14.0, 8.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.7919921875, -10.396484375, -10.0009765625, -9.60546875, -9.2099609375, -8.814453125, -8.4189453125, -8.0234375, -7.6279296875, -7.232421875, -6.8369140625, -6.44140625, -6.0458984375, -5.650390625, -5.2548828125, -4.859375, -4.4638671875, -4.068359375, -3.6728515625, -3.27734375, -2.8818359375, -2.486328125, -2.0908203125, -1.6953125, -1.2998046875, -0.904296875, -0.5087890625, -0.11328125, 0.2822265625, 0.677734375, 1.0732421875, 1.46875, 1.8642578125, 2.259765625, 2.6552734375, 3.05078125, 3.4462890625, 3.841796875, 4.2373046875, 4.6328125, 5.0283203125, 5.423828125, 5.8193359375, 6.21484375, 6.6103515625, 7.005859375, 7.4013671875, 7.796875, 8.1923828125, 8.587890625, 8.9833984375, 9.37890625, 9.7744140625, 10.169921875, 10.5654296875, 10.9609375, 11.3564453125, 11.751953125, 12.1474609375, 12.54296875, 12.9384765625, 13.333984375, 13.7294921875, 14.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 17.0, 26.0, 39.0, 73.0, 121.0, 173.0, 311.0, 492.0, 955.0, 1818.0, 3716.0, 7579.0, 17046.0, 41227.0, 110061.0, 295575.0, 342629.0, 137762.0, 50391.0, 20339.0, 8946.0, 4331.0, 2167.0, 1135.0, 653.0, 382.0, 231.0, 137.0, 84.0, 44.0, 28.0, 19.0, 12.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.37237548828125, -2.2935791015625, -2.21478271484375, -2.135986328125, -2.05718994140625, -1.9783935546875, -1.89959716796875, -1.82080078125, -1.74200439453125, -1.6632080078125, -1.58441162109375, -1.505615234375, -1.42681884765625, -1.3480224609375, -1.26922607421875, -1.1904296875, -1.11163330078125, -1.0328369140625, -0.95404052734375, -0.875244140625, -0.79644775390625, -0.7176513671875, -0.63885498046875, -0.56005859375, -0.48126220703125, -0.4024658203125, -0.32366943359375, -0.244873046875, -0.16607666015625, -0.0872802734375, -0.00848388671875, 0.0703125, 0.14910888671875, 0.2279052734375, 0.30670166015625, 0.385498046875, 0.46429443359375, 0.5430908203125, 0.62188720703125, 0.70068359375, 0.77947998046875, 0.8582763671875, 0.93707275390625, 1.015869140625, 1.09466552734375, 1.1734619140625, 1.25225830078125, 1.3310546875, 1.40985107421875, 1.4886474609375, 1.56744384765625, 1.646240234375, 1.72503662109375, 1.8038330078125, 1.88262939453125, 1.96142578125, 2.04022216796875, 2.1190185546875, 2.19781494140625, 2.276611328125, 2.35540771484375, 2.4342041015625, 2.51300048828125, 2.591796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 14.0, 7.0, 10.0, 16.0, 16.0, 17.0, 18.0, 29.0, 28.0, 40.0, 57.0, 61.0, 76.0, 86.0, 105.0, 93.0, 78.0, 54.0, 34.0, 11.0, 29.0, 16.0, 16.0, 15.0, 13.0, 14.0, 7.0, 5.0, 6.0, 3.0, 8.0, 0.0, 2.0, 5.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.0003479085862636566, -0.00033508986234664917, -0.0003222711384296417, -0.0003094524145126343, -0.00029663369059562683, -0.0002838149666786194, -0.00027099624276161194, -0.0002581775188446045, -0.00024535879492759705, -0.0002325400710105896, -0.00021972134709358215, -0.0002069026231765747, -0.00019408389925956726, -0.00018126517534255981, -0.00016844645142555237, -0.00015562772750854492, -0.00014280900359153748, -0.00012999027967453003, -0.00011717155575752258, -0.00010435283184051514, -9.153410792350769e-05, -7.871538400650024e-05, -6.58966600894928e-05, -5.307793617248535e-05, -4.0259212255477905e-05, -2.744048833847046e-05, -1.4621764421463013e-05, -1.8030405044555664e-06, 1.101568341255188e-05, 2.3834407329559326e-05, 3.665313124656677e-05, 4.947185516357422e-05, 6.229057908058167e-05, 7.510930299758911e-05, 8.792802691459656e-05, 0.000100746750831604, 0.00011356547474861145, 0.0001263841986656189, 0.00013920292258262634, 0.0001520216464996338, 0.00016484037041664124, 0.00017765909433364868, 0.00019047781825065613, 0.00020329654216766357, 0.00021611526608467102, 0.00022893399000167847, 0.0002417527139186859, 0.00025457143783569336, 0.0002673901617527008, 0.00028020888566970825, 0.0002930276095867157, 0.00030584633350372314, 0.0003186650574207306, 0.00033148378133773804, 0.0003443025052547455, 0.00035712122917175293, 0.0003699399530887604, 0.0003827586770057678, 0.00039557740092277527, 0.0004083961248397827, 0.00042121484875679016, 0.0004340335726737976, 0.00044685229659080505, 0.0004596710205078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 14.0, 25.0, 31.0, 49.0, 68.0, 79.0, 129.0, 211.0, 249.0, 379.0, 579.0, 932.0, 1420.0, 2305.0, 3695.0, 6052.0, 10493.0, 18339.0, 32811.0, 57764.0, 100474.0, 166368.0, 216636.0, 174962.0, 108374.0, 62446.0, 35079.0, 19943.0, 11472.0, 6513.0, 3855.0, 2402.0, 1536.0, 924.0, 644.0, 421.0, 265.0, 183.0, 115.0, 87.0, 56.0, 49.0, 38.0, 24.0, 13.0, 11.0, 10.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.537109375, -2.4541015625, -2.37109375, -2.2880859375, -2.205078125, -2.1220703125, -2.0390625, -1.9560546875, -1.873046875, -1.7900390625, -1.70703125, -1.6240234375, -1.541015625, -1.4580078125, -1.375, -1.2919921875, -1.208984375, -1.1259765625, -1.04296875, -0.9599609375, -0.876953125, -0.7939453125, -0.7109375, -0.6279296875, -0.544921875, -0.4619140625, -0.37890625, -0.2958984375, -0.212890625, -0.1298828125, -0.046875, 0.0361328125, 0.119140625, 0.2021484375, 0.28515625, 0.3681640625, 0.451171875, 0.5341796875, 0.6171875, 0.7001953125, 0.783203125, 0.8662109375, 0.94921875, 1.0322265625, 1.115234375, 1.1982421875, 1.28125, 1.3642578125, 1.447265625, 1.5302734375, 1.61328125, 1.6962890625, 1.779296875, 1.8623046875, 1.9453125, 2.0283203125, 2.111328125, 2.1943359375, 2.27734375, 2.3603515625, 2.443359375, 2.5263671875, 2.609375, 2.6923828125, 2.775390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 7.0, 14.0, 10.0, 22.0, 28.0, 24.0, 35.0, 42.0, 37.0, 67.0, 62.0, 62.0, 83.0, 63.0, 75.0, 59.0, 58.0, 47.0, 42.0, 29.0, 26.0, 16.0, 12.0, 10.0, 10.0, 5.0, 8.0, 12.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1318359375, -1.095458984375, -1.05908203125, -1.022705078125, -0.986328125, -0.949951171875, -0.91357421875, -0.877197265625, -0.8408203125, -0.804443359375, -0.76806640625, -0.731689453125, -0.6953125, -0.658935546875, -0.62255859375, -0.586181640625, -0.5498046875, -0.513427734375, -0.47705078125, -0.440673828125, -0.404296875, -0.367919921875, -0.33154296875, -0.295166015625, -0.2587890625, -0.222412109375, -0.18603515625, -0.149658203125, -0.11328125, -0.076904296875, -0.04052734375, -0.004150390625, 0.0322265625, 0.068603515625, 0.10498046875, 0.141357421875, 0.177734375, 0.214111328125, 0.25048828125, 0.286865234375, 0.3232421875, 0.359619140625, 0.39599609375, 0.432373046875, 0.46875, 0.505126953125, 0.54150390625, 0.577880859375, 0.6142578125, 0.650634765625, 0.68701171875, 0.723388671875, 0.759765625, 0.796142578125, 0.83251953125, 0.868896484375, 0.9052734375, 0.941650390625, 0.97802734375, 1.014404296875, 1.05078125, 1.087158203125, 1.12353515625, 1.159912109375, 1.1962890625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 5.0, 8.0, 11.0, 8.0, 16.0, 19.0, 24.0, 11.0, 18.0, 20.0, 17.0, 30.0, 40.0, 29.0, 34.0, 32.0, 37.0, 45.0, 40.0, 40.0, 38.0, 30.0, 53.0, 34.0, 38.0, 32.0, 38.0, 36.0, 27.0, 35.0, 17.0, 21.0, 14.0, 7.0, 15.0, 12.0, 12.0, 6.0, 11.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.69510269165039, -15.243623733520508, -14.792144775390625, -14.340665817260742, -13.889187812805176, -13.437708854675293, -12.98622989654541, -12.534750938415527, -12.083272933959961, -11.631793975830078, -11.180315017700195, -10.728836059570312, -10.277358055114746, -9.825879096984863, -9.37440013885498, -8.922921180725098, -8.471442222595215, -8.019963264465332, -7.568484783172607, -7.117005825042725, -6.66552734375, -6.214048385620117, -5.762569427490234, -5.311090469360352, -4.859611988067627, -4.408133029937744, -3.9566545486450195, -3.5051755905151367, -3.053696870803833, -2.6022181510925293, -2.1507391929626465, -1.6992604732513428, -1.2477827072143555, -0.796303927898407, -0.3448251485824585, 0.10665369033813477, 0.5581324100494385, 1.0096111297607422, 1.461090087890625, 1.9125688076019287, 2.3640475273132324, 2.815526247024536, 3.26700496673584, 3.7184839248657227, 4.1699628829956055, 4.62144136428833, 5.072920322418213, 5.5243988037109375, 5.97587776184082, 6.427356719970703, 6.878835201263428, 7.3303141593933105, 7.781792640686035, 8.233271598815918, 8.6847505569458, 9.136229515075684, 9.58770751953125, 10.039186477661133, 10.490665435791016, 10.942144393920898, 11.393622398376465, 11.845101356506348, 12.29658031463623, 12.748059272766113, 13.199538230895996]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 8.0, 5.0, 18.0, 11.0, 13.0, 13.0, 9.0, 23.0, 34.0, 35.0, 26.0, 36.0, 34.0, 44.0, 47.0, 48.0, 46.0, 38.0, 56.0, 45.0, 37.0, 43.0, 49.0, 45.0, 29.0, 39.0, 30.0, 19.0, 23.0, 24.0, 10.0, 13.0, 13.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.151615142822266, -18.512569427490234, -17.873523712158203, -17.23447608947754, -16.595430374145508, -15.956384658813477, -15.317338943481445, -14.678293228149414, -14.039246559143066, -13.400200843811035, -12.761154174804688, -12.122108459472656, -11.483062744140625, -10.844016075134277, -10.204970359802246, -9.565923690795898, -8.926877975463867, -8.287832260131836, -7.648785591125488, -7.009739875793457, -6.370693683624268, -5.731647491455078, -5.092601776123047, -4.453555583953857, -3.814509391784668, -3.1754631996154785, -2.536417245864868, -1.8973711729049683, -1.2583250999450684, -0.6192789077758789, 0.019767045974731445, 0.6588129997253418, 1.2978572845458984, 1.9369033575057983, 2.5759494304656982, 3.2149953842163086, 3.854041576385498, 4.4930877685546875, 5.132133483886719, 5.771179676055908, 6.410225868225098, 7.049272060394287, 7.688318252563477, 8.327363967895508, 8.966409683227539, 9.605456352233887, 10.244502067565918, 10.883548736572266, 11.522594451904297, 12.161640167236328, 12.800686836242676, 13.439732551574707, 14.078779220581055, 14.717824935913086, 15.356870651245117, 15.995916366577148, 16.634963989257812, 17.274009704589844, 17.913055419921875, 18.55210304260254, 19.19114875793457, 19.8301944732666, 20.469240188598633, 21.108285903930664, 21.747331619262695]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 23.0, 40.0, 47.0, 83.0, 139.0, 219.0, 351.0, 547.0, 862.0, 1376.0, 2294.0, 3700.0, 5744.0, 9258.0, 14192.0, 21365.0, 31988.0, 45134.0, 61576.0, 79616.0, 95348.0, 107170.0, 110631.0, 105675.0, 92225.0, 75509.0, 57859.0, 41759.0, 29374.0, 19502.0, 12801.0, 8296.0, 5187.0, 3248.0, 2024.0, 1281.0, 766.0, 516.0, 308.0, 178.0, 119.0, 87.0, 43.0, 37.0, 13.0, 15.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -12.23974609375, -11.8232421875, -11.40673828125, -10.990234375, -10.57373046875, -10.1572265625, -9.74072265625, -9.32421875, -8.90771484375, -8.4912109375, -8.07470703125, -7.658203125, -7.24169921875, -6.8251953125, -6.40869140625, -5.9921875, -5.57568359375, -5.1591796875, -4.74267578125, -4.326171875, -3.90966796875, -3.4931640625, -3.07666015625, -2.66015625, -2.24365234375, -1.8271484375, -1.41064453125, -0.994140625, -0.57763671875, -0.1611328125, 0.25537109375, 0.671875, 1.08837890625, 1.5048828125, 1.92138671875, 2.337890625, 2.75439453125, 3.1708984375, 3.58740234375, 4.00390625, 4.42041015625, 4.8369140625, 5.25341796875, 5.669921875, 6.08642578125, 6.5029296875, 6.91943359375, 7.3359375, 7.75244140625, 8.1689453125, 8.58544921875, 9.001953125, 9.41845703125, 9.8349609375, 10.25146484375, 10.66796875, 11.08447265625, 11.5009765625, 11.91748046875, 12.333984375, 12.75048828125, 13.1669921875, 13.58349609375, 14.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 7.0, 7.0, 9.0, 12.0, 8.0, 17.0, 9.0, 20.0, 15.0, 20.0, 33.0, 29.0, 33.0, 35.0, 52.0, 44.0, 41.0, 49.0, 56.0, 46.0, 35.0, 39.0, 39.0, 45.0, 40.0, 45.0, 37.0, 20.0, 27.0, 34.0, 17.0, 15.0, 17.0, 9.0, 9.0, 3.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1396484375, -16.529296875, -15.9189453125, -15.30859375, -14.6982421875, -14.087890625, -13.4775390625, -12.8671875, -12.2568359375, -11.646484375, -11.0361328125, -10.42578125, -9.8154296875, -9.205078125, -8.5947265625, -7.984375, -7.3740234375, -6.763671875, -6.1533203125, -5.54296875, -4.9326171875, -4.322265625, -3.7119140625, -3.1015625, -2.4912109375, -1.880859375, -1.2705078125, -0.66015625, -0.0498046875, 0.560546875, 1.1708984375, 1.78125, 2.3916015625, 3.001953125, 3.6123046875, 4.22265625, 4.8330078125, 5.443359375, 6.0537109375, 6.6640625, 7.2744140625, 7.884765625, 8.4951171875, 9.10546875, 9.7158203125, 10.326171875, 10.9365234375, 11.546875, 12.1572265625, 12.767578125, 13.3779296875, 13.98828125, 14.5986328125, 15.208984375, 15.8193359375, 16.4296875, 17.0400390625, 17.650390625, 18.2607421875, 18.87109375, 19.4814453125, 20.091796875, 20.7021484375, 21.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 17.0, 40.0, 49.0, 75.0, 122.0, 202.0, 336.0, 504.0, 829.0, 1263.0, 1979.0, 3170.0, 4788.0, 7511.0, 11627.0, 17717.0, 26335.0, 37884.0, 52742.0, 69714.0, 87210.0, 102046.0, 110081.0, 108549.0, 99135.0, 83881.0, 66099.0, 48816.0, 35689.0, 24176.0, 16165.0, 10672.0, 6939.0, 4570.0, 2770.0, 1838.0, 1086.0, 685.0, 460.0, 256.0, 194.0, 116.0, 67.0, 50.0, 37.0, 19.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-14.21875, -13.7864990234375, -13.354248046875, -12.9219970703125, -12.48974609375, -12.0574951171875, -11.625244140625, -11.1929931640625, -10.7607421875, -10.3284912109375, -9.896240234375, -9.4639892578125, -9.03173828125, -8.5994873046875, -8.167236328125, -7.7349853515625, -7.302734375, -6.8704833984375, -6.438232421875, -6.0059814453125, -5.57373046875, -5.1414794921875, -4.709228515625, -4.2769775390625, -3.8447265625, -3.4124755859375, -2.980224609375, -2.5479736328125, -2.11572265625, -1.6834716796875, -1.251220703125, -0.8189697265625, -0.38671875, 0.0455322265625, 0.477783203125, 0.9100341796875, 1.34228515625, 1.7745361328125, 2.206787109375, 2.6390380859375, 3.0712890625, 3.5035400390625, 3.935791015625, 4.3680419921875, 4.80029296875, 5.2325439453125, 5.664794921875, 6.0970458984375, 6.529296875, 6.9615478515625, 7.393798828125, 7.8260498046875, 8.25830078125, 8.6905517578125, 9.122802734375, 9.5550537109375, 9.9873046875, 10.4195556640625, 10.851806640625, 11.2840576171875, 11.71630859375, 12.1485595703125, 12.580810546875, 13.0130615234375, 13.4453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 16.0, 7.0, 17.0, 13.0, 20.0, 19.0, 17.0, 21.0, 24.0, 31.0, 25.0, 27.0, 32.0, 39.0, 32.0, 40.0, 32.0, 41.0, 39.0, 43.0, 39.0, 26.0, 40.0, 26.0, 37.0, 26.0, 29.0, 26.0, 18.0, 24.0, 17.0, 16.0, 16.0, 10.0, 12.0, 12.0, 12.0, 7.0, 9.0, 10.0, 3.0, 2.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.8515625, -9.522705078125, -9.19384765625, -8.864990234375, -8.5361328125, -8.207275390625, -7.87841796875, -7.549560546875, -7.220703125, -6.891845703125, -6.56298828125, -6.234130859375, -5.9052734375, -5.576416015625, -5.24755859375, -4.918701171875, -4.58984375, -4.260986328125, -3.93212890625, -3.603271484375, -3.2744140625, -2.945556640625, -2.61669921875, -2.287841796875, -1.958984375, -1.630126953125, -1.30126953125, -0.972412109375, -0.6435546875, -0.314697265625, 0.01416015625, 0.343017578125, 0.671875, 1.000732421875, 1.32958984375, 1.658447265625, 1.9873046875, 2.316162109375, 2.64501953125, 2.973876953125, 3.302734375, 3.631591796875, 3.96044921875, 4.289306640625, 4.6181640625, 4.947021484375, 5.27587890625, 5.604736328125, 5.93359375, 6.262451171875, 6.59130859375, 6.920166015625, 7.2490234375, 7.577880859375, 7.90673828125, 8.235595703125, 8.564453125, 8.893310546875, 9.22216796875, 9.551025390625, 9.8798828125, 10.208740234375, 10.53759765625, 10.866455078125, 11.1953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 9.0, 8.0, 11.0, 30.0, 32.0, 44.0, 79.0, 99.0, 136.0, 182.0, 294.0, 420.0, 580.0, 882.0, 1361.0, 2055.0, 3123.0, 4857.0, 7472.0, 11691.0, 18530.0, 29742.0, 47680.0, 73726.0, 107493.0, 138447.0, 152840.0, 138906.0, 106550.0, 73089.0, 47489.0, 29191.0, 18466.0, 11512.0, 7427.0, 4814.0, 3072.0, 2010.0, 1346.0, 913.0, 601.0, 408.0, 283.0, 193.0, 132.0, 100.0, 73.0, 36.0, 30.0, 34.0, 18.0, 16.0, 12.0, 4.0, 5.0, 4.0, 2.0], "bins": [-6.84765625, -6.6431884765625, -6.438720703125, -6.2342529296875, -6.02978515625, -5.8253173828125, -5.620849609375, -5.4163818359375, -5.2119140625, -5.0074462890625, -4.802978515625, -4.5985107421875, -4.39404296875, -4.1895751953125, -3.985107421875, -3.7806396484375, -3.576171875, -3.3717041015625, -3.167236328125, -2.9627685546875, -2.75830078125, -2.5538330078125, -2.349365234375, -2.1448974609375, -1.9404296875, -1.7359619140625, -1.531494140625, -1.3270263671875, -1.12255859375, -0.9180908203125, -0.713623046875, -0.5091552734375, -0.3046875, -0.1002197265625, 0.104248046875, 0.3087158203125, 0.51318359375, 0.7176513671875, 0.922119140625, 1.1265869140625, 1.3310546875, 1.5355224609375, 1.739990234375, 1.9444580078125, 2.14892578125, 2.3533935546875, 2.557861328125, 2.7623291015625, 2.966796875, 3.1712646484375, 3.375732421875, 3.5802001953125, 3.78466796875, 3.9891357421875, 4.193603515625, 4.3980712890625, 4.6025390625, 4.8070068359375, 5.011474609375, 5.2159423828125, 5.42041015625, 5.6248779296875, 5.829345703125, 6.0338134765625, 6.23828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 21.0, 19.0, 12.0, 19.0, 19.0, 19.0, 30.0, 35.0, 47.0, 45.0, 53.0, 60.0, 62.0, 50.0, 58.0, 57.0, 53.0, 40.0, 52.0, 42.0, 38.0, 20.0, 21.0, 21.0, 15.0, 9.0, 12.0, 15.0, 9.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007724761962890625, -0.000749543309211731, -0.0007266104221343994, -0.0007036775350570679, -0.0006807446479797363, -0.0006578117609024048, -0.0006348788738250732, -0.0006119459867477417, -0.0005890130996704102, -0.0005660802125930786, -0.0005431473255157471, -0.0005202144384384155, -0.000497281551361084, -0.00047434866428375244, -0.0004514157772064209, -0.00042848289012908936, -0.0004055500030517578, -0.00038261711597442627, -0.0003596842288970947, -0.0003367513418197632, -0.00031381845474243164, -0.0002908855676651001, -0.00026795268058776855, -0.000245019793510437, -0.00022208690643310547, -0.00019915401935577393, -0.00017622113227844238, -0.00015328824520111084, -0.0001303553581237793, -0.00010742247104644775, -8.448958396911621e-05, -6.155669689178467e-05, -3.8623809814453125e-05, -1.5690922737121582e-05, 7.241964340209961e-06, 3.0174851417541504e-05, 5.310773849487305e-05, 7.604062557220459e-05, 9.897351264953613e-05, 0.00012190639972686768, 0.00014483928680419922, 0.00016777217388153076, 0.0001907050609588623, 0.00021363794803619385, 0.0002365708351135254, 0.00025950372219085693, 0.0002824366092681885, 0.00030536949634552, 0.00032830238342285156, 0.0003512352705001831, 0.00037416815757751465, 0.0003971010446548462, 0.00042003393173217773, 0.0004429668188095093, 0.0004658997058868408, 0.0004888325929641724, 0.0005117654800415039, 0.0005346983671188354, 0.000557631254196167, 0.0005805641412734985, 0.0006034970283508301, 0.0006264299154281616, 0.0006493628025054932, 0.0006722956895828247, 0.0006952285766601562]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 11.0, 21.0, 28.0, 46.0, 74.0, 113.0, 152.0, 246.0, 421.0, 637.0, 1043.0, 1619.0, 2558.0, 3998.0, 6589.0, 10171.0, 16059.0, 25053.0, 38641.0, 57283.0, 80595.0, 106091.0, 126257.0, 131772.0, 121117.0, 99011.0, 73144.0, 51168.0, 33988.0, 22389.0, 14058.0, 9020.0, 5672.0, 3506.0, 2144.0, 1383.0, 921.0, 523.0, 379.0, 244.0, 162.0, 76.0, 61.0, 48.0, 25.0, 14.0, 12.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.7935791015625, -5.614501953125, -5.4354248046875, -5.25634765625, -5.0772705078125, -4.898193359375, -4.7191162109375, -4.5400390625, -4.3609619140625, -4.181884765625, -4.0028076171875, -3.82373046875, -3.6446533203125, -3.465576171875, -3.2864990234375, -3.107421875, -2.9283447265625, -2.749267578125, -2.5701904296875, -2.39111328125, -2.2120361328125, -2.032958984375, -1.8538818359375, -1.6748046875, -1.4957275390625, -1.316650390625, -1.1375732421875, -0.95849609375, -0.7794189453125, -0.600341796875, -0.4212646484375, -0.2421875, -0.0631103515625, 0.115966796875, 0.2950439453125, 0.47412109375, 0.6531982421875, 0.832275390625, 1.0113525390625, 1.1904296875, 1.3695068359375, 1.548583984375, 1.7276611328125, 1.90673828125, 2.0858154296875, 2.264892578125, 2.4439697265625, 2.623046875, 2.8021240234375, 2.981201171875, 3.1602783203125, 3.33935546875, 3.5184326171875, 3.697509765625, 3.8765869140625, 4.0556640625, 4.2347412109375, 4.413818359375, 4.5928955078125, 4.77197265625, 4.9510498046875, 5.130126953125, 5.3092041015625, 5.48828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 7.0, 8.0, 12.0, 11.0, 10.0, 14.0, 25.0, 24.0, 27.0, 33.0, 36.0, 42.0, 38.0, 52.0, 50.0, 58.0, 58.0, 51.0, 68.0, 51.0, 47.0, 39.0, 38.0, 35.0, 23.0, 18.0, 25.0, 17.0, 23.0, 13.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.887420654296875, -2.79437255859375, -2.701324462890625, -2.6082763671875, -2.515228271484375, -2.42218017578125, -2.329132080078125, -2.236083984375, -2.143035888671875, -2.04998779296875, -1.956939697265625, -1.8638916015625, -1.770843505859375, -1.67779541015625, -1.584747314453125, -1.49169921875, -1.398651123046875, -1.30560302734375, -1.212554931640625, -1.1195068359375, -1.026458740234375, -0.93341064453125, -0.840362548828125, -0.747314453125, -0.654266357421875, -0.56121826171875, -0.468170166015625, -0.3751220703125, -0.282073974609375, -0.18902587890625, -0.095977783203125, -0.0029296875, 0.090118408203125, 0.18316650390625, 0.276214599609375, 0.3692626953125, 0.462310791015625, 0.55535888671875, 0.648406982421875, 0.741455078125, 0.834503173828125, 0.92755126953125, 1.020599365234375, 1.1136474609375, 1.206695556640625, 1.29974365234375, 1.392791748046875, 1.48583984375, 1.578887939453125, 1.67193603515625, 1.764984130859375, 1.8580322265625, 1.951080322265625, 2.04412841796875, 2.137176513671875, 2.230224609375, 2.323272705078125, 2.41632080078125, 2.509368896484375, 2.6024169921875, 2.695465087890625, 2.78851318359375, 2.881561279296875, 2.974609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 11.0, 11.0, 16.0, 18.0, 19.0, 28.0, 20.0, 20.0, 27.0, 30.0, 27.0, 45.0, 48.0, 37.0, 43.0, 57.0, 51.0, 55.0, 56.0, 47.0, 46.0, 32.0, 36.0, 33.0, 32.0, 24.0, 17.0, 17.0, 17.0, 20.0, 11.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.530940055847168, -15.007871627807617, -14.484803199768066, -13.961734771728516, -13.438666343688965, -12.915597915649414, -12.392528533935547, -11.869461059570312, -11.346391677856445, -10.823323249816895, -10.300254821777344, -9.777186393737793, -9.254117965698242, -8.731049537658691, -8.20798110961914, -7.684912204742432, -7.161844253540039, -6.638775825500488, -6.1157073974609375, -5.592638969421387, -5.069570541381836, -4.546502113342285, -4.023433208465576, -3.5003647804260254, -2.9772963523864746, -2.454227924346924, -1.9311593770980835, -1.4080908298492432, -0.8850224018096924, -0.3619539737701416, 0.16111469268798828, 0.6841831207275391, 1.2072525024414062, 1.730320930480957, 2.253389358520508, 2.7764580249786377, 3.2995264530181885, 3.8225948810577393, 4.345663547515869, 4.86873197555542, 5.391800403594971, 5.9148688316345215, 6.437937259674072, 6.961006164550781, 7.484074592590332, 8.007143020629883, 8.530211448669434, 9.053279876708984, 9.576348304748535, 10.099416732788086, 10.622485160827637, 11.145553588867188, 11.668622016906738, 12.191690444946289, 12.714759826660156, 13.23782730102539, 13.760896682739258, 14.283965110778809, 14.80703353881836, 15.33010196685791, 15.853170394897461, 16.376239776611328, 16.899307250976562, 17.42237663269043, 17.945444107055664]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 10.0, 4.0, 10.0, 15.0, 14.0, 21.0, 21.0, 18.0, 21.0, 31.0, 38.0, 31.0, 34.0, 37.0, 40.0, 46.0, 47.0, 43.0, 36.0, 45.0, 47.0, 43.0, 53.0, 44.0, 32.0, 25.0, 22.0, 33.0, 20.0, 17.0, 9.0, 21.0, 17.0, 8.0, 4.0, 8.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.78479766845703, -19.147563934326172, -18.51032829284668, -17.87309455871582, -17.235858917236328, -16.59862518310547, -15.961389541625977, -15.324155807495117, -14.686920166015625, -14.04968547821045, -13.412450790405273, -12.775216102600098, -12.137981414794922, -11.500746726989746, -10.86351203918457, -10.226278305053711, -9.589043617248535, -8.95180892944336, -8.314574241638184, -7.677339553833008, -7.040104866027832, -6.402870178222656, -5.765635967254639, -5.128401279449463, -4.491166591644287, -3.8539319038391113, -3.2166972160339355, -2.579462766647339, -1.942228078842163, -1.3049933910369873, -0.6677589416503906, -0.030524253845214844, 0.6067104339599609, 1.2439451217651367, 1.881179690361023, 2.518414258956909, 3.155648946762085, 3.7928836345672607, 4.430118083953857, 5.067352771759033, 5.704587459564209, 6.341822147369385, 6.9790568351745605, 7.616291046142578, 8.253525733947754, 8.89076042175293, 9.527995109558105, 10.165229797363281, 10.802464485168457, 11.439699172973633, 12.076933860778809, 12.714168548583984, 13.35140323638916, 13.988637924194336, 14.625871658325195, 15.263107299804688, 15.900341033935547, 16.537574768066406, 17.1748104095459, 17.812044143676758, 18.44927978515625, 19.08651351928711, 19.7237491607666, 20.36098289489746, 20.998218536376953]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 13.0, 20.0, 61.0, 101.0, 155.0, 234.0, 417.0, 671.0, 1169.0, 1878.0, 3090.0, 5027.0, 8764.0, 14563.0, 24310.0, 39497.0, 63377.0, 101108.0, 154711.0, 228799.0, 317742.0, 410911.0, 482666.0, 508195.0, 480856.0, 407056.0, 312212.0, 222751.0, 149995.0, 96206.0, 61458.0, 38003.0, 23015.0, 13986.0, 8299.0, 5129.0, 3103.0, 1834.0, 1075.0, 664.0, 447.0, 273.0, 152.0, 98.0, 72.0, 35.0, 21.0, 17.0, 9.0, 6.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2586669921875, -10.876708984375, -10.4947509765625, -10.11279296875, -9.7308349609375, -9.348876953125, -8.9669189453125, -8.5849609375, -8.2030029296875, -7.821044921875, -7.4390869140625, -7.05712890625, -6.6751708984375, -6.293212890625, -5.9112548828125, -5.529296875, -5.1473388671875, -4.765380859375, -4.3834228515625, -4.00146484375, -3.6195068359375, -3.237548828125, -2.8555908203125, -2.4736328125, -2.0916748046875, -1.709716796875, -1.3277587890625, -0.94580078125, -0.5638427734375, -0.181884765625, 0.2000732421875, 0.58203125, 0.9639892578125, 1.345947265625, 1.7279052734375, 2.10986328125, 2.4918212890625, 2.873779296875, 3.2557373046875, 3.6376953125, 4.0196533203125, 4.401611328125, 4.7835693359375, 5.16552734375, 5.5474853515625, 5.929443359375, 6.3114013671875, 6.693359375, 7.0753173828125, 7.457275390625, 7.8392333984375, 8.22119140625, 8.6031494140625, 8.985107421875, 9.3670654296875, 9.7490234375, 10.1309814453125, 10.512939453125, 10.8948974609375, 11.27685546875, 11.6588134765625, 12.040771484375, 12.4227294921875, 12.8046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 4.0, 8.0, 5.0, 10.0, 12.0, 16.0, 27.0, 22.0, 31.0, 19.0, 26.0, 30.0, 36.0, 39.0, 38.0, 39.0, 40.0, 38.0, 38.0, 40.0, 46.0, 45.0, 35.0, 48.0, 42.0, 43.0, 32.0, 24.0, 21.0, 26.0, 11.0, 17.0, 19.0, 10.0, 6.0, 12.0, 8.0, 3.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3671875, -12.9053955078125, -12.443603515625, -11.9818115234375, -11.52001953125, -11.0582275390625, -10.596435546875, -10.1346435546875, -9.6728515625, -9.2110595703125, -8.749267578125, -8.2874755859375, -7.82568359375, -7.3638916015625, -6.902099609375, -6.4403076171875, -5.978515625, -5.5167236328125, -5.054931640625, -4.5931396484375, -4.13134765625, -3.6695556640625, -3.207763671875, -2.7459716796875, -2.2841796875, -1.8223876953125, -1.360595703125, -0.8988037109375, -0.43701171875, 0.0247802734375, 0.486572265625, 0.9483642578125, 1.41015625, 1.8719482421875, 2.333740234375, 2.7955322265625, 3.25732421875, 3.7191162109375, 4.180908203125, 4.6427001953125, 5.1044921875, 5.5662841796875, 6.028076171875, 6.4898681640625, 6.95166015625, 7.4134521484375, 7.875244140625, 8.3370361328125, 8.798828125, 9.2606201171875, 9.722412109375, 10.1842041015625, 10.64599609375, 11.1077880859375, 11.569580078125, 12.0313720703125, 12.4931640625, 12.9549560546875, 13.416748046875, 13.8785400390625, 14.34033203125, 14.8021240234375, 15.263916015625, 15.7257080078125, 16.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 18.0, 17.0, 26.0, 53.0, 91.0, 126.0, 237.0, 368.0, 634.0, 1098.0, 1745.0, 2853.0, 4702.0, 7520.0, 12377.0, 20120.0, 31733.0, 49787.0, 75187.0, 110413.0, 157735.0, 214909.0, 280260.0, 341432.0, 392349.0, 420767.0, 418210.0, 386854.0, 333944.0, 269651.0, 206354.0, 150687.0, 105407.0, 71127.0, 46869.0, 29677.0, 18986.0, 11705.0, 7335.0, 4374.0, 2602.0, 1580.0, 941.0, 562.0, 371.0, 187.0, 117.0, 82.0, 44.0, 28.0, 19.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-10.8359375, -10.49658203125, -10.1572265625, -9.81787109375, -9.478515625, -9.13916015625, -8.7998046875, -8.46044921875, -8.12109375, -7.78173828125, -7.4423828125, -7.10302734375, -6.763671875, -6.42431640625, -6.0849609375, -5.74560546875, -5.40625, -5.06689453125, -4.7275390625, -4.38818359375, -4.048828125, -3.70947265625, -3.3701171875, -3.03076171875, -2.69140625, -2.35205078125, -2.0126953125, -1.67333984375, -1.333984375, -0.99462890625, -0.6552734375, -0.31591796875, 0.0234375, 0.36279296875, 0.7021484375, 1.04150390625, 1.380859375, 1.72021484375, 2.0595703125, 2.39892578125, 2.73828125, 3.07763671875, 3.4169921875, 3.75634765625, 4.095703125, 4.43505859375, 4.7744140625, 5.11376953125, 5.453125, 5.79248046875, 6.1318359375, 6.47119140625, 6.810546875, 7.14990234375, 7.4892578125, 7.82861328125, 8.16796875, 8.50732421875, 8.8466796875, 9.18603515625, 9.525390625, 9.86474609375, 10.2041015625, 10.54345703125, 10.8828125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 7.0, 18.0, 16.0, 27.0, 29.0, 45.0, 59.0, 72.0, 69.0, 85.0, 121.0, 124.0, 140.0, 154.0, 170.0, 184.0, 206.0, 219.0, 203.0, 239.0, 220.0, 194.0, 191.0, 190.0, 153.0, 139.0, 143.0, 114.0, 103.0, 81.0, 76.0, 52.0, 53.0, 36.0, 19.0, 22.0, 28.0, 14.0, 7.0, 15.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-6.9140625, -6.70562744140625, -6.4971923828125, -6.28875732421875, -6.080322265625, -5.87188720703125, -5.6634521484375, -5.45501708984375, -5.24658203125, -5.03814697265625, -4.8297119140625, -4.62127685546875, -4.412841796875, -4.20440673828125, -3.9959716796875, -3.78753662109375, -3.5791015625, -3.37066650390625, -3.1622314453125, -2.95379638671875, -2.745361328125, -2.53692626953125, -2.3284912109375, -2.12005615234375, -1.91162109375, -1.70318603515625, -1.4947509765625, -1.28631591796875, -1.077880859375, -0.86944580078125, -0.6610107421875, -0.45257568359375, -0.244140625, -0.03570556640625, 0.1727294921875, 0.38116455078125, 0.589599609375, 0.79803466796875, 1.0064697265625, 1.21490478515625, 1.42333984375, 1.63177490234375, 1.8402099609375, 2.04864501953125, 2.257080078125, 2.46551513671875, 2.6739501953125, 2.88238525390625, 3.0908203125, 3.29925537109375, 3.5076904296875, 3.71612548828125, 3.924560546875, 4.13299560546875, 4.3414306640625, 4.54986572265625, 4.75830078125, 4.96673583984375, 5.1751708984375, 5.38360595703125, 5.592041015625, 5.80047607421875, 6.0089111328125, 6.21734619140625, 6.42578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 16.0, 12.0, 14.0, 13.0, 18.0, 15.0, 25.0, 23.0, 37.0, 33.0, 37.0, 50.0, 54.0, 41.0, 65.0, 50.0, 48.0, 36.0, 43.0, 33.0, 37.0, 51.0, 38.0, 29.0, 36.0, 20.0, 19.0, 21.0, 16.0, 11.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.11312484741211, -12.629949569702148, -12.146774291992188, -11.663599014282227, -11.180423736572266, -10.697248458862305, -10.214073181152344, -9.7308988571167, -9.247723579406738, -8.764548301696777, -8.281373023986816, -7.7981977462768555, -7.315022945404053, -6.831847667694092, -6.348672389984131, -5.865497589111328, -5.382321834564209, -4.899146556854248, -4.415971279144287, -3.9327962398529053, -3.4496212005615234, -2.9664459228515625, -2.4832706451416016, -2.0000956058502197, -1.5169203281402588, -1.0337451696395874, -0.5505699515342712, -0.06739473342895508, 0.4157804250717163, 0.8989555835723877, 1.3821308612823486, 1.8653059005737305, 2.3484811782836914, 2.8316564559936523, 3.314831495285034, 3.798006772994995, 4.281181812286377, 4.764357089996338, 5.247532367706299, 5.730707168579102, 6.2138824462890625, 6.697057723999023, 7.180233001708984, 7.663408279418945, 8.146583557128906, 8.629758834838867, 9.112934112548828, 9.596108436584473, 10.07928466796875, 10.562459945678711, 11.045635223388672, 11.528810501098633, 12.011985778808594, 12.495161056518555, 12.978336334228516, 13.46151065826416, 13.944685935974121, 14.427861213684082, 14.911036491394043, 15.394211769104004, 15.877387046813965, 16.36056137084961, 16.84373664855957, 17.32691192626953, 17.810087203979492]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 6.0, 7.0, 13.0, 14.0, 13.0, 17.0, 21.0, 20.0, 32.0, 27.0, 42.0, 23.0, 32.0, 35.0, 35.0, 36.0, 53.0, 41.0, 61.0, 32.0, 38.0, 57.0, 25.0, 38.0, 39.0, 28.0, 31.0, 29.0, 23.0, 28.0, 21.0, 13.0, 8.0, 10.0, 7.0, 8.0, 7.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.314741134643555, -17.746463775634766, -17.17818832397461, -16.60991096496582, -16.04163360595703, -15.473356246948242, -14.90507984161377, -14.336803436279297, -13.768526077270508, -13.200248718261719, -12.631972312927246, -12.063695907592773, -11.495418548583984, -10.927141189575195, -10.358864784240723, -9.79058837890625, -9.222311019897461, -8.654033660888672, -8.0857572555542, -7.517480373382568, -6.9492034912109375, -6.380926609039307, -5.812649726867676, -5.244372844696045, -4.676095962524414, -4.107819080352783, -3.5395421981811523, -2.9712653160095215, -2.4029884338378906, -1.8347115516662598, -1.266434669494629, -0.698157787322998, -0.12987899780273438, 0.4383978843688965, 1.0066747665405273, 1.5749516487121582, 2.143228530883789, 2.71150541305542, 3.279782295227051, 3.8480591773986816, 4.4163360595703125, 4.984612941741943, 5.552889823913574, 6.121166706085205, 6.689443588256836, 7.257720470428467, 7.825997352600098, 8.39427375793457, 8.96255111694336, 9.530828475952148, 10.099104881286621, 10.667381286621094, 11.235658645629883, 11.803936004638672, 12.372212409973145, 12.940488815307617, 13.508766174316406, 14.077043533325195, 14.645319938659668, 15.21359634399414, 15.78187370300293, 16.35015106201172, 16.918426513671875, 17.486703872680664, 18.054981231689453]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 14.0, 10.0, 19.0, 26.0, 34.0, 63.0, 91.0, 166.0, 181.0, 328.0, 507.0, 837.0, 1351.0, 2252.0, 3881.0, 6885.0, 11872.0, 20455.0, 35503.0, 60069.0, 95320.0, 138621.0, 168983.0, 163741.0, 126732.0, 84683.0, 52721.0, 30983.0, 17580.0, 10174.0, 5860.0, 3418.0, 2090.0, 1136.0, 733.0, 421.0, 279.0, 181.0, 112.0, 75.0, 49.0, 33.0, 26.0, 14.0, 7.0, 8.0, 4.0, 9.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.01226806640625, -3.8682861328125, -3.72430419921875, -3.580322265625, -3.43634033203125, -3.2923583984375, -3.14837646484375, -3.00439453125, -2.86041259765625, -2.7164306640625, -2.57244873046875, -2.428466796875, -2.28448486328125, -2.1405029296875, -1.99652099609375, -1.8525390625, -1.70855712890625, -1.5645751953125, -1.42059326171875, -1.276611328125, -1.13262939453125, -0.9886474609375, -0.84466552734375, -0.70068359375, -0.55670166015625, -0.4127197265625, -0.26873779296875, -0.124755859375, 0.01922607421875, 0.1632080078125, 0.30718994140625, 0.451171875, 0.59515380859375, 0.7391357421875, 0.88311767578125, 1.027099609375, 1.17108154296875, 1.3150634765625, 1.45904541015625, 1.60302734375, 1.74700927734375, 1.8909912109375, 2.03497314453125, 2.178955078125, 2.32293701171875, 2.4669189453125, 2.61090087890625, 2.7548828125, 2.89886474609375, 3.0428466796875, 3.18682861328125, 3.330810546875, 3.47479248046875, 3.6187744140625, 3.76275634765625, 3.90673828125, 4.05072021484375, 4.1947021484375, 4.33868408203125, 4.482666015625, 4.62664794921875, 4.7706298828125, 4.91461181640625, 5.05859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 9.0, 6.0, 5.0, 12.0, 13.0, 19.0, 26.0, 25.0, 21.0, 24.0, 32.0, 43.0, 33.0, 34.0, 36.0, 43.0, 50.0, 39.0, 48.0, 38.0, 35.0, 48.0, 34.0, 35.0, 38.0, 31.0, 29.0, 27.0, 29.0, 19.0, 17.0, 18.0, 12.0, 11.0, 6.0, 12.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.328125, -18.7626953125, -18.197265625, -17.6318359375, -17.06640625, -16.5009765625, -15.935546875, -15.3701171875, -14.8046875, -14.2392578125, -13.673828125, -13.1083984375, -12.54296875, -11.9775390625, -11.412109375, -10.8466796875, -10.28125, -9.7158203125, -9.150390625, -8.5849609375, -8.01953125, -7.4541015625, -6.888671875, -6.3232421875, -5.7578125, -5.1923828125, -4.626953125, -4.0615234375, -3.49609375, -2.9306640625, -2.365234375, -1.7998046875, -1.234375, -0.6689453125, -0.103515625, 0.4619140625, 1.02734375, 1.5927734375, 2.158203125, 2.7236328125, 3.2890625, 3.8544921875, 4.419921875, 4.9853515625, 5.55078125, 6.1162109375, 6.681640625, 7.2470703125, 7.8125, 8.3779296875, 8.943359375, 9.5087890625, 10.07421875, 10.6396484375, 11.205078125, 11.7705078125, 12.3359375, 12.9013671875, 13.466796875, 14.0322265625, 14.59765625, 15.1630859375, 15.728515625, 16.2939453125, 16.859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 21.0, 12.0, 18.0, 36.0, 63.0, 78.0, 131.0, 225.0, 326.0, 495.0, 875.0, 1364.0, 2166.0, 3785.0, 6245.0, 10792.0, 18143.0, 30383.0, 49797.0, 77139.0, 111102.0, 142689.0, 156261.0, 140093.0, 106533.0, 72995.0, 46476.0, 28537.0, 17256.0, 9923.0, 5731.0, 3473.0, 2057.0, 1311.0, 766.0, 464.0, 282.0, 184.0, 108.0, 73.0, 52.0, 25.0, 28.0, 10.0, 11.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.035064697265625, -2.93536376953125, -2.835662841796875, -2.7359619140625, -2.636260986328125, -2.53656005859375, -2.436859130859375, -2.337158203125, -2.237457275390625, -2.13775634765625, -2.038055419921875, -1.9383544921875, -1.838653564453125, -1.73895263671875, -1.639251708984375, -1.53955078125, -1.439849853515625, -1.34014892578125, -1.240447998046875, -1.1407470703125, -1.041046142578125, -0.94134521484375, -0.841644287109375, -0.741943359375, -0.642242431640625, -0.54254150390625, -0.442840576171875, -0.3431396484375, -0.243438720703125, -0.14373779296875, -0.044036865234375, 0.0556640625, 0.155364990234375, 0.25506591796875, 0.354766845703125, 0.4544677734375, 0.554168701171875, 0.65386962890625, 0.753570556640625, 0.853271484375, 0.952972412109375, 1.05267333984375, 1.152374267578125, 1.2520751953125, 1.351776123046875, 1.45147705078125, 1.551177978515625, 1.65087890625, 1.750579833984375, 1.85028076171875, 1.949981689453125, 2.0496826171875, 2.149383544921875, 2.24908447265625, 2.348785400390625, 2.448486328125, 2.548187255859375, 2.64788818359375, 2.747589111328125, 2.8472900390625, 2.946990966796875, 3.04669189453125, 3.146392822265625, 3.24609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 7.0, 9.0, 8.0, 9.0, 12.0, 12.0, 13.0, 17.0, 16.0, 19.0, 26.0, 21.0, 35.0, 28.0, 27.0, 47.0, 41.0, 25.0, 36.0, 53.0, 42.0, 34.0, 36.0, 34.0, 34.0, 34.0, 22.0, 43.0, 29.0, 29.0, 24.0, 22.0, 24.0, 27.0, 21.0, 16.0, 18.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.3209228515625, -10.962158203125, -10.6033935546875, -10.24462890625, -9.8858642578125, -9.527099609375, -9.1683349609375, -8.8095703125, -8.4508056640625, -8.092041015625, -7.7332763671875, -7.37451171875, -7.0157470703125, -6.656982421875, -6.2982177734375, -5.939453125, -5.5806884765625, -5.221923828125, -4.8631591796875, -4.50439453125, -4.1456298828125, -3.786865234375, -3.4281005859375, -3.0693359375, -2.7105712890625, -2.351806640625, -1.9930419921875, -1.63427734375, -1.2755126953125, -0.916748046875, -0.5579833984375, -0.19921875, 0.1595458984375, 0.518310546875, 0.8770751953125, 1.23583984375, 1.5946044921875, 1.953369140625, 2.3121337890625, 2.6708984375, 3.0296630859375, 3.388427734375, 3.7471923828125, 4.10595703125, 4.4647216796875, 4.823486328125, 5.1822509765625, 5.541015625, 5.8997802734375, 6.258544921875, 6.6173095703125, 6.97607421875, 7.3348388671875, 7.693603515625, 8.0523681640625, 8.4111328125, 8.7698974609375, 9.128662109375, 9.4874267578125, 9.84619140625, 10.2049560546875, 10.563720703125, 10.9224853515625, 11.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 5.0, 14.0, 9.0, 20.0, 27.0, 31.0, 48.0, 71.0, 127.0, 182.0, 263.0, 423.0, 604.0, 1017.0, 1510.0, 2443.0, 4025.0, 6733.0, 11698.0, 21043.0, 40164.0, 78118.0, 145912.0, 228209.0, 218778.0, 134157.0, 70498.0, 36620.0, 18931.0, 10819.0, 6189.0, 3563.0, 2220.0, 1486.0, 866.0, 607.0, 378.0, 268.0, 160.0, 114.0, 64.0, 49.0, 37.0, 16.0, 18.0, 8.0, 7.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6727828979492188, -0.6468353271484375, -0.6208877563476562, -0.594940185546875, -0.5689926147460938, -0.5430450439453125, -0.5170974731445312, -0.49114990234375, -0.46520233154296875, -0.4392547607421875, -0.41330718994140625, -0.387359619140625, -0.36141204833984375, -0.3354644775390625, -0.30951690673828125, -0.2835693359375, -0.25762176513671875, -0.2316741943359375, -0.20572662353515625, -0.179779052734375, -0.15383148193359375, -0.1278839111328125, -0.10193634033203125, -0.07598876953125, -0.05004119873046875, -0.0240936279296875, 0.00185394287109375, 0.027801513671875, 0.05374908447265625, 0.0796966552734375, 0.10564422607421875, 0.131591796875, 0.15753936767578125, 0.1834869384765625, 0.20943450927734375, 0.235382080078125, 0.26132965087890625, 0.2872772216796875, 0.31322479248046875, 0.33917236328125, 0.36511993408203125, 0.3910675048828125, 0.41701507568359375, 0.442962646484375, 0.46891021728515625, 0.4948577880859375, 0.5208053588867188, 0.5467529296875, 0.5727005004882812, 0.5986480712890625, 0.6245956420898438, 0.650543212890625, 0.6764907836914062, 0.7024383544921875, 0.7283859252929688, 0.75433349609375, 0.7802810668945312, 0.8062286376953125, 0.8321762084960938, 0.858123779296875, 0.8840713500976562, 0.9100189208984375, 0.9359664916992188, 0.9619140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 5.0, 13.0, 21.0, 16.0, 17.0, 23.0, 35.0, 37.0, 51.0, 67.0, 85.0, 87.0, 95.0, 85.0, 73.0, 64.0, 54.0, 44.0, 36.0, 19.0, 14.0, 15.0, 11.0, 4.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024247169494628906, -0.00023613683879375458, -0.0002298019826412201, -0.0002234671264886856, -0.00021713227033615112, -0.00021079741418361664, -0.00020446255803108215, -0.00019812770187854767, -0.00019179284572601318, -0.0001854579895734787, -0.00017912313342094421, -0.00017278827726840973, -0.00016645342111587524, -0.00016011856496334076, -0.00015378370881080627, -0.0001474488526582718, -0.0001411139965057373, -0.00013477914035320282, -0.00012844428420066833, -0.00012210942804813385, -0.00011577457189559937, -0.00010943971574306488, -0.0001031048595905304, -9.677000343799591e-05, -9.043514728546143e-05, -8.410029113292694e-05, -7.776543498039246e-05, -7.143057882785797e-05, -6.509572267532349e-05, -5.8760866522789e-05, -5.2426010370254517e-05, -4.609115421772003e-05, -3.975629806518555e-05, -3.342144191265106e-05, -2.7086585760116577e-05, -2.0751729607582092e-05, -1.4416873455047607e-05, -8.082017302513123e-06, -1.7471611499786377e-06, 4.587695002555847e-06, 1.0922551155090332e-05, 1.7257407307624817e-05, 2.3592263460159302e-05, 2.9927119612693787e-05, 3.626197576522827e-05, 4.2596831917762756e-05, 4.893168807029724e-05, 5.5266544222831726e-05, 6.160140037536621e-05, 6.79362565279007e-05, 7.427111268043518e-05, 8.060596883296967e-05, 8.694082498550415e-05, 9.327568113803864e-05, 9.961053729057312e-05, 0.0001059453934431076, 0.00011228024959564209, 0.00011861510574817657, 0.00012494996190071106, 0.00013128481805324554, 0.00013761967420578003, 0.00014395453035831451, 0.000150289386510849, 0.00015662424266338348, 0.00016295909881591797]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 15.0, 21.0, 36.0, 52.0, 61.0, 124.0, 187.0, 353.0, 622.0, 812.0, 1386.0, 2137.0, 3474.0, 5448.0, 8643.0, 13793.0, 21741.0, 34838.0, 54314.0, 84622.0, 125523.0, 163853.0, 165207.0, 126360.0, 85461.0, 55283.0, 34866.0, 22068.0, 13750.0, 8504.0, 5615.0, 3478.0, 2220.0, 1377.0, 898.0, 521.0, 335.0, 205.0, 129.0, 83.0, 56.0, 33.0, 23.0, 12.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1602020263671875, -1.120208740234375, -1.0802154541015625, -1.04022216796875, -1.0002288818359375, -0.960235595703125, -0.9202423095703125, -0.8802490234375, -0.8402557373046875, -0.800262451171875, -0.7602691650390625, -0.72027587890625, -0.6802825927734375, -0.640289306640625, -0.6002960205078125, -0.560302734375, -0.5203094482421875, -0.480316162109375, -0.4403228759765625, -0.40032958984375, -0.3603363037109375, -0.320343017578125, -0.2803497314453125, -0.2403564453125, -0.2003631591796875, -0.160369873046875, -0.1203765869140625, -0.08038330078125, -0.0403900146484375, -0.000396728515625, 0.0395965576171875, 0.07958984375, 0.1195831298828125, 0.159576416015625, 0.1995697021484375, 0.23956298828125, 0.2795562744140625, 0.319549560546875, 0.3595428466796875, 0.3995361328125, 0.4395294189453125, 0.479522705078125, 0.5195159912109375, 0.55950927734375, 0.5995025634765625, 0.639495849609375, 0.6794891357421875, 0.719482421875, 0.7594757080078125, 0.799468994140625, 0.8394622802734375, 0.87945556640625, 0.9194488525390625, 0.959442138671875, 0.9994354248046875, 1.0394287109375, 1.0794219970703125, 1.119415283203125, 1.1594085693359375, 1.19940185546875, 1.2393951416015625, 1.279388427734375, 1.3193817138671875, 1.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 7.0, 2.0, 6.0, 14.0, 21.0, 14.0, 22.0, 20.0, 37.0, 32.0, 36.0, 37.0, 41.0, 41.0, 47.0, 56.0, 60.0, 55.0, 50.0, 52.0, 46.0, 37.0, 43.0, 27.0, 29.0, 21.0, 25.0, 16.0, 14.0, 6.0, 15.0, 3.0, 10.0, 10.0, 2.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5283203125, -0.5117645263671875, -0.495208740234375, -0.4786529541015625, -0.46209716796875, -0.4455413818359375, -0.428985595703125, -0.4124298095703125, -0.3958740234375, -0.3793182373046875, -0.362762451171875, -0.3462066650390625, -0.32965087890625, -0.3130950927734375, -0.296539306640625, -0.2799835205078125, -0.263427734375, -0.2468719482421875, -0.230316162109375, -0.2137603759765625, -0.19720458984375, -0.1806488037109375, -0.164093017578125, -0.1475372314453125, -0.1309814453125, -0.1144256591796875, -0.097869873046875, -0.0813140869140625, -0.06475830078125, -0.0482025146484375, -0.031646728515625, -0.0150909423828125, 0.00146484375, 0.0180206298828125, 0.034576416015625, 0.0511322021484375, 0.06768798828125, 0.0842437744140625, 0.100799560546875, 0.1173553466796875, 0.1339111328125, 0.1504669189453125, 0.167022705078125, 0.1835784912109375, 0.20013427734375, 0.2166900634765625, 0.233245849609375, 0.2498016357421875, 0.266357421875, 0.2829132080078125, 0.299468994140625, 0.3160247802734375, 0.33258056640625, 0.3491363525390625, 0.365692138671875, 0.3822479248046875, 0.3988037109375, 0.4153594970703125, 0.431915283203125, 0.4484710693359375, 0.46502685546875, 0.4815826416015625, 0.498138427734375, 0.5146942138671875, 0.53125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 11.0, 11.0, 12.0, 17.0, 19.0, 17.0, 15.0, 28.0, 34.0, 24.0, 51.0, 39.0, 49.0, 51.0, 38.0, 61.0, 58.0, 51.0, 36.0, 38.0, 31.0, 40.0, 40.0, 32.0, 29.0, 33.0, 25.0, 15.0, 15.0, 14.0, 13.0, 8.0, 4.0, 8.0, 8.0, 2.0, 0.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.565869331359863, -13.09119701385498, -12.616525650024414, -12.141853332519531, -11.667181968688965, -11.192509651184082, -10.717838287353516, -10.243165969848633, -9.76849365234375, -9.293821334838867, -8.8191499710083, -8.344477653503418, -7.869806289672852, -7.395133972167969, -6.920462131500244, -6.4457902908325195, -5.971118927001953, -5.4964470863342285, -5.021775245666504, -4.547102928161621, -4.072431564331055, -3.597759485244751, -3.1230874061584473, -2.6484155654907227, -2.173743724822998, -1.6990718841552734, -1.2243999242782593, -0.7497279644012451, -0.2750561237335205, 0.1996157169342041, 0.6742877960205078, 1.1489596366882324, 1.6236305236816406, 2.0983023643493652, 2.57297420501709, 3.0476462841033936, 3.522318124771118, 3.9969899654388428, 4.4716620445251465, 4.946333885192871, 5.421005725860596, 5.89567756652832, 6.370349407196045, 6.8450212478637695, 7.319693565368652, 7.794364929199219, 8.269037246704102, 8.743709564208984, 9.21838092803955, 9.693053245544434, 10.167724609375, 10.642396926879883, 11.11706829071045, 11.591740608215332, 12.066411972045898, 12.541084289550781, 13.015756607055664, 13.490428924560547, 13.965100288391113, 14.439772605895996, 14.914443969726562, 15.389116287231445, 15.863788604736328, 16.338459014892578, 16.81313133239746]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 9.0, 9.0, 15.0, 12.0, 14.0, 19.0, 22.0, 25.0, 26.0, 41.0, 26.0, 32.0, 34.0, 37.0, 35.0, 41.0, 42.0, 47.0, 52.0, 38.0, 56.0, 31.0, 34.0, 30.0, 39.0, 33.0, 30.0, 22.0, 30.0, 22.0, 17.0, 12.0, 10.0, 9.0, 6.0, 7.0, 4.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25825309753418, -17.699724197387695, -17.141193389892578, -16.582664489746094, -16.02413558959961, -15.465606689453125, -14.907076835632324, -14.348546981811523, -13.790018081665039, -13.231489181518555, -12.672959327697754, -12.114429473876953, -11.555900573730469, -10.997371673583984, -10.438841819763184, -9.880311965942383, -9.321783065795898, -8.763254165649414, -8.204724311828613, -7.646194934844971, -7.087665557861328, -6.5291361808776855, -5.970606803894043, -5.4120774269104, -4.853548049926758, -4.295018672943115, -3.7364892959594727, -3.17795991897583, -2.6194305419921875, -2.060901165008545, -1.5023717880249023, -0.9438424110412598, -0.3853111267089844, 0.1732182502746582, 0.7317476272583008, 1.2902770042419434, 1.848806381225586, 2.4073357582092285, 2.965865135192871, 3.5243945121765137, 4.082923889160156, 4.641453266143799, 5.199982643127441, 5.758512020111084, 6.317041397094727, 6.875570774078369, 7.434100151062012, 7.992629528045654, 8.551158905029297, 9.109687805175781, 9.668217658996582, 10.226747512817383, 10.785276412963867, 11.343805313110352, 11.902335166931152, 12.460865020751953, 13.019393920898438, 13.577922821044922, 14.136452674865723, 14.694982528686523, 15.253511428833008, 15.812040328979492, 16.37057113647461, 16.929100036621094, 17.487628936767578]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 8.0, 21.0, 32.0, 54.0, 70.0, 95.0, 177.0, 293.0, 429.0, 688.0, 1051.0, 1625.0, 2480.0, 3780.0, 5446.0, 8160.0, 12098.0, 17008.0, 23679.0, 32461.0, 42735.0, 54988.0, 67524.0, 79137.0, 87392.0, 91795.0, 90766.0, 86059.0, 76744.0, 65102.0, 52884.0, 41025.0, 30543.0, 22416.0, 16027.0, 11205.0, 7636.0, 5110.0, 3463.0, 2196.0, 1453.0, 953.0, 640.0, 363.0, 254.0, 170.0, 98.0, 76.0, 55.0, 38.0, 14.0, 14.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0], "bins": [-9.3515625, -9.0584716796875, -8.765380859375, -8.4722900390625, -8.17919921875, -7.8861083984375, -7.593017578125, -7.2999267578125, -7.0068359375, -6.7137451171875, -6.420654296875, -6.1275634765625, -5.83447265625, -5.5413818359375, -5.248291015625, -4.9552001953125, -4.662109375, -4.3690185546875, -4.075927734375, -3.7828369140625, -3.48974609375, -3.1966552734375, -2.903564453125, -2.6104736328125, -2.3173828125, -2.0242919921875, -1.731201171875, -1.4381103515625, -1.14501953125, -0.8519287109375, -0.558837890625, -0.2657470703125, 0.02734375, 0.3204345703125, 0.613525390625, 0.9066162109375, 1.19970703125, 1.4927978515625, 1.785888671875, 2.0789794921875, 2.3720703125, 2.6651611328125, 2.958251953125, 3.2513427734375, 3.54443359375, 3.8375244140625, 4.130615234375, 4.4237060546875, 4.716796875, 5.0098876953125, 5.302978515625, 5.5960693359375, 5.88916015625, 6.1822509765625, 6.475341796875, 6.7684326171875, 7.0615234375, 7.3546142578125, 7.647705078125, 7.9407958984375, 8.23388671875, 8.5269775390625, 8.820068359375, 9.1131591796875, 9.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 12.0, 16.0, 11.0, 18.0, 16.0, 20.0, 35.0, 29.0, 35.0, 35.0, 35.0, 42.0, 44.0, 35.0, 42.0, 47.0, 39.0, 44.0, 59.0, 42.0, 30.0, 34.0, 34.0, 29.0, 31.0, 28.0, 28.0, 19.0, 19.0, 12.0, 5.0, 13.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.78125, -17.221923828125, -16.66259765625, -16.103271484375, -15.5439453125, -14.984619140625, -14.42529296875, -13.865966796875, -13.306640625, -12.747314453125, -12.18798828125, -11.628662109375, -11.0693359375, -10.510009765625, -9.95068359375, -9.391357421875, -8.83203125, -8.272705078125, -7.71337890625, -7.154052734375, -6.5947265625, -6.035400390625, -5.47607421875, -4.916748046875, -4.357421875, -3.798095703125, -3.23876953125, -2.679443359375, -2.1201171875, -1.560791015625, -1.00146484375, -0.442138671875, 0.1171875, 0.676513671875, 1.23583984375, 1.795166015625, 2.3544921875, 2.913818359375, 3.47314453125, 4.032470703125, 4.591796875, 5.151123046875, 5.71044921875, 6.269775390625, 6.8291015625, 7.388427734375, 7.94775390625, 8.507080078125, 9.06640625, 9.625732421875, 10.18505859375, 10.744384765625, 11.3037109375, 11.863037109375, 12.42236328125, 12.981689453125, 13.541015625, 14.100341796875, 14.65966796875, 15.218994140625, 15.7783203125, 16.337646484375, 16.89697265625, 17.456298828125, 18.015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 17.0, 18.0, 28.0, 46.0, 84.0, 119.0, 183.0, 305.0, 483.0, 757.0, 1301.0, 2020.0, 3259.0, 5061.0, 8079.0, 12318.0, 18776.0, 27914.0, 39742.0, 55232.0, 71225.0, 88326.0, 101776.0, 108186.0, 106336.0, 96791.0, 81818.0, 65911.0, 48388.0, 34845.0, 23994.0, 16271.0, 10543.0, 6730.0, 4432.0, 2793.0, 1672.0, 1050.0, 706.0, 400.0, 247.0, 134.0, 74.0, 64.0, 38.0, 19.0, 17.0, 8.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.6656494140625, -10.307861328125, -9.9500732421875, -9.59228515625, -9.2344970703125, -8.876708984375, -8.5189208984375, -8.1611328125, -7.8033447265625, -7.445556640625, -7.0877685546875, -6.72998046875, -6.3721923828125, -6.014404296875, -5.6566162109375, -5.298828125, -4.9410400390625, -4.583251953125, -4.2254638671875, -3.86767578125, -3.5098876953125, -3.152099609375, -2.7943115234375, -2.4365234375, -2.0787353515625, -1.720947265625, -1.3631591796875, -1.00537109375, -0.6475830078125, -0.289794921875, 0.0679931640625, 0.42578125, 0.7835693359375, 1.141357421875, 1.4991455078125, 1.85693359375, 2.2147216796875, 2.572509765625, 2.9302978515625, 3.2880859375, 3.6458740234375, 4.003662109375, 4.3614501953125, 4.71923828125, 5.0770263671875, 5.434814453125, 5.7926025390625, 6.150390625, 6.5081787109375, 6.865966796875, 7.2237548828125, 7.58154296875, 7.9393310546875, 8.297119140625, 8.6549072265625, 9.0126953125, 9.3704833984375, 9.728271484375, 10.0860595703125, 10.44384765625, 10.8016357421875, 11.159423828125, 11.5172119140625, 11.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 9.0, 13.0, 5.0, 11.0, 14.0, 15.0, 14.0, 15.0, 17.0, 28.0, 36.0, 20.0, 34.0, 46.0, 48.0, 32.0, 52.0, 40.0, 46.0, 32.0, 50.0, 36.0, 46.0, 34.0, 37.0, 36.0, 37.0, 27.0, 21.0, 20.0, 22.0, 15.0, 12.0, 14.0, 17.0, 12.0, 4.0, 9.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1280517578125, -10.763916015625, -10.3997802734375, -10.03564453125, -9.6715087890625, -9.307373046875, -8.9432373046875, -8.5791015625, -8.2149658203125, -7.850830078125, -7.4866943359375, -7.12255859375, -6.7584228515625, -6.394287109375, -6.0301513671875, -5.666015625, -5.3018798828125, -4.937744140625, -4.5736083984375, -4.20947265625, -3.8453369140625, -3.481201171875, -3.1170654296875, -2.7529296875, -2.3887939453125, -2.024658203125, -1.6605224609375, -1.29638671875, -0.9322509765625, -0.568115234375, -0.2039794921875, 0.16015625, 0.5242919921875, 0.888427734375, 1.2525634765625, 1.61669921875, 1.9808349609375, 2.344970703125, 2.7091064453125, 3.0732421875, 3.4373779296875, 3.801513671875, 4.1656494140625, 4.52978515625, 4.8939208984375, 5.258056640625, 5.6221923828125, 5.986328125, 6.3504638671875, 6.714599609375, 7.0787353515625, 7.44287109375, 7.8070068359375, 8.171142578125, 8.5352783203125, 8.8994140625, 9.2635498046875, 9.627685546875, 9.9918212890625, 10.35595703125, 10.7200927734375, 11.084228515625, 11.4483642578125, 11.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 12.0, 8.0, 15.0, 15.0, 21.0, 39.0, 71.0, 100.0, 181.0, 245.0, 456.0, 651.0, 1122.0, 1905.0, 3098.0, 5236.0, 8348.0, 14203.0, 23137.0, 37859.0, 58725.0, 85977.0, 114871.0, 135375.0, 139338.0, 125610.0, 99753.0, 71130.0, 46994.0, 29229.0, 17724.0, 10679.0, 6405.0, 3939.0, 2355.0, 1406.0, 873.0, 567.0, 337.0, 220.0, 137.0, 69.0, 53.0, 31.0, 15.0, 13.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.97357177734375, -4.8143310546875, -4.65509033203125, -4.495849609375, -4.33660888671875, -4.1773681640625, -4.01812744140625, -3.85888671875, -3.69964599609375, -3.5404052734375, -3.38116455078125, -3.221923828125, -3.06268310546875, -2.9034423828125, -2.74420166015625, -2.5849609375, -2.42572021484375, -2.2664794921875, -2.10723876953125, -1.947998046875, -1.78875732421875, -1.6295166015625, -1.47027587890625, -1.31103515625, -1.15179443359375, -0.9925537109375, -0.83331298828125, -0.674072265625, -0.51483154296875, -0.3555908203125, -0.19635009765625, -0.037109375, 0.12213134765625, 0.2813720703125, 0.44061279296875, 0.599853515625, 0.75909423828125, 0.9183349609375, 1.07757568359375, 1.23681640625, 1.39605712890625, 1.5552978515625, 1.71453857421875, 1.873779296875, 2.03302001953125, 2.1922607421875, 2.35150146484375, 2.5107421875, 2.66998291015625, 2.8292236328125, 2.98846435546875, 3.147705078125, 3.30694580078125, 3.4661865234375, 3.62542724609375, 3.78466796875, 3.94390869140625, 4.1031494140625, 4.26239013671875, 4.421630859375, 4.58087158203125, 4.7401123046875, 4.89935302734375, 5.05859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 6.0, 15.0, 17.0, 14.0, 14.0, 32.0, 33.0, 29.0, 33.0, 32.0, 37.0, 48.0, 50.0, 71.0, 40.0, 46.0, 55.0, 53.0, 56.0, 45.0, 42.0, 36.0, 27.0, 32.0, 25.0, 17.0, 16.0, 15.0, 14.0, 11.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000614166259765625, -0.0005970895290374756, -0.0005800127983093262, -0.0005629360675811768, -0.0005458593368530273, -0.0005287826061248779, -0.0005117058753967285, -0.0004946291446685791, -0.0004775524139404297, -0.0004604756832122803, -0.00044339895248413086, -0.00042632222175598145, -0.00040924549102783203, -0.0003921687602996826, -0.0003750920295715332, -0.0003580152988433838, -0.0003409385681152344, -0.00032386183738708496, -0.00030678510665893555, -0.00028970837593078613, -0.0002726316452026367, -0.0002555549144744873, -0.0002384781837463379, -0.00022140145301818848, -0.00020432472229003906, -0.00018724799156188965, -0.00017017126083374023, -0.00015309453010559082, -0.0001360177993774414, -0.00011894106864929199, -0.00010186433792114258, -8.478760719299316e-05, -6.771087646484375e-05, -5.0634145736694336e-05, -3.355741500854492e-05, -1.6480684280395508e-05, 5.960464477539062e-07, 1.767277717590332e-05, 3.4749507904052734e-05, 5.182623863220215e-05, 6.890296936035156e-05, 8.597970008850098e-05, 0.00010305643081665039, 0.0001201331615447998, 0.00013720989227294922, 0.00015428662300109863, 0.00017136335372924805, 0.00018844008445739746, 0.00020551681518554688, 0.0002225935459136963, 0.0002396702766418457, 0.0002567470073699951, 0.00027382373809814453, 0.00029090046882629395, 0.00030797719955444336, 0.0003250539302825928, 0.0003421306610107422, 0.0003592073917388916, 0.000376284122467041, 0.00039336085319519043, 0.00041043758392333984, 0.00042751431465148926, 0.00044459104537963867, 0.0004616677761077881, 0.0004787445068359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 11.0, 20.0, 24.0, 37.0, 52.0, 92.0, 119.0, 168.0, 259.0, 379.0, 569.0, 868.0, 1260.0, 1901.0, 2976.0, 4717.0, 7334.0, 11498.0, 17746.0, 27259.0, 40781.0, 59544.0, 81876.0, 105063.0, 121662.0, 125908.0, 116185.0, 96307.0, 72984.0, 51461.0, 34769.0, 22899.0, 14741.0, 9496.0, 6150.0, 3877.0, 2466.0, 1728.0, 1065.0, 745.0, 553.0, 317.0, 240.0, 138.0, 95.0, 80.0, 45.0, 34.0, 12.0, 22.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.84375, -4.69378662109375, -4.5438232421875, -4.39385986328125, -4.243896484375, -4.09393310546875, -3.9439697265625, -3.79400634765625, -3.64404296875, -3.49407958984375, -3.3441162109375, -3.19415283203125, -3.044189453125, -2.89422607421875, -2.7442626953125, -2.59429931640625, -2.4443359375, -2.29437255859375, -2.1444091796875, -1.99444580078125, -1.844482421875, -1.69451904296875, -1.5445556640625, -1.39459228515625, -1.24462890625, -1.09466552734375, -0.9447021484375, -0.79473876953125, -0.644775390625, -0.49481201171875, -0.3448486328125, -0.19488525390625, -0.044921875, 0.10504150390625, 0.2550048828125, 0.40496826171875, 0.554931640625, 0.70489501953125, 0.8548583984375, 1.00482177734375, 1.15478515625, 1.30474853515625, 1.4547119140625, 1.60467529296875, 1.754638671875, 1.90460205078125, 2.0545654296875, 2.20452880859375, 2.3544921875, 2.50445556640625, 2.6544189453125, 2.80438232421875, 2.954345703125, 3.10430908203125, 3.2542724609375, 3.40423583984375, 3.55419921875, 3.70416259765625, 3.8541259765625, 4.00408935546875, 4.154052734375, 4.30401611328125, 4.4539794921875, 4.60394287109375, 4.75390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 9.0, 7.0, 7.0, 11.0, 15.0, 17.0, 12.0, 21.0, 20.0, 34.0, 31.0, 28.0, 43.0, 49.0, 53.0, 52.0, 41.0, 69.0, 46.0, 59.0, 43.0, 53.0, 41.0, 32.0, 29.0, 20.0, 21.0, 21.0, 20.0, 12.0, 14.0, 14.0, 5.0, 12.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.310546875, -2.2391357421875, -2.167724609375, -2.0963134765625, -2.02490234375, -1.9534912109375, -1.882080078125, -1.8106689453125, -1.7392578125, -1.6678466796875, -1.596435546875, -1.5250244140625, -1.45361328125, -1.3822021484375, -1.310791015625, -1.2393798828125, -1.16796875, -1.0965576171875, -1.025146484375, -0.9537353515625, -0.88232421875, -0.8109130859375, -0.739501953125, -0.6680908203125, -0.5966796875, -0.5252685546875, -0.453857421875, -0.3824462890625, -0.31103515625, -0.2396240234375, -0.168212890625, -0.0968017578125, -0.025390625, 0.0460205078125, 0.117431640625, 0.1888427734375, 0.26025390625, 0.3316650390625, 0.403076171875, 0.4744873046875, 0.5458984375, 0.6173095703125, 0.688720703125, 0.7601318359375, 0.83154296875, 0.9029541015625, 0.974365234375, 1.0457763671875, 1.1171875, 1.1885986328125, 1.260009765625, 1.3314208984375, 1.40283203125, 1.4742431640625, 1.545654296875, 1.6170654296875, 1.6884765625, 1.7598876953125, 1.831298828125, 1.9027099609375, 1.97412109375, 2.0455322265625, 2.116943359375, 2.1883544921875, 2.259765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 16.0, 22.0, 22.0, 32.0, 32.0, 34.0, 43.0, 41.0, 37.0, 48.0, 49.0, 44.0, 48.0, 38.0, 42.0, 45.0, 40.0, 38.0, 44.0, 31.0, 29.0, 20.0, 26.0, 25.0, 21.0, 13.0, 8.0, 17.0, 5.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.452465057373047, -13.994357109069824, -13.536249160766602, -13.078141212463379, -12.620033264160156, -12.16192626953125, -11.703817367553711, -11.245710372924805, -10.787602424621582, -10.32949447631836, -9.871386528015137, -9.413278579711914, -8.955170631408691, -8.497062683105469, -8.038955688476562, -7.58084774017334, -7.122739315032959, -6.664631366729736, -6.206523418426514, -5.748415946960449, -5.290307998657227, -4.832200050354004, -4.374092102050781, -3.9159843921661377, -3.457876443862915, -2.9997684955596924, -2.541660785675049, -2.083552837371826, -1.625445008277893, -1.16733717918396, -0.7092292308807373, -0.25112152099609375, 0.2069864273071289, 0.665094256401062, 1.1232020854949951, 1.5813100337982178, 2.0394177436828613, 2.497525691986084, 2.9556336402893066, 3.41374135017395, 3.871849298477173, 4.329957008361816, 4.788064956665039, 5.246172904968262, 5.704280853271484, 6.162388801574707, 6.62049674987793, 7.078604221343994, 7.536712169647217, 7.9948201179504395, 8.452927589416504, 8.911035537719727, 9.36914348602295, 9.827251434326172, 10.285359382629395, 10.743467330932617, 11.20157527923584, 11.659683227539062, 12.117791175842285, 12.575899124145508, 13.03400707244873, 13.492115020751953, 13.95022201538086, 14.408329963684082, 14.866437911987305]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 3.0, 2.0, 6.0, 18.0, 14.0, 11.0, 10.0, 17.0, 9.0, 18.0, 20.0, 22.0, 29.0, 25.0, 31.0, 31.0, 39.0, 26.0, 37.0, 33.0, 30.0, 34.0, 42.0, 40.0, 25.0, 41.0, 26.0, 26.0, 36.0, 28.0, 34.0, 32.0, 24.0, 24.0, 22.0, 24.0, 14.0, 16.0, 14.0, 11.0, 8.0, 13.0, 10.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-16.794418334960938, -16.277511596679688, -15.76060676574707, -15.24370002746582, -14.726794242858887, -14.209888458251953, -13.69298267364502, -13.176076889038086, -12.659170150756836, -12.142264366149902, -11.625358581542969, -11.108451843261719, -10.591546058654785, -10.074640274047852, -9.557734489440918, -9.040828704833984, -8.52392292022705, -8.007017135620117, -7.490110874176025, -6.973205089569092, -6.456298828125, -5.939393043518066, -5.422487258911133, -4.905581474304199, -4.388675212860107, -3.8717691898345947, -3.354863166809082, -2.8379573822021484, -2.3210513591766357, -1.804145336151123, -1.2872395515441895, -0.7703335285186768, -0.25342750549316406, 0.26347845792770386, 0.7803844213485718, 1.297290325164795, 1.8141963481903076, 2.3311023712158203, 2.848008155822754, 3.3649141788482666, 3.8818202018737793, 4.398725986480713, 4.915632247924805, 5.432538032531738, 5.949443817138672, 6.466350078582764, 6.983255863189697, 7.500162124633789, 8.017067909240723, 8.533973693847656, 9.05087947845459, 9.567785263061523, 10.084692001342773, 10.601597785949707, 11.11850357055664, 11.635409355163574, 12.152315139770508, 12.669220924377441, 13.186126708984375, 13.703033447265625, 14.219939231872559, 14.736845016479492, 15.253750801086426, 15.77065658569336, 16.28756332397461]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 14.0, 24.0, 42.0, 80.0, 124.0, 176.0, 290.0, 468.0, 749.0, 1097.0, 1750.0, 2652.0, 4207.0, 6729.0, 10363.0, 16080.0, 25173.0, 38260.0, 58031.0, 87264.0, 126985.0, 180052.0, 243232.0, 316650.0, 382017.0, 429160.0, 441813.0, 419845.0, 365774.0, 298043.0, 227373.0, 165489.0, 115934.0, 79223.0, 52307.0, 34352.0, 22447.0, 14536.0, 9164.0, 6043.0, 3730.0, 2403.0, 1540.0, 953.0, 614.0, 381.0, 229.0, 151.0, 110.0, 49.0, 39.0, 20.0, 23.0, 11.0, 6.0, 6.0, 2.0], "bins": [-10.3984375, -10.0867919921875, -9.775146484375, -9.4635009765625, -9.15185546875, -8.8402099609375, -8.528564453125, -8.2169189453125, -7.9052734375, -7.5936279296875, -7.281982421875, -6.9703369140625, -6.65869140625, -6.3470458984375, -6.035400390625, -5.7237548828125, -5.412109375, -5.1004638671875, -4.788818359375, -4.4771728515625, -4.16552734375, -3.8538818359375, -3.542236328125, -3.2305908203125, -2.9189453125, -2.6072998046875, -2.295654296875, -1.9840087890625, -1.67236328125, -1.3607177734375, -1.049072265625, -0.7374267578125, -0.42578125, -0.1141357421875, 0.197509765625, 0.5091552734375, 0.82080078125, 1.1324462890625, 1.444091796875, 1.7557373046875, 2.0673828125, 2.3790283203125, 2.690673828125, 3.0023193359375, 3.31396484375, 3.6256103515625, 3.937255859375, 4.2489013671875, 4.560546875, 4.8721923828125, 5.183837890625, 5.4954833984375, 5.80712890625, 6.1187744140625, 6.430419921875, 6.7420654296875, 7.0537109375, 7.3653564453125, 7.677001953125, 7.9886474609375, 8.30029296875, 8.6119384765625, 8.923583984375, 9.2352294921875, 9.546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 13.0, 5.0, 12.0, 14.0, 14.0, 13.0, 23.0, 20.0, 26.0, 32.0, 37.0, 40.0, 24.0, 40.0, 44.0, 38.0, 38.0, 40.0, 42.0, 40.0, 39.0, 27.0, 29.0, 50.0, 36.0, 30.0, 29.0, 21.0, 29.0, 26.0, 21.0, 25.0, 10.0, 15.0, 11.0, 4.0, 8.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.55029296875, -13.1005859375, -12.65087890625, -12.201171875, -11.75146484375, -11.3017578125, -10.85205078125, -10.40234375, -9.95263671875, -9.5029296875, -9.05322265625, -8.603515625, -8.15380859375, -7.7041015625, -7.25439453125, -6.8046875, -6.35498046875, -5.9052734375, -5.45556640625, -5.005859375, -4.55615234375, -4.1064453125, -3.65673828125, -3.20703125, -2.75732421875, -2.3076171875, -1.85791015625, -1.408203125, -0.95849609375, -0.5087890625, -0.05908203125, 0.390625, 0.84033203125, 1.2900390625, 1.73974609375, 2.189453125, 2.63916015625, 3.0888671875, 3.53857421875, 3.98828125, 4.43798828125, 4.8876953125, 5.33740234375, 5.787109375, 6.23681640625, 6.6865234375, 7.13623046875, 7.5859375, 8.03564453125, 8.4853515625, 8.93505859375, 9.384765625, 9.83447265625, 10.2841796875, 10.73388671875, 11.18359375, 11.63330078125, 12.0830078125, 12.53271484375, 12.982421875, 13.43212890625, 13.8818359375, 14.33154296875, 14.78125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 13.0, 12.0, 31.0, 28.0, 64.0, 94.0, 158.0, 310.0, 478.0, 732.0, 1221.0, 1976.0, 3153.0, 4968.0, 7983.0, 12599.0, 19555.0, 30006.0, 45333.0, 67045.0, 96038.0, 134593.0, 180966.0, 233373.0, 289246.0, 339823.0, 374938.0, 390599.0, 381863.0, 352201.0, 305466.0, 250994.0, 196589.0, 146640.0, 105599.0, 74493.0, 50804.0, 33817.0, 21954.0, 14238.0, 9067.0, 5820.0, 3571.0, 2158.0, 1415.0, 875.0, 587.0, 329.0, 197.0, 108.0, 77.0, 28.0, 41.0, 12.0, 10.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.7969970703125, -8.500244140625, -8.2034912109375, -7.90673828125, -7.6099853515625, -7.313232421875, -7.0164794921875, -6.7197265625, -6.4229736328125, -6.126220703125, -5.8294677734375, -5.53271484375, -5.2359619140625, -4.939208984375, -4.6424560546875, -4.345703125, -4.0489501953125, -3.752197265625, -3.4554443359375, -3.15869140625, -2.8619384765625, -2.565185546875, -2.2684326171875, -1.9716796875, -1.6749267578125, -1.378173828125, -1.0814208984375, -0.78466796875, -0.4879150390625, -0.191162109375, 0.1055908203125, 0.40234375, 0.6990966796875, 0.995849609375, 1.2926025390625, 1.58935546875, 1.8861083984375, 2.182861328125, 2.4796142578125, 2.7763671875, 3.0731201171875, 3.369873046875, 3.6666259765625, 3.96337890625, 4.2601318359375, 4.556884765625, 4.8536376953125, 5.150390625, 5.4471435546875, 5.743896484375, 6.0406494140625, 6.33740234375, 6.6341552734375, 6.930908203125, 7.2276611328125, 7.5244140625, 7.8211669921875, 8.117919921875, 8.4146728515625, 8.71142578125, 9.0081787109375, 9.304931640625, 9.6016845703125, 9.8984375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 3.0, 4.0, 12.0, 8.0, 9.0, 19.0, 16.0, 27.0, 33.0, 43.0, 60.0, 60.0, 61.0, 85.0, 114.0, 118.0, 139.0, 163.0, 175.0, 169.0, 162.0, 185.0, 203.0, 195.0, 214.0, 203.0, 187.0, 194.0, 165.0, 173.0, 139.0, 127.0, 98.0, 97.0, 65.0, 61.0, 61.0, 37.0, 36.0, 29.0, 28.0, 25.0, 16.0, 17.0, 3.0, 11.0, 3.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.8359375, -5.644775390625, -5.45361328125, -5.262451171875, -5.0712890625, -4.880126953125, -4.68896484375, -4.497802734375, -4.306640625, -4.115478515625, -3.92431640625, -3.733154296875, -3.5419921875, -3.350830078125, -3.15966796875, -2.968505859375, -2.77734375, -2.586181640625, -2.39501953125, -2.203857421875, -2.0126953125, -1.821533203125, -1.63037109375, -1.439208984375, -1.248046875, -1.056884765625, -0.86572265625, -0.674560546875, -0.4833984375, -0.292236328125, -0.10107421875, 0.090087890625, 0.28125, 0.472412109375, 0.66357421875, 0.854736328125, 1.0458984375, 1.237060546875, 1.42822265625, 1.619384765625, 1.810546875, 2.001708984375, 2.19287109375, 2.384033203125, 2.5751953125, 2.766357421875, 2.95751953125, 3.148681640625, 3.33984375, 3.531005859375, 3.72216796875, 3.913330078125, 4.1044921875, 4.295654296875, 4.48681640625, 4.677978515625, 4.869140625, 5.060302734375, 5.25146484375, 5.442626953125, 5.6337890625, 5.824951171875, 6.01611328125, 6.207275390625, 6.3984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 9.0, 4.0, 3.0, 5.0, 15.0, 9.0, 11.0, 9.0, 16.0, 13.0, 19.0, 22.0, 30.0, 20.0, 34.0, 30.0, 34.0, 38.0, 35.0, 35.0, 47.0, 52.0, 50.0, 41.0, 44.0, 34.0, 31.0, 25.0, 34.0, 33.0, 26.0, 28.0, 22.0, 21.0, 16.0, 24.0, 20.0, 6.0, 9.0, 5.0, 7.0, 11.0, 9.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.84615707397461, -12.451104164123535, -12.056050300598145, -11.66099739074707, -11.265944480895996, -10.870891571044922, -10.475837707519531, -10.080784797668457, -9.685731887817383, -9.290678977966309, -8.895625114440918, -8.500572204589844, -8.10551929473877, -7.710465908050537, -7.315412521362305, -6.9203596115112305, -6.525306224822998, -6.130252838134766, -5.735199928283691, -5.340146541595459, -4.945093631744385, -4.550040245056152, -4.154987335205078, -3.7599339485168457, -3.3648808002471924, -2.969827651977539, -2.5747745037078857, -2.1797213554382324, -1.7846680879592896, -1.3896149396896362, -0.9945616722106934, -0.59950852394104, -0.20445537567138672, 0.190597802400589, 0.5856509804725647, 0.9807041883468628, 1.3757573366165161, 1.7708104848861694, 2.1658637523651123, 2.5609169006347656, 2.955970048904419, 3.3510231971740723, 3.7460763454437256, 4.141129493713379, 4.536182880401611, 4.9312357902526855, 5.326289176940918, 5.721342086791992, 6.116395473480225, 6.511448860168457, 6.906501770019531, 7.301555156707764, 7.696608066558838, 8.09166145324707, 8.486714363098145, 8.881767272949219, 9.27682113647461, 9.671874046325684, 10.066927909851074, 10.461980819702148, 10.857033729553223, 11.252086639404297, 11.647140502929688, 12.042193412780762, 12.437246322631836]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 13.0, 16.0, 12.0, 13.0, 16.0, 16.0, 31.0, 23.0, 23.0, 30.0, 28.0, 33.0, 26.0, 35.0, 30.0, 43.0, 29.0, 43.0, 29.0, 42.0, 53.0, 37.0, 32.0, 37.0, 27.0, 42.0, 31.0, 31.0, 23.0, 27.0, 20.0, 17.0, 13.0, 7.0, 11.0, 10.0, 5.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-17.186349868774414, -16.683250427246094, -16.18014907836914, -15.677048683166504, -15.173948287963867, -14.670848846435547, -14.16774845123291, -13.664648056030273, -13.161547660827637, -12.658447265625, -12.155346870422363, -11.652246475219727, -11.149147033691406, -10.646045684814453, -10.142946243286133, -9.639845848083496, -9.13674545288086, -8.633645057678223, -8.130544662475586, -7.627444744110107, -7.124344348907471, -6.621243953704834, -6.1181440353393555, -5.615043640136719, -5.111943244934082, -4.608842849731445, -4.105742454528809, -3.60264253616333, -3.0995421409606934, -2.5964417457580566, -2.093341588973999, -1.5902414321899414, -1.087141990661621, -0.5840417146682739, -0.08094143867492676, 0.4221588373184204, 0.9252591133117676, 1.4283595085144043, 1.931459665298462, 2.4345598220825195, 2.9376602172851562, 3.440760612487793, 3.9438607692718506, 4.446960926055908, 4.950061321258545, 5.453161716461182, 5.95626163482666, 6.459362030029297, 6.962462425231934, 7.46556282043457, 7.968663215637207, 8.471763610839844, 8.974863052368164, 9.477964401245117, 9.981063842773438, 10.484164237976074, 10.987264633178711, 11.490365028381348, 11.993465423583984, 12.496565818786621, 12.999666213989258, 13.502765655517578, 14.005866050720215, 14.508966445922852, 15.012066841125488]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 12.0, 5.0, 15.0, 26.0, 37.0, 63.0, 89.0, 143.0, 208.0, 304.0, 441.0, 692.0, 1064.0, 1641.0, 2650.0, 4343.0, 7337.0, 11749.0, 19842.0, 31971.0, 51652.0, 79987.0, 116094.0, 147821.0, 157367.0, 136255.0, 100885.0, 66782.0, 42158.0, 25957.0, 15764.0, 9534.0, 5848.0, 3609.0, 2161.0, 1438.0, 920.0, 595.0, 357.0, 217.0, 177.0, 108.0, 84.0, 50.0, 36.0, 11.0, 21.0, 16.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.521484375, -3.40521240234375, -3.2889404296875, -3.17266845703125, -3.056396484375, -2.94012451171875, -2.8238525390625, -2.70758056640625, -2.59130859375, -2.47503662109375, -2.3587646484375, -2.24249267578125, -2.126220703125, -2.00994873046875, -1.8936767578125, -1.77740478515625, -1.6611328125, -1.54486083984375, -1.4285888671875, -1.31231689453125, -1.196044921875, -1.07977294921875, -0.9635009765625, -0.84722900390625, -0.73095703125, -0.61468505859375, -0.4984130859375, -0.38214111328125, -0.265869140625, -0.14959716796875, -0.0333251953125, 0.08294677734375, 0.19921875, 0.31549072265625, 0.4317626953125, 0.54803466796875, 0.664306640625, 0.78057861328125, 0.8968505859375, 1.01312255859375, 1.12939453125, 1.24566650390625, 1.3619384765625, 1.47821044921875, 1.594482421875, 1.71075439453125, 1.8270263671875, 1.94329833984375, 2.0595703125, 2.17584228515625, 2.2921142578125, 2.40838623046875, 2.524658203125, 2.64093017578125, 2.7572021484375, 2.87347412109375, 2.98974609375, 3.10601806640625, 3.2222900390625, 3.33856201171875, 3.454833984375, 3.57110595703125, 3.6873779296875, 3.80364990234375, 3.919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 10.0, 10.0, 12.0, 15.0, 15.0, 13.0, 17.0, 33.0, 20.0, 33.0, 23.0, 32.0, 19.0, 28.0, 43.0, 37.0, 40.0, 43.0, 40.0, 30.0, 48.0, 30.0, 46.0, 38.0, 39.0, 41.0, 32.0, 23.0, 26.0, 24.0, 23.0, 21.0, 13.0, 13.0, 8.0, 11.0, 11.0, 4.0, 3.0, 4.0, 6.0, 6.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-18.125, -17.6064453125, -17.087890625, -16.5693359375, -16.05078125, -15.5322265625, -15.013671875, -14.4951171875, -13.9765625, -13.4580078125, -12.939453125, -12.4208984375, -11.90234375, -11.3837890625, -10.865234375, -10.3466796875, -9.828125, -9.3095703125, -8.791015625, -8.2724609375, -7.75390625, -7.2353515625, -6.716796875, -6.1982421875, -5.6796875, -5.1611328125, -4.642578125, -4.1240234375, -3.60546875, -3.0869140625, -2.568359375, -2.0498046875, -1.53125, -1.0126953125, -0.494140625, 0.0244140625, 0.54296875, 1.0615234375, 1.580078125, 2.0986328125, 2.6171875, 3.1357421875, 3.654296875, 4.1728515625, 4.69140625, 5.2099609375, 5.728515625, 6.2470703125, 6.765625, 7.2841796875, 7.802734375, 8.3212890625, 8.83984375, 9.3583984375, 9.876953125, 10.3955078125, 10.9140625, 11.4326171875, 11.951171875, 12.4697265625, 12.98828125, 13.5068359375, 14.025390625, 14.5439453125, 15.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 19.0, 18.0, 24.0, 40.0, 47.0, 80.0, 127.0, 191.0, 325.0, 495.0, 700.0, 1195.0, 2094.0, 3530.0, 6003.0, 10478.0, 18120.0, 30524.0, 50064.0, 80062.0, 115990.0, 148920.0, 160095.0, 140215.0, 104448.0, 69567.0, 43177.0, 25230.0, 15115.0, 8728.0, 5226.0, 2900.0, 1819.0, 1096.0, 656.0, 421.0, 269.0, 164.0, 129.0, 71.0, 56.0, 33.0, 23.0, 12.0, 11.0, 7.0, 7.0, 8.0, 2.0, 2.0, 5.0, 2.0], "bins": [-3.150390625, -3.05865478515625, -2.9669189453125, -2.87518310546875, -2.783447265625, -2.69171142578125, -2.5999755859375, -2.50823974609375, -2.41650390625, -2.32476806640625, -2.2330322265625, -2.14129638671875, -2.049560546875, -1.95782470703125, -1.8660888671875, -1.77435302734375, -1.6826171875, -1.59088134765625, -1.4991455078125, -1.40740966796875, -1.315673828125, -1.22393798828125, -1.1322021484375, -1.04046630859375, -0.94873046875, -0.85699462890625, -0.7652587890625, -0.67352294921875, -0.581787109375, -0.49005126953125, -0.3983154296875, -0.30657958984375, -0.21484375, -0.12310791015625, -0.0313720703125, 0.06036376953125, 0.152099609375, 0.24383544921875, 0.3355712890625, 0.42730712890625, 0.51904296875, 0.61077880859375, 0.7025146484375, 0.79425048828125, 0.885986328125, 0.97772216796875, 1.0694580078125, 1.16119384765625, 1.2529296875, 1.34466552734375, 1.4364013671875, 1.52813720703125, 1.619873046875, 1.71160888671875, 1.8033447265625, 1.89508056640625, 1.98681640625, 2.07855224609375, 2.1702880859375, 2.26202392578125, 2.353759765625, 2.44549560546875, 2.5372314453125, 2.62896728515625, 2.720703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 12.0, 7.0, 6.0, 13.0, 8.0, 10.0, 14.0, 15.0, 19.0, 14.0, 14.0, 16.0, 27.0, 24.0, 28.0, 27.0, 35.0, 32.0, 42.0, 38.0, 41.0, 37.0, 37.0, 34.0, 33.0, 45.0, 35.0, 20.0, 31.0, 29.0, 38.0, 20.0, 27.0, 21.0, 25.0, 14.0, 16.0, 13.0, 14.0, 15.0, 7.0, 12.0, 7.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.796875, -10.459228515625, -10.12158203125, -9.783935546875, -9.4462890625, -9.108642578125, -8.77099609375, -8.433349609375, -8.095703125, -7.758056640625, -7.42041015625, -7.082763671875, -6.7451171875, -6.407470703125, -6.06982421875, -5.732177734375, -5.39453125, -5.056884765625, -4.71923828125, -4.381591796875, -4.0439453125, -3.706298828125, -3.36865234375, -3.031005859375, -2.693359375, -2.355712890625, -2.01806640625, -1.680419921875, -1.3427734375, -1.005126953125, -0.66748046875, -0.329833984375, 0.0078125, 0.345458984375, 0.68310546875, 1.020751953125, 1.3583984375, 1.696044921875, 2.03369140625, 2.371337890625, 2.708984375, 3.046630859375, 3.38427734375, 3.721923828125, 4.0595703125, 4.397216796875, 4.73486328125, 5.072509765625, 5.41015625, 5.747802734375, 6.08544921875, 6.423095703125, 6.7607421875, 7.098388671875, 7.43603515625, 7.773681640625, 8.111328125, 8.448974609375, 8.78662109375, 9.124267578125, 9.4619140625, 9.799560546875, 10.13720703125, 10.474853515625, 10.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 1.0, 5.0, 6.0, 4.0, 17.0, 16.0, 28.0, 38.0, 51.0, 79.0, 117.0, 163.0, 197.0, 287.0, 430.0, 624.0, 917.0, 1387.0, 2215.0, 3540.0, 6392.0, 11509.0, 22195.0, 45177.0, 97124.0, 190961.0, 267997.0, 197197.0, 100302.0, 47363.0, 23130.0, 11793.0, 6341.0, 3856.0, 2379.0, 1566.0, 987.0, 664.0, 467.0, 323.0, 217.0, 148.0, 98.0, 72.0, 56.0, 36.0, 25.0, 21.0, 15.0, 11.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7548828125, -0.7293167114257812, -0.7037506103515625, -0.6781845092773438, -0.652618408203125, -0.6270523071289062, -0.6014862060546875, -0.5759201049804688, -0.55035400390625, -0.5247879028320312, -0.4992218017578125, -0.47365570068359375, -0.448089599609375, -0.42252349853515625, -0.3969573974609375, -0.37139129638671875, -0.3458251953125, -0.32025909423828125, -0.2946929931640625, -0.26912689208984375, -0.243560791015625, -0.21799468994140625, -0.1924285888671875, -0.16686248779296875, -0.14129638671875, -0.11573028564453125, -0.0901641845703125, -0.06459808349609375, -0.039031982421875, -0.01346588134765625, 0.0121002197265625, 0.03766632080078125, 0.063232421875, 0.08879852294921875, 0.1143646240234375, 0.13993072509765625, 0.165496826171875, 0.19106292724609375, 0.2166290283203125, 0.24219512939453125, 0.26776123046875, 0.29332733154296875, 0.3188934326171875, 0.34445953369140625, 0.370025634765625, 0.39559173583984375, 0.4211578369140625, 0.44672393798828125, 0.4722900390625, 0.49785614013671875, 0.5234222412109375, 0.5489883422851562, 0.574554443359375, 0.6001205444335938, 0.6256866455078125, 0.6512527465820312, 0.67681884765625, 0.7023849487304688, 0.7279510498046875, 0.7535171508789062, 0.779083251953125, 0.8046493530273438, 0.8302154541015625, 0.8557815551757812, 0.88134765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 10.0, 8.0, 14.0, 14.0, 32.0, 35.0, 46.0, 54.0, 79.0, 84.0, 119.0, 123.0, 96.0, 72.0, 49.0, 52.0, 35.0, 24.0, 13.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021159648895263672, -0.0002056807279586792, -0.00019976496696472168, -0.00019384920597076416, -0.00018793344497680664, -0.00018201768398284912, -0.0001761019229888916, -0.00017018616199493408, -0.00016427040100097656, -0.00015835464000701904, -0.00015243887901306152, -0.000146523118019104, -0.00014060735702514648, -0.00013469159603118896, -0.00012877583503723145, -0.00012286007404327393, -0.0001169443130493164, -0.00011102855205535889, -0.00010511279106140137, -9.919703006744385e-05, -9.328126907348633e-05, -8.736550807952881e-05, -8.144974708557129e-05, -7.553398609161377e-05, -6.961822509765625e-05, -6.370246410369873e-05, -5.778670310974121e-05, -5.187094211578369e-05, -4.595518112182617e-05, -4.003942012786865e-05, -3.412365913391113e-05, -2.8207898139953613e-05, -2.2292137145996094e-05, -1.6376376152038574e-05, -1.0460615158081055e-05, -4.544854164123535e-06, 1.3709068298339844e-06, 7.286667823791504e-06, 1.3202428817749023e-05, 1.9118189811706543e-05, 2.5033950805664062e-05, 3.094971179962158e-05, 3.68654727935791e-05, 4.278123378753662e-05, 4.869699478149414e-05, 5.461275577545166e-05, 6.052851676940918e-05, 6.64442777633667e-05, 7.236003875732422e-05, 7.827579975128174e-05, 8.419156074523926e-05, 9.010732173919678e-05, 9.60230827331543e-05, 0.00010193884372711182, 0.00010785460472106934, 0.00011377036571502686, 0.00011968612670898438, 0.0001256018877029419, 0.00013151764869689941, 0.00013743340969085693, 0.00014334917068481445, 0.00014926493167877197, 0.0001551806926727295, 0.000161096453666687, 0.00016701221466064453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 11.0, 11.0, 17.0, 30.0, 51.0, 74.0, 121.0, 164.0, 235.0, 360.0, 531.0, 822.0, 1140.0, 1739.0, 2546.0, 3900.0, 6114.0, 9526.0, 15302.0, 25335.0, 41503.0, 69929.0, 113845.0, 165484.0, 186036.0, 150146.0, 98397.0, 60386.0, 35757.0, 21758.0, 13242.0, 8470.0, 5303.0, 3409.0, 2244.0, 1519.0, 944.0, 692.0, 459.0, 317.0, 193.0, 149.0, 122.0, 67.0, 63.0, 25.0, 18.0, 14.0, 10.0, 10.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.110595703125, -1.07275390625, -1.034912109375, -0.9970703125, -0.959228515625, -0.92138671875, -0.883544921875, -0.845703125, -0.807861328125, -0.77001953125, -0.732177734375, -0.6943359375, -0.656494140625, -0.61865234375, -0.580810546875, -0.54296875, -0.505126953125, -0.46728515625, -0.429443359375, -0.3916015625, -0.353759765625, -0.31591796875, -0.278076171875, -0.240234375, -0.202392578125, -0.16455078125, -0.126708984375, -0.0888671875, -0.051025390625, -0.01318359375, 0.024658203125, 0.0625, 0.100341796875, 0.13818359375, 0.176025390625, 0.2138671875, 0.251708984375, 0.28955078125, 0.327392578125, 0.365234375, 0.403076171875, 0.44091796875, 0.478759765625, 0.5166015625, 0.554443359375, 0.59228515625, 0.630126953125, 0.66796875, 0.705810546875, 0.74365234375, 0.781494140625, 0.8193359375, 0.857177734375, 0.89501953125, 0.932861328125, 0.970703125, 1.008544921875, 1.04638671875, 1.084228515625, 1.1220703125, 1.159912109375, 1.19775390625, 1.235595703125, 1.2734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 10.0, 9.0, 19.0, 19.0, 19.0, 15.0, 37.0, 34.0, 43.0, 61.0, 77.0, 80.0, 87.0, 79.0, 72.0, 74.0, 54.0, 39.0, 27.0, 31.0, 26.0, 16.0, 9.0, 11.0, 6.0, 9.0, 3.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.67138671875, -0.6514053344726562, -0.6314239501953125, -0.6114425659179688, -0.591461181640625, -0.5714797973632812, -0.5514984130859375, -0.5315170288085938, -0.51153564453125, -0.49155426025390625, -0.4715728759765625, -0.45159149169921875, -0.431610107421875, -0.41162872314453125, -0.3916473388671875, -0.37166595458984375, -0.3516845703125, -0.33170318603515625, -0.3117218017578125, -0.29174041748046875, -0.271759033203125, -0.25177764892578125, -0.2317962646484375, -0.21181488037109375, -0.19183349609375, -0.17185211181640625, -0.1518707275390625, -0.13188934326171875, -0.111907958984375, -0.09192657470703125, -0.0719451904296875, -0.05196380615234375, -0.031982421875, -0.01200103759765625, 0.0079803466796875, 0.02796173095703125, 0.047943115234375, 0.06792449951171875, 0.0879058837890625, 0.10788726806640625, 0.12786865234375, 0.14785003662109375, 0.1678314208984375, 0.18781280517578125, 0.207794189453125, 0.22777557373046875, 0.2477569580078125, 0.26773834228515625, 0.2877197265625, 0.30770111083984375, 0.3276824951171875, 0.34766387939453125, 0.367645263671875, 0.38762664794921875, 0.4076080322265625, 0.42758941650390625, 0.44757080078125, 0.46755218505859375, 0.4875335693359375, 0.5075149536132812, 0.527496337890625, 0.5474777221679688, 0.5674591064453125, 0.5874404907226562, 0.607421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 1.0, 6.0, 7.0, 11.0, 8.0, 7.0, 17.0, 10.0, 15.0, 13.0, 21.0, 23.0, 23.0, 38.0, 33.0, 25.0, 33.0, 38.0, 36.0, 31.0, 44.0, 53.0, 49.0, 33.0, 40.0, 37.0, 27.0, 31.0, 24.0, 34.0, 21.0, 28.0, 25.0, 23.0, 17.0, 18.0, 13.0, 16.0, 8.0, 9.0, 8.0, 7.0, 9.0, 2.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-12.044129371643066, -11.671682357788086, -11.299235343933105, -10.926788330078125, -10.554340362548828, -10.181893348693848, -9.809446334838867, -9.436999320983887, -9.064552307128906, -8.692105293273926, -8.319658279418945, -7.947210788726807, -7.574763774871826, -7.202316761016846, -6.829869270324707, -6.457422256469727, -6.084975242614746, -5.712528228759766, -5.340081214904785, -4.9676337242126465, -4.595186710357666, -4.2227396965026855, -3.850292444229126, -3.4778451919555664, -3.105398178100586, -2.7329511642456055, -2.360503911972046, -1.9880567789077759, -1.6156096458435059, -1.2431625127792358, -0.8707153797149658, -0.49826812744140625, -0.12582015991210938, 0.24662697315216064, 0.6190741062164307, 0.9915212392807007, 1.3639683723449707, 1.7364155054092407, 2.1088626384735107, 2.4813098907470703, 2.853756904602051, 3.2262039184570312, 3.598651170730591, 3.9710984230041504, 4.343545436859131, 4.715992450714111, 5.08843994140625, 5.4608869552612305, 5.833333969116211, 6.205780982971191, 6.578227996826172, 6.9506754875183105, 7.323122501373291, 7.6955695152282715, 8.06801700592041, 8.44046401977539, 8.812911033630371, 9.185358047485352, 9.557805061340332, 9.930252075195312, 10.30270004272461, 10.67514705657959, 11.04759407043457, 11.42004108428955, 11.792488098144531]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 13.0, 13.0, 12.0, 18.0, 21.0, 29.0, 17.0, 27.0, 30.0, 30.0, 23.0, 38.0, 28.0, 37.0, 41.0, 32.0, 37.0, 30.0, 47.0, 45.0, 45.0, 40.0, 23.0, 31.0, 37.0, 36.0, 27.0, 26.0, 21.0, 18.0, 17.0, 17.0, 7.0, 8.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-17.543622970581055, -17.04429054260254, -16.54495620727539, -16.045623779296875, -15.546290397644043, -15.046957015991211, -14.547623634338379, -14.048290252685547, -13.548956871032715, -13.049623489379883, -12.55029010772705, -12.050956726074219, -11.551624298095703, -11.052290916442871, -10.552957534790039, -10.053624153137207, -9.554290771484375, -9.054957389831543, -8.555624008178711, -8.056291580200195, -7.556957721710205, -7.057624816894531, -6.558291435241699, -6.058958053588867, -5.559625625610352, -5.0602922439575195, -4.560959339141846, -4.061625957489014, -3.5622925758361816, -3.0629594326019287, -2.563626289367676, -2.0642929077148438, -1.5649595260620117, -1.0656262636184692, -0.5662930607795715, -0.06695985794067383, 0.43237340450286865, 0.9317066669464111, 1.431039810180664, 1.930373191833496, 2.429706335067749, 2.929039478302002, 3.428372859954834, 3.927706003189087, 4.42703914642334, 4.926372528076172, 5.425705909729004, 5.925039291381836, 6.42437219619751, 6.923705577850342, 7.423038482666016, 7.922371864318848, 8.42170524597168, 8.921038627624512, 9.420372009277344, 9.91970443725586, 10.419037818908691, 10.918371200561523, 11.417704582214355, 11.917037963867188, 12.416370391845703, 12.915703773498535, 13.415037155151367, 13.9143705368042, 14.413703918457031]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 6.0, 4.0, 10.0, 25.0, 32.0, 40.0, 61.0, 132.0, 194.0, 291.0, 449.0, 721.0, 1078.0, 1830.0, 2759.0, 4234.0, 6572.0, 9517.0, 14558.0, 20712.0, 29396.0, 40324.0, 52433.0, 66152.0, 79647.0, 89528.0, 96201.0, 96259.0, 91389.0, 81311.0, 68577.0, 54538.0, 41806.0, 30714.0, 22050.0, 15056.0, 10260.0, 7025.0, 4433.0, 2978.0, 1948.0, 1228.0, 755.0, 521.0, 282.0, 172.0, 123.0, 80.0, 54.0, 37.0, 20.0, 12.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.3125, -9.0128173828125, -8.713134765625, -8.4134521484375, -8.11376953125, -7.8140869140625, -7.514404296875, -7.2147216796875, -6.9150390625, -6.6153564453125, -6.315673828125, -6.0159912109375, -5.71630859375, -5.4166259765625, -5.116943359375, -4.8172607421875, -4.517578125, -4.2178955078125, -3.918212890625, -3.6185302734375, -3.31884765625, -3.0191650390625, -2.719482421875, -2.4197998046875, -2.1201171875, -1.8204345703125, -1.520751953125, -1.2210693359375, -0.92138671875, -0.6217041015625, -0.322021484375, -0.0223388671875, 0.27734375, 0.5770263671875, 0.876708984375, 1.1763916015625, 1.47607421875, 1.7757568359375, 2.075439453125, 2.3751220703125, 2.6748046875, 2.9744873046875, 3.274169921875, 3.5738525390625, 3.87353515625, 4.1732177734375, 4.472900390625, 4.7725830078125, 5.072265625, 5.3719482421875, 5.671630859375, 5.9713134765625, 6.27099609375, 6.5706787109375, 6.870361328125, 7.1700439453125, 7.4697265625, 7.7694091796875, 8.069091796875, 8.3687744140625, 8.66845703125, 8.9681396484375, 9.267822265625, 9.5675048828125, 9.8671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 12.0, 3.0, 17.0, 13.0, 25.0, 26.0, 21.0, 19.0, 24.0, 20.0, 43.0, 30.0, 29.0, 44.0, 37.0, 33.0, 32.0, 34.0, 42.0, 35.0, 52.0, 37.0, 35.0, 33.0, 37.0, 32.0, 27.0, 25.0, 26.0, 23.0, 24.0, 19.0, 14.0, 13.0, 8.0, 4.0, 8.0, 6.0, 5.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0], "bins": [-18.015625, -17.51513671875, -17.0146484375, -16.51416015625, -16.013671875, -15.51318359375, -15.0126953125, -14.51220703125, -14.01171875, -13.51123046875, -13.0107421875, -12.51025390625, -12.009765625, -11.50927734375, -11.0087890625, -10.50830078125, -10.0078125, -9.50732421875, -9.0068359375, -8.50634765625, -8.005859375, -7.50537109375, -7.0048828125, -6.50439453125, -6.00390625, -5.50341796875, -5.0029296875, -4.50244140625, -4.001953125, -3.50146484375, -3.0009765625, -2.50048828125, -2.0, -1.49951171875, -0.9990234375, -0.49853515625, 0.001953125, 0.50244140625, 1.0029296875, 1.50341796875, 2.00390625, 2.50439453125, 3.0048828125, 3.50537109375, 4.005859375, 4.50634765625, 5.0068359375, 5.50732421875, 6.0078125, 6.50830078125, 7.0087890625, 7.50927734375, 8.009765625, 8.51025390625, 9.0107421875, 9.51123046875, 10.01171875, 10.51220703125, 11.0126953125, 11.51318359375, 12.013671875, 12.51416015625, 13.0146484375, 13.51513671875, 14.015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 13.0, 8.0, 21.0, 25.0, 37.0, 66.0, 120.0, 194.0, 351.0, 512.0, 1019.0, 1790.0, 3095.0, 5398.0, 9358.0, 16215.0, 26759.0, 43182.0, 65142.0, 90551.0, 115622.0, 132294.0, 133596.0, 120025.0, 95559.0, 69213.0, 46736.0, 29337.0, 17782.0, 10423.0, 6006.0, 3486.0, 1981.0, 1145.0, 603.0, 361.0, 210.0, 109.0, 88.0, 38.0, 25.0, 19.0, 22.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.230712890625, -12.80517578125, -12.379638671875, -11.9541015625, -11.528564453125, -11.10302734375, -10.677490234375, -10.251953125, -9.826416015625, -9.40087890625, -8.975341796875, -8.5498046875, -8.124267578125, -7.69873046875, -7.273193359375, -6.84765625, -6.422119140625, -5.99658203125, -5.571044921875, -5.1455078125, -4.719970703125, -4.29443359375, -3.868896484375, -3.443359375, -3.017822265625, -2.59228515625, -2.166748046875, -1.7412109375, -1.315673828125, -0.89013671875, -0.464599609375, -0.0390625, 0.386474609375, 0.81201171875, 1.237548828125, 1.6630859375, 2.088623046875, 2.51416015625, 2.939697265625, 3.365234375, 3.790771484375, 4.21630859375, 4.641845703125, 5.0673828125, 5.492919921875, 5.91845703125, 6.343994140625, 6.76953125, 7.195068359375, 7.62060546875, 8.046142578125, 8.4716796875, 8.897216796875, 9.32275390625, 9.748291015625, 10.173828125, 10.599365234375, 11.02490234375, 11.450439453125, 11.8759765625, 12.301513671875, 12.72705078125, 13.152587890625, 13.578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 6.0, 7.0, 14.0, 11.0, 15.0, 19.0, 18.0, 21.0, 30.0, 24.0, 24.0, 26.0, 25.0, 39.0, 31.0, 40.0, 38.0, 45.0, 36.0, 42.0, 36.0, 50.0, 34.0, 37.0, 41.0, 28.0, 29.0, 27.0, 21.0, 23.0, 29.0, 22.0, 17.0, 12.0, 16.0, 9.0, 4.0, 5.0, 5.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4296875, -10.094482421875, -9.75927734375, -9.424072265625, -9.0888671875, -8.753662109375, -8.41845703125, -8.083251953125, -7.748046875, -7.412841796875, -7.07763671875, -6.742431640625, -6.4072265625, -6.072021484375, -5.73681640625, -5.401611328125, -5.06640625, -4.731201171875, -4.39599609375, -4.060791015625, -3.7255859375, -3.390380859375, -3.05517578125, -2.719970703125, -2.384765625, -2.049560546875, -1.71435546875, -1.379150390625, -1.0439453125, -0.708740234375, -0.37353515625, -0.038330078125, 0.296875, 0.632080078125, 0.96728515625, 1.302490234375, 1.6376953125, 1.972900390625, 2.30810546875, 2.643310546875, 2.978515625, 3.313720703125, 3.64892578125, 3.984130859375, 4.3193359375, 4.654541015625, 4.98974609375, 5.324951171875, 5.66015625, 5.995361328125, 6.33056640625, 6.665771484375, 7.0009765625, 7.336181640625, 7.67138671875, 8.006591796875, 8.341796875, 8.677001953125, 9.01220703125, 9.347412109375, 9.6826171875, 10.017822265625, 10.35302734375, 10.688232421875, 11.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 6.0, 6.0, 12.0, 8.0, 14.0, 23.0, 41.0, 67.0, 104.0, 186.0, 283.0, 486.0, 816.0, 1515.0, 2716.0, 4793.0, 8896.0, 16689.0, 31789.0, 62490.0, 115847.0, 184371.0, 216566.0, 175034.0, 106282.0, 56715.0, 29416.0, 15234.0, 8134.0, 4396.0, 2362.0, 1354.0, 783.0, 448.0, 269.0, 169.0, 98.0, 56.0, 32.0, 19.0, 19.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.453125, -6.1993408203125, -5.945556640625, -5.6917724609375, -5.43798828125, -5.1842041015625, -4.930419921875, -4.6766357421875, -4.4228515625, -4.1690673828125, -3.915283203125, -3.6614990234375, -3.40771484375, -3.1539306640625, -2.900146484375, -2.6463623046875, -2.392578125, -2.1387939453125, -1.885009765625, -1.6312255859375, -1.37744140625, -1.1236572265625, -0.869873046875, -0.6160888671875, -0.3623046875, -0.1085205078125, 0.145263671875, 0.3990478515625, 0.65283203125, 0.9066162109375, 1.160400390625, 1.4141845703125, 1.66796875, 1.9217529296875, 2.175537109375, 2.4293212890625, 2.68310546875, 2.9368896484375, 3.190673828125, 3.4444580078125, 3.6982421875, 3.9520263671875, 4.205810546875, 4.4595947265625, 4.71337890625, 4.9671630859375, 5.220947265625, 5.4747314453125, 5.728515625, 5.9822998046875, 6.236083984375, 6.4898681640625, 6.74365234375, 6.9974365234375, 7.251220703125, 7.5050048828125, 7.7587890625, 8.0125732421875, 8.266357421875, 8.5201416015625, 8.77392578125, 9.0277099609375, 9.281494140625, 9.5352783203125, 9.7890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 5.0, 9.0, 11.0, 29.0, 23.0, 21.0, 33.0, 33.0, 59.0, 65.0, 55.0, 64.0, 87.0, 71.0, 65.0, 65.0, 47.0, 47.0, 32.0, 34.0, 24.0, 25.0, 19.0, 11.0, 10.0, 11.0, 5.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00078582763671875, -0.0007632747292518616, -0.0007407218217849731, -0.0007181689143180847, -0.0006956160068511963, -0.0006730630993843079, -0.0006505101919174194, -0.000627957284450531, -0.0006054043769836426, -0.0005828514695167542, -0.0005602985620498657, -0.0005377456545829773, -0.0005151927471160889, -0.0004926398396492004, -0.000470086932182312, -0.0004475340247154236, -0.00042498111724853516, -0.00040242820978164673, -0.0003798753023147583, -0.0003573223948478699, -0.00033476948738098145, -0.000312216579914093, -0.0002896636724472046, -0.00026711076498031616, -0.00024455785751342773, -0.0002220049500465393, -0.00019945204257965088, -0.00017689913511276245, -0.00015434622764587402, -0.0001317933201789856, -0.00010924041271209717, -8.668750524520874e-05, -6.413459777832031e-05, -4.1581690311431885e-05, -1.9028782844543457e-05, 3.5241246223449707e-06, 2.60770320892334e-05, 4.8629939556121826e-05, 7.118284702301025e-05, 9.373575448989868e-05, 0.00011628866195678711, 0.00013884156942367554, 0.00016139447689056396, 0.0001839473843574524, 0.00020650029182434082, 0.00022905319929122925, 0.0002516061067581177, 0.0002741590142250061, 0.00029671192169189453, 0.00031926482915878296, 0.0003418177366256714, 0.0003643706440925598, 0.00038692355155944824, 0.00040947645902633667, 0.0004320293664932251, 0.0004545822739601135, 0.00047713518142700195, 0.0004996880888938904, 0.0005222409963607788, 0.0005447939038276672, 0.0005673468112945557, 0.0005898997187614441, 0.0006124526262283325, 0.000635005533695221, 0.0006575584411621094]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 14.0, 21.0, 30.0, 40.0, 65.0, 79.0, 125.0, 171.0, 246.0, 371.0, 606.0, 922.0, 1404.0, 2260.0, 3479.0, 5610.0, 8975.0, 14031.0, 22929.0, 36064.0, 55781.0, 84522.0, 116412.0, 142454.0, 146557.0, 127362.0, 96514.0, 66107.0, 42654.0, 26958.0, 16973.0, 10624.0, 6539.0, 4117.0, 2593.0, 1733.0, 1120.0, 697.0, 494.0, 291.0, 202.0, 125.0, 90.0, 60.0, 43.0, 27.0, 23.0, 15.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.6171875, -5.43707275390625, -5.2569580078125, -5.07684326171875, -4.896728515625, -4.71661376953125, -4.5364990234375, -4.35638427734375, -4.17626953125, -3.99615478515625, -3.8160400390625, -3.63592529296875, -3.455810546875, -3.27569580078125, -3.0955810546875, -2.91546630859375, -2.7353515625, -2.55523681640625, -2.3751220703125, -2.19500732421875, -2.014892578125, -1.83477783203125, -1.6546630859375, -1.47454833984375, -1.29443359375, -1.11431884765625, -0.9342041015625, -0.75408935546875, -0.573974609375, -0.39385986328125, -0.2137451171875, -0.03363037109375, 0.146484375, 0.32659912109375, 0.5067138671875, 0.68682861328125, 0.866943359375, 1.04705810546875, 1.2271728515625, 1.40728759765625, 1.58740234375, 1.76751708984375, 1.9476318359375, 2.12774658203125, 2.307861328125, 2.48797607421875, 2.6680908203125, 2.84820556640625, 3.0283203125, 3.20843505859375, 3.3885498046875, 3.56866455078125, 3.748779296875, 3.92889404296875, 4.1090087890625, 4.28912353515625, 4.46923828125, 4.64935302734375, 4.8294677734375, 5.00958251953125, 5.189697265625, 5.36981201171875, 5.5499267578125, 5.73004150390625, 5.91015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 4.0, 12.0, 10.0, 14.0, 10.0, 18.0, 22.0, 35.0, 40.0, 47.0, 55.0, 68.0, 69.0, 81.0, 76.0, 71.0, 72.0, 49.0, 41.0, 43.0, 30.0, 22.0, 25.0, 15.0, 15.0, 11.0, 11.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.048828125, -2.956817626953125, -2.86480712890625, -2.772796630859375, -2.6807861328125, -2.588775634765625, -2.49676513671875, -2.404754638671875, -2.312744140625, -2.220733642578125, -2.12872314453125, -2.036712646484375, -1.9447021484375, -1.852691650390625, -1.76068115234375, -1.668670654296875, -1.57666015625, -1.484649658203125, -1.39263916015625, -1.300628662109375, -1.2086181640625, -1.116607666015625, -1.02459716796875, -0.932586669921875, -0.840576171875, -0.748565673828125, -0.65655517578125, -0.564544677734375, -0.4725341796875, -0.380523681640625, -0.28851318359375, -0.196502685546875, -0.1044921875, -0.012481689453125, 0.07952880859375, 0.171539306640625, 0.2635498046875, 0.355560302734375, 0.44757080078125, 0.539581298828125, 0.631591796875, 0.723602294921875, 0.81561279296875, 0.907623291015625, 0.9996337890625, 1.091644287109375, 1.18365478515625, 1.275665283203125, 1.36767578125, 1.459686279296875, 1.55169677734375, 1.643707275390625, 1.7357177734375, 1.827728271484375, 1.91973876953125, 2.011749267578125, 2.103759765625, 2.195770263671875, 2.28778076171875, 2.379791259765625, 2.4718017578125, 2.563812255859375, 2.65582275390625, 2.747833251953125, 2.83984375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 6.0, 11.0, 14.0, 12.0, 18.0, 9.0, 20.0, 18.0, 26.0, 34.0, 28.0, 26.0, 26.0, 43.0, 41.0, 42.0, 34.0, 45.0, 32.0, 31.0, 37.0, 46.0, 39.0, 30.0, 31.0, 33.0, 31.0, 26.0, 19.0, 19.0, 14.0, 22.0, 17.0, 20.0, 16.0, 10.0, 13.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0], "bins": [-11.96922492980957, -11.600311279296875, -11.23139762878418, -10.862483978271484, -10.493569374084473, -10.124655723571777, -9.755742073059082, -9.386828422546387, -9.017913818359375, -8.64900016784668, -8.280086517333984, -7.911172389984131, -7.542258262634277, -7.173344612121582, -6.804430961608887, -6.435517311096191, -6.066603660583496, -5.697690010070801, -5.328775882720947, -4.959862232208252, -4.590948104858398, -4.222034454345703, -3.853120803833008, -3.4842069149017334, -3.115293025970459, -2.7463791370391846, -2.37746524810791, -2.008551597595215, -1.6396377086639404, -1.270723819732666, -0.9018101692199707, -0.5328962802886963, -0.16398239135742188, 0.20493143796920776, 0.5738452672958374, 0.9427590370178223, 1.3116729259490967, 1.680586814880371, 2.0495004653930664, 2.418414354324341, 2.7873282432556152, 3.1562421321868896, 3.525156021118164, 3.8940696716308594, 4.262983322143555, 4.631897449493408, 5.0008111000061035, 5.369725227355957, 5.738638877868652, 6.107552528381348, 6.476466655731201, 6.8453803062438965, 7.21429443359375, 7.583208084106445, 7.952121734619141, 8.321035385131836, 8.689949035644531, 9.058862686157227, 9.427776336669922, 9.796689987182617, 10.165604591369629, 10.534518241882324, 10.90343189239502, 11.272345542907715, 11.641260147094727]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 14.0, 9.0, 9.0, 11.0, 13.0, 19.0, 19.0, 24.0, 19.0, 22.0, 27.0, 40.0, 38.0, 30.0, 29.0, 33.0, 60.0, 47.0, 40.0, 49.0, 31.0, 31.0, 43.0, 30.0, 36.0, 31.0, 37.0, 33.0, 24.0, 27.0, 19.0, 23.0, 19.0, 10.0, 12.0, 11.0, 6.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.43821907043457, -18.87759017944336, -18.31696128845215, -17.756332397460938, -17.195703506469727, -16.635074615478516, -16.074445724487305, -15.513816833496094, -14.953187942504883, -14.392559051513672, -13.831930160522461, -13.27130126953125, -12.710672378540039, -12.150043487548828, -11.589414596557617, -11.028785705566406, -10.468155860900879, -9.907526969909668, -9.346898078918457, -8.786269187927246, -8.225640296936035, -7.665011405944824, -7.104382038116455, -6.543753147125244, -5.983124256134033, -5.422495365142822, -4.861866474151611, -4.301237106323242, -3.7406084537506104, -3.1799795627593994, -2.6193504333496094, -2.0587215423583984, -1.4980926513671875, -0.9374637007713318, -0.3768347501754761, 0.18379426002502441, 0.7444231510162354, 1.3050520420074463, 1.8656811714172363, 2.4263100624084473, 2.986938953399658, 3.547567844390869, 4.10819673538208, 4.668826103210449, 5.22945499420166, 5.790083885192871, 6.350712776184082, 6.911341667175293, 7.471970558166504, 8.032599449157715, 8.593228340148926, 9.153857231140137, 9.714486122131348, 10.275115013122559, 10.835744857788086, 11.396373748779297, 11.957002639770508, 12.517631530761719, 13.07826042175293, 13.63888931274414, 14.199518203735352, 14.760147094726562, 15.320775985717773, 15.881404876708984, 16.442033767700195]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 12.0, 29.0, 33.0, 67.0, 132.0, 237.0, 364.0, 707.0, 1144.0, 1949.0, 3452.0, 5560.0, 9389.0, 15997.0, 26928.0, 43628.0, 70498.0, 111071.0, 169074.0, 245631.0, 333306.0, 420271.0, 482318.0, 496899.0, 463060.0, 387486.0, 298900.0, 215112.0, 145037.0, 94593.0, 59837.0, 36873.0, 22325.0, 13431.0, 7859.0, 4603.0, 2709.0, 1619.0, 860.0, 558.0, 314.0, 184.0, 92.0, 44.0, 36.0, 23.0, 11.0, 11.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.032470703125, -9.68994140625, -9.347412109375, -9.0048828125, -8.662353515625, -8.31982421875, -7.977294921875, -7.634765625, -7.292236328125, -6.94970703125, -6.607177734375, -6.2646484375, -5.922119140625, -5.57958984375, -5.237060546875, -4.89453125, -4.552001953125, -4.20947265625, -3.866943359375, -3.5244140625, -3.181884765625, -2.83935546875, -2.496826171875, -2.154296875, -1.811767578125, -1.46923828125, -1.126708984375, -0.7841796875, -0.441650390625, -0.09912109375, 0.243408203125, 0.5859375, 0.928466796875, 1.27099609375, 1.613525390625, 1.9560546875, 2.298583984375, 2.64111328125, 2.983642578125, 3.326171875, 3.668701171875, 4.01123046875, 4.353759765625, 4.6962890625, 5.038818359375, 5.38134765625, 5.723876953125, 6.06640625, 6.408935546875, 6.75146484375, 7.093994140625, 7.4365234375, 7.779052734375, 8.12158203125, 8.464111328125, 8.806640625, 9.149169921875, 9.49169921875, 9.834228515625, 10.1767578125, 10.519287109375, 10.86181640625, 11.204345703125, 11.546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 5.0, 9.0, 10.0, 14.0, 9.0, 10.0, 13.0, 13.0, 20.0, 18.0, 20.0, 29.0, 35.0, 34.0, 33.0, 35.0, 33.0, 44.0, 48.0, 44.0, 42.0, 36.0, 38.0, 34.0, 33.0, 35.0, 46.0, 27.0, 27.0, 24.0, 32.0, 27.0, 19.0, 14.0, 17.0, 13.0, 11.0, 7.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.84375, -13.4271240234375, -13.010498046875, -12.5938720703125, -12.17724609375, -11.7606201171875, -11.343994140625, -10.9273681640625, -10.5107421875, -10.0941162109375, -9.677490234375, -9.2608642578125, -8.84423828125, -8.4276123046875, -8.010986328125, -7.5943603515625, -7.177734375, -6.7611083984375, -6.344482421875, -5.9278564453125, -5.51123046875, -5.0946044921875, -4.677978515625, -4.2613525390625, -3.8447265625, -3.4281005859375, -3.011474609375, -2.5948486328125, -2.17822265625, -1.7615966796875, -1.344970703125, -0.9283447265625, -0.51171875, -0.0950927734375, 0.321533203125, 0.7381591796875, 1.15478515625, 1.5714111328125, 1.988037109375, 2.4046630859375, 2.8212890625, 3.2379150390625, 3.654541015625, 4.0711669921875, 4.48779296875, 4.9044189453125, 5.321044921875, 5.7376708984375, 6.154296875, 6.5709228515625, 6.987548828125, 7.4041748046875, 7.82080078125, 8.2374267578125, 8.654052734375, 9.0706787109375, 9.4873046875, 9.9039306640625, 10.320556640625, 10.7371826171875, 11.15380859375, 11.5704345703125, 11.987060546875, 12.4036865234375, 12.8203125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 14.0, 38.0, 62.0, 120.0, 162.0, 327.0, 514.0, 926.0, 1654.0, 2921.0, 4805.0, 8144.0, 13543.0, 22286.0, 35443.0, 55348.0, 84447.0, 124053.0, 174697.0, 235221.0, 300208.0, 358654.0, 403349.0, 422268.0, 411426.0, 373833.0, 316970.0, 253351.0, 189836.0, 137698.0, 95071.0, 62663.0, 40578.0, 25446.0, 15363.0, 9500.0, 5561.0, 3352.0, 1843.0, 1115.0, 621.0, 342.0, 246.0, 112.0, 63.0, 33.0, 14.0, 17.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-10.4921875, -10.1802978515625, -9.868408203125, -9.5565185546875, -9.24462890625, -8.9327392578125, -8.620849609375, -8.3089599609375, -7.9970703125, -7.6851806640625, -7.373291015625, -7.0614013671875, -6.74951171875, -6.4376220703125, -6.125732421875, -5.8138427734375, -5.501953125, -5.1900634765625, -4.878173828125, -4.5662841796875, -4.25439453125, -3.9425048828125, -3.630615234375, -3.3187255859375, -3.0068359375, -2.6949462890625, -2.383056640625, -2.0711669921875, -1.75927734375, -1.4473876953125, -1.135498046875, -0.8236083984375, -0.51171875, -0.1998291015625, 0.112060546875, 0.4239501953125, 0.73583984375, 1.0477294921875, 1.359619140625, 1.6715087890625, 1.9833984375, 2.2952880859375, 2.607177734375, 2.9190673828125, 3.23095703125, 3.5428466796875, 3.854736328125, 4.1666259765625, 4.478515625, 4.7904052734375, 5.102294921875, 5.4141845703125, 5.72607421875, 6.0379638671875, 6.349853515625, 6.6617431640625, 6.9736328125, 7.2855224609375, 7.597412109375, 7.9093017578125, 8.22119140625, 8.5330810546875, 8.844970703125, 9.1568603515625, 9.46875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 24.0, 27.0, 39.0, 25.0, 37.0, 56.0, 74.0, 85.0, 89.0, 106.0, 118.0, 156.0, 149.0, 186.0, 203.0, 214.0, 189.0, 213.0, 192.0, 218.0, 196.0, 183.0, 177.0, 162.0, 154.0, 123.0, 130.0, 103.0, 86.0, 61.0, 58.0, 55.0, 34.0, 31.0, 31.0, 12.0, 12.0, 17.0, 10.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.97265625, -6.7838134765625, -6.594970703125, -6.4061279296875, -6.21728515625, -6.0284423828125, -5.839599609375, -5.6507568359375, -5.4619140625, -5.2730712890625, -5.084228515625, -4.8953857421875, -4.70654296875, -4.5177001953125, -4.328857421875, -4.1400146484375, -3.951171875, -3.7623291015625, -3.573486328125, -3.3846435546875, -3.19580078125, -3.0069580078125, -2.818115234375, -2.6292724609375, -2.4404296875, -2.2515869140625, -2.062744140625, -1.8739013671875, -1.68505859375, -1.4962158203125, -1.307373046875, -1.1185302734375, -0.9296875, -0.7408447265625, -0.552001953125, -0.3631591796875, -0.17431640625, 0.0145263671875, 0.203369140625, 0.3922119140625, 0.5810546875, 0.7698974609375, 0.958740234375, 1.1475830078125, 1.33642578125, 1.5252685546875, 1.714111328125, 1.9029541015625, 2.091796875, 2.2806396484375, 2.469482421875, 2.6583251953125, 2.84716796875, 3.0360107421875, 3.224853515625, 3.4136962890625, 3.6025390625, 3.7913818359375, 3.980224609375, 4.1690673828125, 4.35791015625, 4.5467529296875, 4.735595703125, 4.9244384765625, 5.11328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 8.0, 8.0, 13.0, 18.0, 18.0, 15.0, 20.0, 36.0, 34.0, 26.0, 30.0, 33.0, 29.0, 32.0, 51.0, 49.0, 39.0, 42.0, 40.0, 38.0, 42.0, 49.0, 42.0, 34.0, 24.0, 31.0, 29.0, 21.0, 28.0, 18.0, 15.0, 16.0, 6.0, 10.0, 6.0, 7.0, 4.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3630952835083, -10.952713012695312, -10.542329788208008, -10.13194751739502, -9.721565246582031, -9.311182022094727, -8.900799751281738, -8.49041748046875, -8.080034255981445, -7.669651508331299, -7.2592692375183105, -6.848886489868164, -6.438504219055176, -6.028121471405029, -5.617738723754883, -5.2073564529418945, -4.796974182128906, -4.38659143447876, -3.9762091636657715, -3.565826416015625, -3.1554439067840576, -2.7450613975524902, -2.3346786499023438, -1.9242961406707764, -1.513913631439209, -1.1035311222076416, -0.6931484937667847, -0.28276586532592773, 0.12761664390563965, 0.537999153137207, 0.9483819007873535, 1.358764410018921, 1.7691478729248047, 2.179530382156372, 2.5899128913879395, 3.000295639038086, 3.4106781482696533, 3.8210606575012207, 4.231443405151367, 4.6418256759643555, 5.052208423614502, 5.462591171264648, 5.872973442077637, 6.283356189727783, 6.69373893737793, 7.104121208190918, 7.5145039558410645, 7.924886703491211, 8.3352689743042, 8.745651245117188, 9.156034469604492, 9.56641674041748, 9.976799011230469, 10.387182235717773, 10.797564506530762, 11.20794677734375, 11.618330001831055, 12.028712272644043, 12.439095497131348, 12.849477767944336, 13.259860038757324, 13.670242309570312, 14.080625534057617, 14.491007804870605, 14.901390075683594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 8.0, 11.0, 4.0, 7.0, 10.0, 14.0, 11.0, 13.0, 22.0, 19.0, 26.0, 28.0, 23.0, 34.0, 22.0, 34.0, 28.0, 36.0, 40.0, 31.0, 38.0, 51.0, 49.0, 42.0, 37.0, 30.0, 29.0, 34.0, 31.0, 37.0, 32.0, 26.0, 26.0, 18.0, 13.0, 12.0, 12.0, 11.0, 18.0, 9.0, 4.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-16.742549896240234, -16.260732650756836, -15.778915405273438, -15.297098159790039, -14.81528091430664, -14.333463668823242, -13.851646423339844, -13.369829177856445, -12.888011932373047, -12.406194686889648, -11.92437744140625, -11.442560195922852, -10.960742950439453, -10.478925704956055, -9.997108459472656, -9.515291213989258, -9.03347396850586, -8.551656723022461, -8.069839477539062, -7.588022232055664, -7.106204986572266, -6.624387741088867, -6.142570495605469, -5.66075325012207, -5.178936004638672, -4.697118759155273, -4.215301513671875, -3.7334842681884766, -3.251667022705078, -2.7698497772216797, -2.2880325317382812, -1.8062152862548828, -1.3243989944458008, -0.8425817489624023, -0.3607645034790039, 0.12105274200439453, 0.602869987487793, 1.0846872329711914, 1.5665044784545898, 2.0483217239379883, 2.5301389694213867, 3.011956214904785, 3.4937734603881836, 3.975590705871582, 4.4574079513549805, 4.939225196838379, 5.421042442321777, 5.902859687805176, 6.384676933288574, 6.866494178771973, 7.348311424255371, 7.8301286697387695, 8.311945915222168, 8.793763160705566, 9.275580406188965, 9.757397651672363, 10.239214897155762, 10.72103214263916, 11.202849388122559, 11.684666633605957, 12.166483879089355, 12.648301124572754, 13.130118370056152, 13.61193561553955, 14.09375286102295]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 15.0, 16.0, 30.0, 41.0, 47.0, 102.0, 145.0, 226.0, 370.0, 613.0, 977.0, 1605.0, 2661.0, 4641.0, 8149.0, 15383.0, 28335.0, 53429.0, 97302.0, 159134.0, 207525.0, 187331.0, 124614.0, 71716.0, 37924.0, 20416.0, 11139.0, 5986.0, 3470.0, 1984.0, 1176.0, 743.0, 459.0, 290.0, 197.0, 120.0, 76.0, 65.0, 38.0, 18.0, 6.0, 10.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.421875, -4.28253173828125, -4.1431884765625, -4.00384521484375, -3.864501953125, -3.72515869140625, -3.5858154296875, -3.44647216796875, -3.30712890625, -3.16778564453125, -3.0284423828125, -2.88909912109375, -2.749755859375, -2.61041259765625, -2.4710693359375, -2.33172607421875, -2.1923828125, -2.05303955078125, -1.9136962890625, -1.77435302734375, -1.635009765625, -1.49566650390625, -1.3563232421875, -1.21697998046875, -1.07763671875, -0.93829345703125, -0.7989501953125, -0.65960693359375, -0.520263671875, -0.38092041015625, -0.2415771484375, -0.10223388671875, 0.037109375, 0.17645263671875, 0.3157958984375, 0.45513916015625, 0.594482421875, 0.73382568359375, 0.8731689453125, 1.01251220703125, 1.15185546875, 1.29119873046875, 1.4305419921875, 1.56988525390625, 1.709228515625, 1.84857177734375, 1.9879150390625, 2.12725830078125, 2.2666015625, 2.40594482421875, 2.5452880859375, 2.68463134765625, 2.823974609375, 2.96331787109375, 3.1026611328125, 3.24200439453125, 3.38134765625, 3.52069091796875, 3.6600341796875, 3.79937744140625, 3.938720703125, 4.07806396484375, 4.2174072265625, 4.35675048828125, 4.49609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 9.0, 9.0, 4.0, 11.0, 7.0, 10.0, 14.0, 19.0, 15.0, 25.0, 32.0, 33.0, 28.0, 30.0, 25.0, 46.0, 24.0, 41.0, 54.0, 39.0, 36.0, 50.0, 43.0, 44.0, 26.0, 39.0, 35.0, 39.0, 29.0, 31.0, 30.0, 25.0, 18.0, 17.0, 15.0, 18.0, 9.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.524658203125, -16.98681640625, -16.448974609375, -15.9111328125, -15.373291015625, -14.83544921875, -14.297607421875, -13.759765625, -13.221923828125, -12.68408203125, -12.146240234375, -11.6083984375, -11.070556640625, -10.53271484375, -9.994873046875, -9.45703125, -8.919189453125, -8.38134765625, -7.843505859375, -7.3056640625, -6.767822265625, -6.22998046875, -5.692138671875, -5.154296875, -4.616455078125, -4.07861328125, -3.540771484375, -3.0029296875, -2.465087890625, -1.92724609375, -1.389404296875, -0.8515625, -0.313720703125, 0.22412109375, 0.761962890625, 1.2998046875, 1.837646484375, 2.37548828125, 2.913330078125, 3.451171875, 3.989013671875, 4.52685546875, 5.064697265625, 5.6025390625, 6.140380859375, 6.67822265625, 7.216064453125, 7.75390625, 8.291748046875, 8.82958984375, 9.367431640625, 9.9052734375, 10.443115234375, 10.98095703125, 11.518798828125, 12.056640625, 12.594482421875, 13.13232421875, 13.670166015625, 14.2080078125, 14.745849609375, 15.28369140625, 15.821533203125, 16.359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 15.0, 33.0, 33.0, 56.0, 68.0, 79.0, 103.0, 159.0, 228.0, 304.0, 457.0, 702.0, 1126.0, 1798.0, 3198.0, 5917.0, 11174.0, 22082.0, 43973.0, 84203.0, 147145.0, 206636.0, 204327.0, 143559.0, 82032.0, 42751.0, 21435.0, 10878.0, 5572.0, 3152.0, 1800.0, 1154.0, 689.0, 446.0, 331.0, 255.0, 165.0, 100.0, 91.0, 71.0, 56.0, 28.0, 36.0, 28.0, 17.0, 19.0, 8.0, 8.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.630859375, -3.517303466796875, -3.40374755859375, -3.290191650390625, -3.1766357421875, -3.063079833984375, -2.94952392578125, -2.835968017578125, -2.722412109375, -2.608856201171875, -2.49530029296875, -2.381744384765625, -2.2681884765625, -2.154632568359375, -2.04107666015625, -1.927520751953125, -1.81396484375, -1.700408935546875, -1.58685302734375, -1.473297119140625, -1.3597412109375, -1.246185302734375, -1.13262939453125, -1.019073486328125, -0.905517578125, -0.791961669921875, -0.67840576171875, -0.564849853515625, -0.4512939453125, -0.337738037109375, -0.22418212890625, -0.110626220703125, 0.0029296875, 0.116485595703125, 0.23004150390625, 0.343597412109375, 0.4571533203125, 0.570709228515625, 0.68426513671875, 0.797821044921875, 0.911376953125, 1.024932861328125, 1.13848876953125, 1.252044677734375, 1.3656005859375, 1.479156494140625, 1.59271240234375, 1.706268310546875, 1.81982421875, 1.933380126953125, 2.04693603515625, 2.160491943359375, 2.2740478515625, 2.387603759765625, 2.50115966796875, 2.614715576171875, 2.728271484375, 2.841827392578125, 2.95538330078125, 3.068939208984375, 3.1824951171875, 3.296051025390625, 3.40960693359375, 3.523162841796875, 3.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 10.0, 8.0, 10.0, 13.0, 23.0, 24.0, 21.0, 33.0, 25.0, 31.0, 21.0, 33.0, 36.0, 40.0, 29.0, 38.0, 43.0, 45.0, 48.0, 51.0, 36.0, 47.0, 31.0, 41.0, 35.0, 29.0, 27.0, 24.0, 17.0, 19.0, 22.0, 13.0, 10.0, 9.0, 9.0, 8.0, 3.0, 9.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.140625, -11.7838134765625, -11.427001953125, -11.0701904296875, -10.71337890625, -10.3565673828125, -9.999755859375, -9.6429443359375, -9.2861328125, -8.9293212890625, -8.572509765625, -8.2156982421875, -7.85888671875, -7.5020751953125, -7.145263671875, -6.7884521484375, -6.431640625, -6.0748291015625, -5.718017578125, -5.3612060546875, -5.00439453125, -4.6475830078125, -4.290771484375, -3.9339599609375, -3.5771484375, -3.2203369140625, -2.863525390625, -2.5067138671875, -2.14990234375, -1.7930908203125, -1.436279296875, -1.0794677734375, -0.72265625, -0.3658447265625, -0.009033203125, 0.3477783203125, 0.70458984375, 1.0614013671875, 1.418212890625, 1.7750244140625, 2.1318359375, 2.4886474609375, 2.845458984375, 3.2022705078125, 3.55908203125, 3.9158935546875, 4.272705078125, 4.6295166015625, 4.986328125, 5.3431396484375, 5.699951171875, 6.0567626953125, 6.41357421875, 6.7703857421875, 7.127197265625, 7.4840087890625, 7.8408203125, 8.1976318359375, 8.554443359375, 8.9112548828125, 9.26806640625, 9.6248779296875, 9.981689453125, 10.3385009765625, 10.6953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 10.0, 21.0, 25.0, 34.0, 51.0, 72.0, 101.0, 118.0, 197.0, 223.0, 360.0, 496.0, 660.0, 988.0, 1356.0, 2000.0, 2977.0, 4850.0, 8019.0, 14988.0, 29934.0, 66520.0, 158780.0, 300181.0, 246080.0, 109997.0, 47102.0, 22225.0, 11561.0, 6524.0, 3911.0, 2524.0, 1706.0, 1151.0, 771.0, 580.0, 403.0, 310.0, 206.0, 141.0, 109.0, 83.0, 55.0, 45.0, 19.0, 19.0, 15.0, 8.0, 7.0, 8.0, 6.0, 2.0, 2.0, 5.0], "bins": [-0.84423828125, -0.8192520141601562, -0.7942657470703125, -0.7692794799804688, -0.744293212890625, -0.7193069458007812, -0.6943206787109375, -0.6693344116210938, -0.64434814453125, -0.6193618774414062, -0.5943756103515625, -0.5693893432617188, -0.544403076171875, -0.5194168090820312, -0.4944305419921875, -0.46944427490234375, -0.4444580078125, -0.41947174072265625, -0.3944854736328125, -0.36949920654296875, -0.344512939453125, -0.31952667236328125, -0.2945404052734375, -0.26955413818359375, -0.24456787109375, -0.21958160400390625, -0.1945953369140625, -0.16960906982421875, -0.144622802734375, -0.11963653564453125, -0.0946502685546875, -0.06966400146484375, -0.044677734375, -0.01969146728515625, 0.0052947998046875, 0.03028106689453125, 0.055267333984375, 0.08025360107421875, 0.1052398681640625, 0.13022613525390625, 0.15521240234375, 0.18019866943359375, 0.2051849365234375, 0.23017120361328125, 0.255157470703125, 0.28014373779296875, 0.3051300048828125, 0.33011627197265625, 0.3551025390625, 0.38008880615234375, 0.4050750732421875, 0.43006134033203125, 0.455047607421875, 0.48003387451171875, 0.5050201416015625, 0.5300064086914062, 0.55499267578125, 0.5799789428710938, 0.6049652099609375, 0.6299514770507812, 0.654937744140625, 0.6799240112304688, 0.7049102783203125, 0.7298965454101562, 0.7548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 2.0, 6.0, 7.0, 13.0, 16.0, 16.0, 27.0, 28.0, 37.0, 48.0, 82.0, 111.0, 111.0, 123.0, 81.0, 68.0, 52.0, 34.0, 28.0, 24.0, 14.0, 7.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021278858184814453, -0.0002070162445306778, -0.00020124390721321106, -0.00019547156989574432, -0.0001896992325782776, -0.00018392689526081085, -0.00017815455794334412, -0.00017238222062587738, -0.00016660988330841064, -0.0001608375459909439, -0.00015506520867347717, -0.00014929287135601044, -0.0001435205340385437, -0.00013774819672107697, -0.00013197585940361023, -0.0001262035220861435, -0.00012043118476867676, -0.00011465884745121002, -0.00010888651013374329, -0.00010311417281627655, -9.734183549880981e-05, -9.156949818134308e-05, -8.579716086387634e-05, -8.002482354640961e-05, -7.425248622894287e-05, -6.848014891147614e-05, -6.27078115940094e-05, -5.6935474276542664e-05, -5.116313695907593e-05, -4.539079964160919e-05, -3.9618462324142456e-05, -3.384612500667572e-05, -2.8073787689208984e-05, -2.230145037174225e-05, -1.6529113054275513e-05, -1.0756775736808777e-05, -4.984438419342041e-06, 7.878988981246948e-07, 6.560236215591431e-06, 1.2332573533058167e-05, 1.8104910850524902e-05, 2.3877248167991638e-05, 2.9649585485458374e-05, 3.542192280292511e-05, 4.1194260120391846e-05, 4.696659743785858e-05, 5.273893475532532e-05, 5.851127207279205e-05, 6.428360939025879e-05, 7.005594670772552e-05, 7.582828402519226e-05, 8.1600621342659e-05, 8.737295866012573e-05, 9.314529597759247e-05, 9.89176332950592e-05, 0.00010468997061252594, 0.00011046230792999268, 0.00011623464524745941, 0.00012200698256492615, 0.00012777931988239288, 0.00013355165719985962, 0.00013932399451732635, 0.0001450963318347931, 0.00015086866915225983, 0.00015664100646972656]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 14.0, 9.0, 23.0, 32.0, 37.0, 58.0, 90.0, 109.0, 173.0, 294.0, 388.0, 564.0, 813.0, 1282.0, 1891.0, 2836.0, 4406.0, 7146.0, 11670.0, 19917.0, 37755.0, 75170.0, 158713.0, 268999.0, 222343.0, 111257.0, 53863.0, 27829.0, 15479.0, 9075.0, 5646.0, 3583.0, 2395.0, 1567.0, 954.0, 685.0, 465.0, 298.0, 210.0, 167.0, 102.0, 81.0, 45.0, 35.0, 27.0, 13.0, 14.0, 10.0, 6.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.4052734375, -1.3623809814453125, -1.319488525390625, -1.2765960693359375, -1.23370361328125, -1.1908111572265625, -1.147918701171875, -1.1050262451171875, -1.0621337890625, -1.0192413330078125, -0.976348876953125, -0.9334564208984375, -0.89056396484375, -0.8476715087890625, -0.804779052734375, -0.7618865966796875, -0.718994140625, -0.6761016845703125, -0.633209228515625, -0.5903167724609375, -0.54742431640625, -0.5045318603515625, -0.461639404296875, -0.4187469482421875, -0.3758544921875, -0.3329620361328125, -0.290069580078125, -0.2471771240234375, -0.20428466796875, -0.1613922119140625, -0.118499755859375, -0.0756072998046875, -0.03271484375, 0.0101776123046875, 0.053070068359375, 0.0959625244140625, 0.13885498046875, 0.1817474365234375, 0.224639892578125, 0.2675323486328125, 0.3104248046875, 0.3533172607421875, 0.396209716796875, 0.4391021728515625, 0.48199462890625, 0.5248870849609375, 0.567779541015625, 0.6106719970703125, 0.653564453125, 0.6964569091796875, 0.739349365234375, 0.7822418212890625, 0.82513427734375, 0.8680267333984375, 0.910919189453125, 0.9538116455078125, 0.9967041015625, 1.0395965576171875, 1.082489013671875, 1.1253814697265625, 1.16827392578125, 1.2111663818359375, 1.254058837890625, 1.2969512939453125, 1.33984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 15.0, 16.0, 18.0, 38.0, 69.0, 86.0, 151.0, 161.0, 135.0, 100.0, 71.0, 44.0, 21.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8728790283203125, -0.844390869140625, -0.8159027099609375, -0.78741455078125, -0.7589263916015625, -0.730438232421875, -0.7019500732421875, -0.6734619140625, -0.6449737548828125, -0.616485595703125, -0.5879974365234375, -0.55950927734375, -0.5310211181640625, -0.502532958984375, -0.4740447998046875, -0.445556640625, -0.4170684814453125, -0.388580322265625, -0.3600921630859375, -0.33160400390625, -0.3031158447265625, -0.274627685546875, -0.2461395263671875, -0.2176513671875, -0.1891632080078125, -0.160675048828125, -0.1321868896484375, -0.10369873046875, -0.0752105712890625, -0.046722412109375, -0.0182342529296875, 0.01025390625, 0.0387420654296875, 0.067230224609375, 0.0957183837890625, 0.12420654296875, 0.1526947021484375, 0.181182861328125, 0.2096710205078125, 0.2381591796875, 0.2666473388671875, 0.295135498046875, 0.3236236572265625, 0.35211181640625, 0.3805999755859375, 0.409088134765625, 0.4375762939453125, 0.466064453125, 0.4945526123046875, 0.523040771484375, 0.5515289306640625, 0.58001708984375, 0.6085052490234375, 0.636993408203125, 0.6654815673828125, 0.6939697265625, 0.7224578857421875, 0.750946044921875, 0.7794342041015625, 0.80792236328125, 0.8364105224609375, 0.864898681640625, 0.8933868408203125, 0.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 5.0, 12.0, 10.0, 11.0, 16.0, 16.0, 28.0, 22.0, 36.0, 31.0, 29.0, 30.0, 28.0, 37.0, 39.0, 49.0, 44.0, 41.0, 42.0, 44.0, 39.0, 45.0, 43.0, 38.0, 29.0, 33.0, 32.0, 24.0, 24.0, 21.0, 15.0, 15.0, 13.0, 12.0, 5.0, 5.0, 5.0, 7.0, 6.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.873531341552734, -10.458719253540039, -10.043907165527344, -9.629095077514648, -9.214282989501953, -8.799470901489258, -8.384658813476562, -7.969845771789551, -7.5550336837768555, -7.14022159576416, -6.725409507751465, -6.3105974197387695, -5.895784854888916, -5.480972766876221, -5.066160678863525, -4.651348114013672, -4.236536502838135, -3.8217244148254395, -3.406912088394165, -2.9921000003814697, -2.5772876739501953, -2.1624755859375, -1.7476634979248047, -1.3328511714935303, -0.918039083480835, -0.5032268762588501, -0.08841472864151001, 0.3263974189758301, 0.7412096261978149, 1.1560218334197998, 1.5708339214324951, 1.9856462478637695, 2.400458335876465, 2.81527042388916, 3.2300827503204346, 3.64489483833313, 4.059707164764404, 4.4745192527771, 4.889331340789795, 5.304143905639648, 5.718955993652344, 6.133768081665039, 6.548580169677734, 6.96339225769043, 7.378204822540283, 7.7930169105529785, 8.207828521728516, 8.622641563415527, 9.037452697753906, 9.452264785766602, 9.867076873779297, 10.281888961791992, 10.696701049804688, 11.111513137817383, 11.526325225830078, 11.94113826751709, 12.355950355529785, 12.77076244354248, 13.185574531555176, 13.600386619567871, 14.015198707580566, 14.430011749267578, 14.844823837280273, 15.259635925292969, 15.674448013305664]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 6.0, 5.0, 10.0, 14.0, 14.0, 12.0, 22.0, 18.0, 26.0, 23.0, 26.0, 33.0, 22.0, 33.0, 26.0, 39.0, 41.0, 34.0, 36.0, 42.0, 55.0, 41.0, 39.0, 33.0, 30.0, 28.0, 33.0, 41.0, 32.0, 28.0, 19.0, 21.0, 14.0, 11.0, 12.0, 11.0, 20.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0], "bins": [-16.54392433166504, -16.06588363647461, -15.587841033935547, -15.1097993850708, -14.631757736206055, -14.153717041015625, -13.675675392150879, -13.197633743286133, -12.719592094421387, -12.24155044555664, -11.763508796691895, -11.285467147827148, -10.807426452636719, -10.329383850097656, -9.851343154907227, -9.37330150604248, -8.895259857177734, -8.417218208312988, -7.939176559448242, -7.461135387420654, -6.983093738555908, -6.505052089691162, -6.027010917663574, -5.548969268798828, -5.070927619934082, -4.592885971069336, -4.11484432220459, -3.636803150177002, -3.158761501312256, -2.6807198524475098, -2.2026784420013428, -1.7246370315551758, -1.246596336364746, -0.7685548067092896, -0.290513277053833, 0.18752825260162354, 0.6655697822570801, 1.1436114311218262, 1.6216528415679932, 2.09969425201416, 2.5777359008789062, 3.0557775497436523, 3.5338189601898193, 4.011860370635986, 4.489902019500732, 4.9679436683654785, 5.445984840393066, 5.9240264892578125, 6.402068138122559, 6.880109786987305, 7.358151435852051, 7.836192607879639, 8.314233779907227, 8.792276382446289, 9.270317077636719, 9.748358726501465, 10.226400375366211, 10.704442024230957, 11.182483673095703, 11.66052532196045, 12.138566970825195, 12.616607666015625, 13.094649314880371, 13.572690963745117, 14.050732612609863]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 13.0, 13.0, 29.0, 47.0, 62.0, 109.0, 175.0, 291.0, 462.0, 758.0, 1177.0, 1729.0, 2838.0, 4459.0, 6724.0, 10249.0, 15071.0, 21936.0, 30502.0, 41517.0, 54067.0, 67766.0, 80416.0, 90743.0, 96725.0, 96681.0, 90590.0, 79953.0, 66827.0, 53063.0, 40514.0, 29572.0, 20885.0, 14428.0, 9981.0, 6476.0, 4254.0, 2689.0, 1756.0, 1124.0, 709.0, 415.0, 291.0, 165.0, 105.0, 83.0, 42.0, 25.0, 21.0, 9.0, 11.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.765625, -8.4913330078125, -8.217041015625, -7.9427490234375, -7.66845703125, -7.3941650390625, -7.119873046875, -6.8455810546875, -6.5712890625, -6.2969970703125, -6.022705078125, -5.7484130859375, -5.47412109375, -5.1998291015625, -4.925537109375, -4.6512451171875, -4.376953125, -4.1026611328125, -3.828369140625, -3.5540771484375, -3.27978515625, -3.0054931640625, -2.731201171875, -2.4569091796875, -2.1826171875, -1.9083251953125, -1.634033203125, -1.3597412109375, -1.08544921875, -0.8111572265625, -0.536865234375, -0.2625732421875, 0.01171875, 0.2860107421875, 0.560302734375, 0.8345947265625, 1.10888671875, 1.3831787109375, 1.657470703125, 1.9317626953125, 2.2060546875, 2.4803466796875, 2.754638671875, 3.0289306640625, 3.30322265625, 3.5775146484375, 3.851806640625, 4.1260986328125, 4.400390625, 4.6746826171875, 4.948974609375, 5.2232666015625, 5.49755859375, 5.7718505859375, 6.046142578125, 6.3204345703125, 6.5947265625, 6.8690185546875, 7.143310546875, 7.4176025390625, 7.69189453125, 7.9661865234375, 8.240478515625, 8.5147705078125, 8.7890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 7.0, 5.0, 19.0, 12.0, 17.0, 20.0, 24.0, 24.0, 24.0, 28.0, 36.0, 28.0, 28.0, 47.0, 40.0, 45.0, 55.0, 51.0, 34.0, 50.0, 35.0, 38.0, 35.0, 36.0, 31.0, 32.0, 24.0, 17.0, 26.0, 20.0, 26.0, 11.0, 9.0, 10.0, 16.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.3125, -16.796875, -16.28125, -15.765625, -15.25, -14.734375, -14.21875, -13.703125, -13.1875, -12.671875, -12.15625, -11.640625, -11.125, -10.609375, -10.09375, -9.578125, -9.0625, -8.546875, -8.03125, -7.515625, -7.0, -6.484375, -5.96875, -5.453125, -4.9375, -4.421875, -3.90625, -3.390625, -2.875, -2.359375, -1.84375, -1.328125, -0.8125, -0.296875, 0.21875, 0.734375, 1.25, 1.765625, 2.28125, 2.796875, 3.3125, 3.828125, 4.34375, 4.859375, 5.375, 5.890625, 6.40625, 6.921875, 7.4375, 7.953125, 8.46875, 8.984375, 9.5, 10.015625, 10.53125, 11.046875, 11.5625, 12.078125, 12.59375, 13.109375, 13.625, 14.140625, 14.65625, 15.171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 11.0, 12.0, 34.0, 65.0, 81.0, 124.0, 220.0, 324.0, 528.0, 857.0, 1364.0, 2139.0, 3336.0, 5283.0, 8171.0, 12386.0, 18347.0, 26977.0, 37223.0, 50392.0, 64909.0, 78970.0, 92032.0, 99385.0, 100434.0, 95072.0, 84891.0, 70984.0, 56167.0, 42934.0, 31029.0, 21731.0, 14700.0, 9896.0, 6367.0, 4114.0, 2691.0, 1643.0, 1074.0, 628.0, 416.0, 256.0, 139.0, 87.0, 55.0, 28.0, 25.0, 14.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -7.97265625, -7.6796875, -7.38671875, -7.09375, -6.80078125, -6.5078125, -6.21484375, -5.921875, -5.62890625, -5.3359375, -5.04296875, -4.75, -4.45703125, -4.1640625, -3.87109375, -3.578125, -3.28515625, -2.9921875, -2.69921875, -2.40625, -2.11328125, -1.8203125, -1.52734375, -1.234375, -0.94140625, -0.6484375, -0.35546875, -0.0625, 0.23046875, 0.5234375, 0.81640625, 1.109375, 1.40234375, 1.6953125, 1.98828125, 2.28125, 2.57421875, 2.8671875, 3.16015625, 3.453125, 3.74609375, 4.0390625, 4.33203125, 4.625, 4.91796875, 5.2109375, 5.50390625, 5.796875, 6.08984375, 6.3828125, 6.67578125, 6.96875, 7.26171875, 7.5546875, 7.84765625, 8.140625, 8.43359375, 8.7265625, 9.01953125, 9.3125, 9.60546875, 9.8984375, 10.19140625, 10.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 6.0, 9.0, 9.0, 11.0, 12.0, 15.0, 15.0, 31.0, 19.0, 21.0, 37.0, 32.0, 37.0, 28.0, 39.0, 46.0, 35.0, 32.0, 50.0, 47.0, 47.0, 51.0, 48.0, 39.0, 25.0, 26.0, 37.0, 29.0, 25.0, 20.0, 22.0, 13.0, 10.0, 15.0, 12.0, 9.0, 5.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1171875, -10.7918701171875, -10.466552734375, -10.1412353515625, -9.81591796875, -9.4906005859375, -9.165283203125, -8.8399658203125, -8.5146484375, -8.1893310546875, -7.864013671875, -7.5386962890625, -7.21337890625, -6.8880615234375, -6.562744140625, -6.2374267578125, -5.912109375, -5.5867919921875, -5.261474609375, -4.9361572265625, -4.61083984375, -4.2855224609375, -3.960205078125, -3.6348876953125, -3.3095703125, -2.9842529296875, -2.658935546875, -2.3336181640625, -2.00830078125, -1.6829833984375, -1.357666015625, -1.0323486328125, -0.70703125, -0.3817138671875, -0.056396484375, 0.2689208984375, 0.59423828125, 0.9195556640625, 1.244873046875, 1.5701904296875, 1.8955078125, 2.2208251953125, 2.546142578125, 2.8714599609375, 3.19677734375, 3.5220947265625, 3.847412109375, 4.1727294921875, 4.498046875, 4.8233642578125, 5.148681640625, 5.4739990234375, 5.79931640625, 6.1246337890625, 6.449951171875, 6.7752685546875, 7.1005859375, 7.4259033203125, 7.751220703125, 8.0765380859375, 8.40185546875, 8.7271728515625, 9.052490234375, 9.3778076171875, 9.703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 16.0, 31.0, 39.0, 60.0, 76.0, 127.0, 179.0, 304.0, 426.0, 650.0, 966.0, 1505.0, 2268.0, 3327.0, 5170.0, 7833.0, 11791.0, 17705.0, 26549.0, 38917.0, 54889.0, 72532.0, 91587.0, 106714.0, 113852.0, 110873.0, 98899.0, 80369.0, 62232.0, 44791.0, 31017.0, 21233.0, 14082.0, 9431.0, 6064.0, 4039.0, 2758.0, 1769.0, 1135.0, 802.0, 547.0, 347.0, 225.0, 154.0, 93.0, 55.0, 31.0, 19.0, 19.0, 8.0, 7.0, 7.0, 7.0, 6.0, 1.0, 6.0], "bins": [-3.962890625, -3.84173583984375, -3.7205810546875, -3.59942626953125, -3.478271484375, -3.35711669921875, -3.2359619140625, -3.11480712890625, -2.99365234375, -2.87249755859375, -2.7513427734375, -2.63018798828125, -2.509033203125, -2.38787841796875, -2.2667236328125, -2.14556884765625, -2.0244140625, -1.90325927734375, -1.7821044921875, -1.66094970703125, -1.539794921875, -1.41864013671875, -1.2974853515625, -1.17633056640625, -1.05517578125, -0.93402099609375, -0.8128662109375, -0.69171142578125, -0.570556640625, -0.44940185546875, -0.3282470703125, -0.20709228515625, -0.0859375, 0.03521728515625, 0.1563720703125, 0.27752685546875, 0.398681640625, 0.51983642578125, 0.6409912109375, 0.76214599609375, 0.88330078125, 1.00445556640625, 1.1256103515625, 1.24676513671875, 1.367919921875, 1.48907470703125, 1.6102294921875, 1.73138427734375, 1.8525390625, 1.97369384765625, 2.0948486328125, 2.21600341796875, 2.337158203125, 2.45831298828125, 2.5794677734375, 2.70062255859375, 2.82177734375, 2.94293212890625, 3.0640869140625, 3.18524169921875, 3.306396484375, 3.42755126953125, 3.5487060546875, 3.66986083984375, 3.791015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 11.0, 15.0, 19.0, 22.0, 23.0, 21.0, 40.0, 30.0, 33.0, 42.0, 43.0, 52.0, 46.0, 42.0, 55.0, 42.0, 38.0, 46.0, 44.0, 36.0, 21.0, 45.0, 26.0, 26.0, 22.0, 31.0, 13.0, 16.0, 9.0, 16.0, 8.0, 6.0, 11.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000446319580078125, -0.0004323050379753113, -0.00041829049587249756, -0.00040427595376968384, -0.0003902614116668701, -0.0003762468695640564, -0.0003622323274612427, -0.00034821778535842896, -0.00033420324325561523, -0.0003201887011528015, -0.0003061741590499878, -0.00029215961694717407, -0.00027814507484436035, -0.00026413053274154663, -0.0002501159906387329, -0.0002361014485359192, -0.00022208690643310547, -0.00020807236433029175, -0.00019405782222747803, -0.0001800432801246643, -0.00016602873802185059, -0.00015201419591903687, -0.00013799965381622314, -0.00012398511171340942, -0.0001099705696105957, -9.595602750778198e-05, -8.194148540496826e-05, -6.792694330215454e-05, -5.391240119934082e-05, -3.98978590965271e-05, -2.588331699371338e-05, -1.1868774890899658e-05, 2.1457672119140625e-06, 1.6160309314727783e-05, 3.0174851417541504e-05, 4.4189393520355225e-05, 5.8203935623168945e-05, 7.221847772598267e-05, 8.623301982879639e-05, 0.00010024756193161011, 0.00011426210403442383, 0.00012827664613723755, 0.00014229118824005127, 0.000156305730342865, 0.0001703202724456787, 0.00018433481454849243, 0.00019834935665130615, 0.00021236389875411987, 0.0002263784408569336, 0.00024039298295974731, 0.00025440752506256104, 0.00026842206716537476, 0.0002824366092681885, 0.0002964511513710022, 0.0003104656934738159, 0.00032448023557662964, 0.00033849477767944336, 0.0003525093197822571, 0.0003665238618850708, 0.0003805384039878845, 0.00039455294609069824, 0.00040856748819351196, 0.0004225820302963257, 0.0004365965723991394, 0.0004506111145019531]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 15.0, 15.0, 29.0, 38.0, 73.0, 105.0, 161.0, 284.0, 459.0, 724.0, 1261.0, 2166.0, 3844.0, 6658.0, 11544.0, 20095.0, 34413.0, 56722.0, 87264.0, 120281.0, 146056.0, 152036.0, 132641.0, 101027.0, 68227.0, 42583.0, 25129.0, 14622.0, 8410.0, 4798.0, 2772.0, 1618.0, 940.0, 613.0, 342.0, 240.0, 127.0, 81.0, 50.0, 32.0, 12.0, 13.0, 11.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.14227294921875, -4.9720458984375, -4.80181884765625, -4.631591796875, -4.46136474609375, -4.2911376953125, -4.12091064453125, -3.95068359375, -3.78045654296875, -3.6102294921875, -3.44000244140625, -3.269775390625, -3.09954833984375, -2.9293212890625, -2.75909423828125, -2.5888671875, -2.41864013671875, -2.2484130859375, -2.07818603515625, -1.907958984375, -1.73773193359375, -1.5675048828125, -1.39727783203125, -1.22705078125, -1.05682373046875, -0.8865966796875, -0.71636962890625, -0.546142578125, -0.37591552734375, -0.2056884765625, -0.03546142578125, 0.134765625, 0.30499267578125, 0.4752197265625, 0.64544677734375, 0.815673828125, 0.98590087890625, 1.1561279296875, 1.32635498046875, 1.49658203125, 1.66680908203125, 1.8370361328125, 2.00726318359375, 2.177490234375, 2.34771728515625, 2.5179443359375, 2.68817138671875, 2.8583984375, 3.02862548828125, 3.1988525390625, 3.36907958984375, 3.539306640625, 3.70953369140625, 3.8797607421875, 4.04998779296875, 4.22021484375, 4.39044189453125, 4.5606689453125, 4.73089599609375, 4.901123046875, 5.07135009765625, 5.2415771484375, 5.41180419921875, 5.58203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 4.0, 3.0, 9.0, 8.0, 12.0, 11.0, 19.0, 12.0, 16.0, 29.0, 31.0, 30.0, 40.0, 28.0, 34.0, 30.0, 46.0, 48.0, 49.0, 39.0, 43.0, 48.0, 43.0, 47.0, 48.0, 46.0, 38.0, 38.0, 26.0, 23.0, 13.0, 20.0, 12.0, 15.0, 12.0, 4.0, 3.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.095703125, -2.03509521484375, -1.9744873046875, -1.91387939453125, -1.853271484375, -1.79266357421875, -1.7320556640625, -1.67144775390625, -1.61083984375, -1.55023193359375, -1.4896240234375, -1.42901611328125, -1.368408203125, -1.30780029296875, -1.2471923828125, -1.18658447265625, -1.1259765625, -1.06536865234375, -1.0047607421875, -0.94415283203125, -0.883544921875, -0.82293701171875, -0.7623291015625, -0.70172119140625, -0.64111328125, -0.58050537109375, -0.5198974609375, -0.45928955078125, -0.398681640625, -0.33807373046875, -0.2774658203125, -0.21685791015625, -0.15625, -0.09564208984375, -0.0350341796875, 0.02557373046875, 0.086181640625, 0.14678955078125, 0.2073974609375, 0.26800537109375, 0.32861328125, 0.38922119140625, 0.4498291015625, 0.51043701171875, 0.571044921875, 0.63165283203125, 0.6922607421875, 0.75286865234375, 0.8134765625, 0.87408447265625, 0.9346923828125, 0.99530029296875, 1.055908203125, 1.11651611328125, 1.1771240234375, 1.23773193359375, 1.29833984375, 1.35894775390625, 1.4195556640625, 1.48016357421875, 1.540771484375, 1.60137939453125, 1.6619873046875, 1.72259521484375, 1.783203125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 12.0, 12.0, 21.0, 17.0, 18.0, 28.0, 25.0, 27.0, 32.0, 36.0, 38.0, 28.0, 48.0, 36.0, 42.0, 46.0, 45.0, 45.0, 38.0, 47.0, 51.0, 36.0, 41.0, 32.0, 24.0, 23.0, 19.0, 23.0, 17.0, 20.0, 8.0, 7.0, 12.0, 2.0, 7.0, 5.0, 2.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.385777473449707, -10.968724250793457, -10.551671028137207, -10.134617805480957, -9.717564582824707, -9.30051040649414, -8.88345718383789, -8.46640396118164, -8.04935073852539, -7.632297515869141, -7.215244293212891, -6.798191070556641, -6.381137371063232, -5.964084148406982, -5.547030925750732, -5.129977226257324, -4.712924480438232, -4.295871257781982, -3.8788177967071533, -3.4617645740509033, -3.044711112976074, -2.627657890319824, -2.210604667663574, -1.7935512065887451, -1.3764979839324951, -0.9594446420669556, -0.5423913598060608, -0.12533807754516602, 0.29171526432037354, 0.7087686061859131, 1.125821828842163, 1.5428752899169922, 1.9599285125732422, 2.376981735229492, 2.7940351963043213, 3.2110884189605713, 3.6281418800354004, 4.04519510269165, 4.4622483253479, 4.879302024841309, 5.296355247497559, 5.713408470153809, 6.130461692810059, 6.547514915466309, 6.964568614959717, 7.381621837615967, 7.798675060272217, 8.215728759765625, 8.632781982421875, 9.049835205078125, 9.466888427734375, 9.883941650390625, 10.300994873046875, 10.718048095703125, 11.135101318359375, 11.552155494689941, 11.969207763671875, 12.386260986328125, 12.803314208984375, 13.220367431640625, 13.637420654296875, 14.054473876953125, 14.471527099609375, 14.888581275939941, 15.305634498596191]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 9.0, 6.0, 13.0, 10.0, 8.0, 8.0, 13.0, 29.0, 21.0, 29.0, 21.0, 25.0, 35.0, 39.0, 33.0, 28.0, 34.0, 42.0, 42.0, 31.0, 42.0, 50.0, 27.0, 40.0, 45.0, 35.0, 31.0, 31.0, 26.0, 26.0, 24.0, 19.0, 10.0, 16.0, 21.0, 16.0, 14.0, 9.0, 8.0, 14.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-17.004196166992188, -16.49961280822754, -15.99502944946289, -15.490447044372559, -14.98586368560791, -14.481280326843262, -13.97669792175293, -13.472114562988281, -12.967531204223633, -12.462947845458984, -11.958364486694336, -11.453782081604004, -10.949198722839355, -10.444615364074707, -9.940032958984375, -9.435449600219727, -8.930866241455078, -8.42628288269043, -7.9217000007629395, -7.417117118835449, -6.912533760070801, -6.407950401306152, -5.903367519378662, -5.398784637451172, -4.894201278686523, -4.389617919921875, -3.8850350379943848, -3.3804519176483154, -2.875868797302246, -2.3712856769561768, -1.8667025566101074, -1.362119436264038, -0.8575363159179688, -0.3529531955718994, 0.15162992477416992, 0.6562130451202393, 1.1607961654663086, 1.665379285812378, 2.1699624061584473, 2.6745455265045166, 3.179128646850586, 3.6837117671966553, 4.188294887542725, 4.692877769470215, 5.197461128234863, 5.702044486999512, 6.206627368927002, 6.711210250854492, 7.215793609619141, 7.720376968383789, 8.224960327148438, 8.72954273223877, 9.234126091003418, 9.738709449768066, 10.243291854858398, 10.747875213623047, 11.252458572387695, 11.757041931152344, 12.261625289916992, 12.766207695007324, 13.270791053771973, 13.775374412536621, 14.279956817626953, 14.784540176391602, 15.28912353515625]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 9.0, 14.0, 29.0, 44.0, 75.0, 89.0, 149.0, 225.0, 406.0, 635.0, 1007.0, 1594.0, 2444.0, 4025.0, 6194.0, 9408.0, 14522.0, 22175.0, 33493.0, 49898.0, 73426.0, 105623.0, 146341.0, 198075.0, 256026.0, 315297.0, 366757.0, 398311.0, 405767.0, 382758.0, 339192.0, 282122.0, 223455.0, 168482.0, 123040.0, 86403.0, 60198.0, 40469.0, 26871.0, 17547.0, 11396.0, 7320.0, 4698.0, 3062.0, 1965.0, 1180.0, 756.0, 507.0, 306.0, 189.0, 114.0, 67.0, 59.0, 33.0, 22.0, 9.0, 8.0, 5.0, 2.0, 1.0, 1.0], "bins": [-8.71875, -8.439453125, -8.16015625, -7.880859375, -7.6015625, -7.322265625, -7.04296875, -6.763671875, -6.484375, -6.205078125, -5.92578125, -5.646484375, -5.3671875, -5.087890625, -4.80859375, -4.529296875, -4.25, -3.970703125, -3.69140625, -3.412109375, -3.1328125, -2.853515625, -2.57421875, -2.294921875, -2.015625, -1.736328125, -1.45703125, -1.177734375, -0.8984375, -0.619140625, -0.33984375, -0.060546875, 0.21875, 0.498046875, 0.77734375, 1.056640625, 1.3359375, 1.615234375, 1.89453125, 2.173828125, 2.453125, 2.732421875, 3.01171875, 3.291015625, 3.5703125, 3.849609375, 4.12890625, 4.408203125, 4.6875, 4.966796875, 5.24609375, 5.525390625, 5.8046875, 6.083984375, 6.36328125, 6.642578125, 6.921875, 7.201171875, 7.48046875, 7.759765625, 8.0390625, 8.318359375, 8.59765625, 8.876953125, 9.15625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 9.0, 10.0, 17.0, 14.0, 18.0, 16.0, 16.0, 25.0, 25.0, 41.0, 34.0, 38.0, 27.0, 30.0, 33.0, 37.0, 42.0, 45.0, 41.0, 39.0, 42.0, 45.0, 33.0, 43.0, 33.0, 32.0, 24.0, 33.0, 28.0, 16.0, 14.0, 10.0, 15.0, 15.0, 11.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1875, -12.7838134765625, -12.380126953125, -11.9764404296875, -11.57275390625, -11.1690673828125, -10.765380859375, -10.3616943359375, -9.9580078125, -9.5543212890625, -9.150634765625, -8.7469482421875, -8.34326171875, -7.9395751953125, -7.535888671875, -7.1322021484375, -6.728515625, -6.3248291015625, -5.921142578125, -5.5174560546875, -5.11376953125, -4.7100830078125, -4.306396484375, -3.9027099609375, -3.4990234375, -3.0953369140625, -2.691650390625, -2.2879638671875, -1.88427734375, -1.4805908203125, -1.076904296875, -0.6732177734375, -0.26953125, 0.1341552734375, 0.537841796875, 0.9415283203125, 1.34521484375, 1.7489013671875, 2.152587890625, 2.5562744140625, 2.9599609375, 3.3636474609375, 3.767333984375, 4.1710205078125, 4.57470703125, 4.9783935546875, 5.382080078125, 5.7857666015625, 6.189453125, 6.5931396484375, 6.996826171875, 7.4005126953125, 7.80419921875, 8.2078857421875, 8.611572265625, 9.0152587890625, 9.4189453125, 9.8226318359375, 10.226318359375, 10.6300048828125, 11.03369140625, 11.4373779296875, 11.841064453125, 12.2447509765625, 12.6484375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 14.0, 21.0, 46.0, 89.0, 151.0, 253.0, 413.0, 703.0, 1191.0, 1964.0, 3387.0, 5427.0, 8982.0, 14448.0, 22147.0, 34376.0, 51579.0, 76790.0, 108425.0, 149880.0, 199003.0, 251721.0, 303389.0, 347589.0, 375683.0, 384098.0, 370292.0, 336536.0, 289488.0, 237189.0, 184194.0, 138374.0, 99243.0, 69058.0, 45974.0, 30688.0, 19661.0, 12526.0, 7599.0, 4760.0, 2752.0, 1724.0, 1037.0, 611.0, 338.0, 191.0, 133.0, 64.0, 36.0, 19.0, 13.0, 6.0, 6.0, 4.0, 1.0], "bins": [-9.78125, -9.49658203125, -9.2119140625, -8.92724609375, -8.642578125, -8.35791015625, -8.0732421875, -7.78857421875, -7.50390625, -7.21923828125, -6.9345703125, -6.64990234375, -6.365234375, -6.08056640625, -5.7958984375, -5.51123046875, -5.2265625, -4.94189453125, -4.6572265625, -4.37255859375, -4.087890625, -3.80322265625, -3.5185546875, -3.23388671875, -2.94921875, -2.66455078125, -2.3798828125, -2.09521484375, -1.810546875, -1.52587890625, -1.2412109375, -0.95654296875, -0.671875, -0.38720703125, -0.1025390625, 0.18212890625, 0.466796875, 0.75146484375, 1.0361328125, 1.32080078125, 1.60546875, 1.89013671875, 2.1748046875, 2.45947265625, 2.744140625, 3.02880859375, 3.3134765625, 3.59814453125, 3.8828125, 4.16748046875, 4.4521484375, 4.73681640625, 5.021484375, 5.30615234375, 5.5908203125, 5.87548828125, 6.16015625, 6.44482421875, 6.7294921875, 7.01416015625, 7.298828125, 7.58349609375, 7.8681640625, 8.15283203125, 8.4375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 2.0, 4.0, 17.0, 10.0, 16.0, 19.0, 24.0, 28.0, 28.0, 38.0, 45.0, 70.0, 73.0, 85.0, 131.0, 135.0, 141.0, 134.0, 173.0, 188.0, 216.0, 203.0, 236.0, 196.0, 196.0, 185.0, 184.0, 194.0, 160.0, 134.0, 134.0, 126.0, 114.0, 93.0, 67.0, 60.0, 47.0, 33.0, 26.0, 28.0, 18.0, 17.0, 10.0, 16.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.1875, -6.00054931640625, -5.8135986328125, -5.62664794921875, -5.439697265625, -5.25274658203125, -5.0657958984375, -4.87884521484375, -4.69189453125, -4.50494384765625, -4.3179931640625, -4.13104248046875, -3.944091796875, -3.75714111328125, -3.5701904296875, -3.38323974609375, -3.1962890625, -3.00933837890625, -2.8223876953125, -2.63543701171875, -2.448486328125, -2.26153564453125, -2.0745849609375, -1.88763427734375, -1.70068359375, -1.51373291015625, -1.3267822265625, -1.13983154296875, -0.952880859375, -0.76593017578125, -0.5789794921875, -0.39202880859375, -0.205078125, -0.01812744140625, 0.1688232421875, 0.35577392578125, 0.542724609375, 0.72967529296875, 0.9166259765625, 1.10357666015625, 1.29052734375, 1.47747802734375, 1.6644287109375, 1.85137939453125, 2.038330078125, 2.22528076171875, 2.4122314453125, 2.59918212890625, 2.7861328125, 2.97308349609375, 3.1600341796875, 3.34698486328125, 3.533935546875, 3.72088623046875, 3.9078369140625, 4.09478759765625, 4.28173828125, 4.46868896484375, 4.6556396484375, 4.84259033203125, 5.029541015625, 5.21649169921875, 5.4034423828125, 5.59039306640625, 5.77734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 10.0, 11.0, 23.0, 27.0, 28.0, 29.0, 29.0, 30.0, 43.0, 42.0, 50.0, 53.0, 54.0, 47.0, 38.0, 47.0, 38.0, 48.0, 52.0, 43.0, 35.0, 25.0, 28.0, 19.0, 19.0, 14.0, 30.0, 10.0, 14.0, 10.0, 7.0, 6.0, 3.0, 3.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-15.986053466796875, -15.557334899902344, -15.128615379333496, -14.699896812438965, -14.271178245544434, -13.842458724975586, -13.413740158081055, -12.985021591186523, -12.556303024291992, -12.127584457397461, -11.698864936828613, -11.270146369934082, -10.84142780303955, -10.412708282470703, -9.983989715576172, -9.55527114868164, -9.126551628112793, -8.697833061218262, -8.269113540649414, -7.840394973754883, -7.411676406860352, -6.982957363128662, -6.554238319396973, -6.125519752502441, -5.696800708770752, -5.2680816650390625, -4.839363098144531, -4.410644054412842, -3.9819252490997314, -3.553206443786621, -3.1244874000549316, -2.6957685947418213, -2.2670507431030273, -1.838331937789917, -1.409613013267517, -0.9808940887451172, -0.5521752834320068, -0.12345647811889648, 0.30526256561279297, 0.7339813709259033, 1.1627001762390137, 1.591418981552124, 2.0201377868652344, 2.448856830596924, 2.877575635910034, 3.3062944412231445, 3.735013484954834, 4.163732528686523, 4.592451095581055, 5.021170139312744, 5.449888706207275, 5.878607749938965, 6.307326316833496, 6.7360453605651855, 7.164764404296875, 7.593482971191406, 8.022201538085938, 8.450920104980469, 8.879639625549316, 9.308358192443848, 9.737076759338379, 10.165796279907227, 10.594514846801758, 11.023233413696289, 11.451952934265137]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 11.0, 5.0, 11.0, 6.0, 17.0, 11.0, 13.0, 19.0, 18.0, 29.0, 27.0, 22.0, 53.0, 34.0, 28.0, 34.0, 41.0, 35.0, 40.0, 48.0, 37.0, 42.0, 45.0, 37.0, 33.0, 44.0, 34.0, 35.0, 28.0, 24.0, 14.0, 21.0, 25.0, 11.0, 16.0, 5.0, 16.0, 5.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.235815048217773, -16.738744735717773, -16.241676330566406, -15.744606018066406, -15.247536659240723, -14.750467300415039, -14.253396987915039, -13.756327629089355, -13.259258270263672, -12.762188911437988, -12.265119552612305, -11.768049240112305, -11.270979881286621, -10.773910522460938, -10.276840209960938, -9.779770851135254, -9.28270149230957, -8.785632133483887, -8.288562774658203, -7.791492462158203, -7.2944231033325195, -6.797353744506836, -6.300283908843994, -5.803214073181152, -5.306144714355469, -4.809075355529785, -4.312005519866943, -3.8149359226226807, -3.317866325378418, -2.8207967281341553, -2.3237271308898926, -1.8266575336456299, -1.3295888900756836, -0.8325192928314209, -0.3354496955871582, 0.1616199016571045, 0.6586894989013672, 1.1557590961456299, 1.6528286933898926, 2.1498982906341553, 2.646967887878418, 3.1440374851226807, 3.6411070823669434, 4.138176918029785, 4.635246276855469, 5.132315635681152, 5.629385471343994, 6.126455307006836, 6.6235246658325195, 7.120594024658203, 7.617663860321045, 8.114733695983887, 8.61180305480957, 9.108872413635254, 9.605941772460938, 10.103012084960938, 10.600081443786621, 11.097150802612305, 11.594221115112305, 12.091290473937988, 12.588359832763672, 13.085429191589355, 13.582498550415039, 14.079568862915039, 14.576638221740723]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 12.0, 19.0, 22.0, 26.0, 38.0, 87.0, 118.0, 179.0, 269.0, 406.0, 597.0, 990.0, 1465.0, 2496.0, 3952.0, 6422.0, 10940.0, 18707.0, 32022.0, 55524.0, 90581.0, 136237.0, 174128.0, 171602.0, 130894.0, 85065.0, 51534.0, 30177.0, 17463.0, 10377.0, 6185.0, 3744.0, 2251.0, 1365.0, 910.0, 625.0, 372.0, 276.0, 145.0, 128.0, 75.0, 43.0, 33.0, 23.0, 9.0, 12.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.153228759765625, -3.05450439453125, -2.955780029296875, -2.8570556640625, -2.758331298828125, -2.65960693359375, -2.560882568359375, -2.462158203125, -2.363433837890625, -2.26470947265625, -2.165985107421875, -2.0672607421875, -1.968536376953125, -1.86981201171875, -1.771087646484375, -1.67236328125, -1.573638916015625, -1.47491455078125, -1.376190185546875, -1.2774658203125, -1.178741455078125, -1.08001708984375, -0.981292724609375, -0.882568359375, -0.783843994140625, -0.68511962890625, -0.586395263671875, -0.4876708984375, -0.388946533203125, -0.29022216796875, -0.191497802734375, -0.0927734375, 0.005950927734375, 0.10467529296875, 0.203399658203125, 0.3021240234375, 0.400848388671875, 0.49957275390625, 0.598297119140625, 0.697021484375, 0.795745849609375, 0.89447021484375, 0.993194580078125, 1.0919189453125, 1.190643310546875, 1.28936767578125, 1.388092041015625, 1.48681640625, 1.585540771484375, 1.68426513671875, 1.782989501953125, 1.8817138671875, 1.980438232421875, 2.07916259765625, 2.177886962890625, 2.276611328125, 2.375335693359375, 2.47406005859375, 2.572784423828125, 2.6715087890625, 2.770233154296875, 2.86895751953125, 2.967681884765625, 3.06640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 10.0, 6.0, 5.0, 12.0, 13.0, 12.0, 8.0, 14.0, 26.0, 25.0, 28.0, 26.0, 35.0, 41.0, 31.0, 37.0, 34.0, 41.0, 38.0, 45.0, 48.0, 42.0, 55.0, 37.0, 40.0, 30.0, 27.0, 33.0, 42.0, 27.0, 17.0, 23.0, 20.0, 12.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.078125, -17.542724609375, -17.00732421875, -16.471923828125, -15.9365234375, -15.401123046875, -14.86572265625, -14.330322265625, -13.794921875, -13.259521484375, -12.72412109375, -12.188720703125, -11.6533203125, -11.117919921875, -10.58251953125, -10.047119140625, -9.51171875, -8.976318359375, -8.44091796875, -7.905517578125, -7.3701171875, -6.834716796875, -6.29931640625, -5.763916015625, -5.228515625, -4.693115234375, -4.15771484375, -3.622314453125, -3.0869140625, -2.551513671875, -2.01611328125, -1.480712890625, -0.9453125, -0.409912109375, 0.12548828125, 0.660888671875, 1.1962890625, 1.731689453125, 2.26708984375, 2.802490234375, 3.337890625, 3.873291015625, 4.40869140625, 4.944091796875, 5.4794921875, 6.014892578125, 6.55029296875, 7.085693359375, 7.62109375, 8.156494140625, 8.69189453125, 9.227294921875, 9.7626953125, 10.298095703125, 10.83349609375, 11.368896484375, 11.904296875, 12.439697265625, 12.97509765625, 13.510498046875, 14.0458984375, 14.581298828125, 15.11669921875, 15.652099609375, 16.1875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 8.0, 11.0, 16.0, 30.0, 32.0, 47.0, 57.0, 66.0, 124.0, 179.0, 254.0, 414.0, 557.0, 901.0, 1314.0, 2121.0, 3433.0, 5533.0, 8931.0, 14630.0, 23895.0, 38372.0, 60313.0, 90337.0, 124105.0, 150580.0, 150132.0, 123555.0, 89203.0, 59501.0, 38313.0, 23534.0, 14611.0, 8876.0, 5369.0, 3405.0, 2043.0, 1311.0, 779.0, 527.0, 379.0, 210.0, 168.0, 105.0, 89.0, 51.0, 44.0, 23.0, 22.0, 15.0, 10.0, 8.0, 8.0, 2.0, 1.0, 2.0, 4.0, 2.0], "bins": [-2.41015625, -2.334808349609375, -2.25946044921875, -2.184112548828125, -2.1087646484375, -2.033416748046875, -1.95806884765625, -1.882720947265625, -1.807373046875, -1.732025146484375, -1.65667724609375, -1.581329345703125, -1.5059814453125, -1.430633544921875, -1.35528564453125, -1.279937744140625, -1.20458984375, -1.129241943359375, -1.05389404296875, -0.978546142578125, -0.9031982421875, -0.827850341796875, -0.75250244140625, -0.677154541015625, -0.601806640625, -0.526458740234375, -0.45111083984375, -0.375762939453125, -0.3004150390625, -0.225067138671875, -0.14971923828125, -0.074371337890625, 0.0009765625, 0.076324462890625, 0.15167236328125, 0.227020263671875, 0.3023681640625, 0.377716064453125, 0.45306396484375, 0.528411865234375, 0.603759765625, 0.679107666015625, 0.75445556640625, 0.829803466796875, 0.9051513671875, 0.980499267578125, 1.05584716796875, 1.131195068359375, 1.20654296875, 1.281890869140625, 1.35723876953125, 1.432586669921875, 1.5079345703125, 1.583282470703125, 1.65863037109375, 1.733978271484375, 1.809326171875, 1.884674072265625, 1.96002197265625, 2.035369873046875, 2.1107177734375, 2.186065673828125, 2.26141357421875, 2.336761474609375, 2.412109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 7.0, 8.0, 12.0, 18.0, 14.0, 16.0, 13.0, 18.0, 28.0, 17.0, 36.0, 29.0, 38.0, 33.0, 41.0, 45.0, 36.0, 52.0, 41.0, 45.0, 59.0, 37.0, 36.0, 31.0, 37.0, 31.0, 24.0, 27.0, 23.0, 29.0, 14.0, 15.0, 10.0, 16.0, 12.0, 5.0, 3.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.84375, -10.4979248046875, -10.152099609375, -9.8062744140625, -9.46044921875, -9.1146240234375, -8.768798828125, -8.4229736328125, -8.0771484375, -7.7313232421875, -7.385498046875, -7.0396728515625, -6.69384765625, -6.3480224609375, -6.002197265625, -5.6563720703125, -5.310546875, -4.9647216796875, -4.618896484375, -4.2730712890625, -3.92724609375, -3.5814208984375, -3.235595703125, -2.8897705078125, -2.5439453125, -2.1981201171875, -1.852294921875, -1.5064697265625, -1.16064453125, -0.8148193359375, -0.468994140625, -0.1231689453125, 0.22265625, 0.5684814453125, 0.914306640625, 1.2601318359375, 1.60595703125, 1.9517822265625, 2.297607421875, 2.6434326171875, 2.9892578125, 3.3350830078125, 3.680908203125, 4.0267333984375, 4.37255859375, 4.7183837890625, 5.064208984375, 5.4100341796875, 5.755859375, 6.1016845703125, 6.447509765625, 6.7933349609375, 7.13916015625, 7.4849853515625, 7.830810546875, 8.1766357421875, 8.5224609375, 8.8682861328125, 9.214111328125, 9.5599365234375, 9.90576171875, 10.2515869140625, 10.597412109375, 10.9432373046875, 11.2890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 9.0, 19.0, 26.0, 30.0, 43.0, 43.0, 63.0, 101.0, 145.0, 171.0, 230.0, 336.0, 423.0, 680.0, 965.0, 1389.0, 2223.0, 3721.0, 6620.0, 12513.0, 25323.0, 55300.0, 127207.0, 258063.0, 279652.0, 146828.0, 64525.0, 28779.0, 14069.0, 7337.0, 4282.0, 2510.0, 1607.0, 1014.0, 633.0, 478.0, 330.0, 218.0, 157.0, 136.0, 85.0, 76.0, 49.0, 38.0, 23.0, 22.0, 16.0, 6.0, 8.0, 4.0, 9.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.521484375, -0.5052337646484375, -0.488983154296875, -0.4727325439453125, -0.45648193359375, -0.4402313232421875, -0.423980712890625, -0.4077301025390625, -0.3914794921875, -0.3752288818359375, -0.358978271484375, -0.3427276611328125, -0.32647705078125, -0.3102264404296875, -0.293975830078125, -0.2777252197265625, -0.261474609375, -0.2452239990234375, -0.228973388671875, -0.2127227783203125, -0.19647216796875, -0.1802215576171875, -0.163970947265625, -0.1477203369140625, -0.1314697265625, -0.1152191162109375, -0.098968505859375, -0.0827178955078125, -0.06646728515625, -0.0502166748046875, -0.033966064453125, -0.0177154541015625, -0.00146484375, 0.0147857666015625, 0.031036376953125, 0.0472869873046875, 0.06353759765625, 0.0797882080078125, 0.096038818359375, 0.1122894287109375, 0.1285400390625, 0.1447906494140625, 0.161041259765625, 0.1772918701171875, 0.19354248046875, 0.2097930908203125, 0.226043701171875, 0.2422943115234375, 0.258544921875, 0.2747955322265625, 0.291046142578125, 0.3072967529296875, 0.32354736328125, 0.3397979736328125, 0.356048583984375, 0.3722991943359375, 0.3885498046875, 0.4048004150390625, 0.421051025390625, 0.4373016357421875, 0.45355224609375, 0.4698028564453125, 0.486053466796875, 0.5023040771484375, 0.5185546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 15.0, 22.0, 24.0, 47.0, 75.0, 99.0, 114.0, 123.0, 123.0, 90.0, 75.0, 64.0, 37.0, 25.0, 16.0, 13.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00014781951904296875, -0.00014418642967939377, -0.0001405533403158188, -0.0001369202509522438, -0.00013328716158866882, -0.00012965407222509384, -0.00012602098286151886, -0.00012238789349794388, -0.0001187548041343689, -0.00011512171477079391, -0.00011148862540721893, -0.00010785553604364395, -0.00010422244668006897, -0.00010058935731649399, -9.6956267952919e-05, -9.332317858934402e-05, -8.969008922576904e-05, -8.605699986219406e-05, -8.242391049861908e-05, -7.87908211350441e-05, -7.515773177146912e-05, -7.152464240789413e-05, -6.789155304431915e-05, -6.425846368074417e-05, -6.062537431716919e-05, -5.699228495359421e-05, -5.3359195590019226e-05, -4.9726106226444244e-05, -4.609301686286926e-05, -4.245992749929428e-05, -3.88268381357193e-05, -3.519374877214432e-05, -3.1560659408569336e-05, -2.7927570044994354e-05, -2.4294480681419373e-05, -2.066139131784439e-05, -1.702830195426941e-05, -1.3395212590694427e-05, -9.762123227119446e-06, -6.129033863544464e-06, -2.4959444999694824e-06, 1.1371448636054993e-06, 4.770234227180481e-06, 8.403323590755463e-06, 1.2036412954330444e-05, 1.5669502317905426e-05, 1.9302591681480408e-05, 2.293568104505539e-05, 2.656877040863037e-05, 3.0201859772205353e-05, 3.3834949135780334e-05, 3.7468038499355316e-05, 4.11011278629303e-05, 4.473421722650528e-05, 4.836730659008026e-05, 5.200039595365524e-05, 5.5633485317230225e-05, 5.9266574680805206e-05, 6.289966404438019e-05, 6.653275340795517e-05, 7.016584277153015e-05, 7.379893213510513e-05, 7.743202149868011e-05, 8.10651108622551e-05, 8.469820022583008e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 11.0, 12.0, 22.0, 19.0, 30.0, 40.0, 56.0, 93.0, 111.0, 186.0, 268.0, 394.0, 583.0, 873.0, 1403.0, 2401.0, 4715.0, 9913.0, 22794.0, 56673.0, 147755.0, 318115.0, 280215.0, 119330.0, 46056.0, 18517.0, 8148.0, 4061.0, 2103.0, 1228.0, 736.0, 557.0, 346.0, 217.0, 171.0, 114.0, 96.0, 66.0, 44.0, 29.0, 21.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1843109130859375, -1.145965576171875, -1.1076202392578125, -1.06927490234375, -1.0309295654296875, -0.992584228515625, -0.9542388916015625, -0.9158935546875, -0.8775482177734375, -0.839202880859375, -0.8008575439453125, -0.76251220703125, -0.7241668701171875, -0.685821533203125, -0.6474761962890625, -0.609130859375, -0.5707855224609375, -0.532440185546875, -0.4940948486328125, -0.45574951171875, -0.4174041748046875, -0.379058837890625, -0.3407135009765625, -0.3023681640625, -0.2640228271484375, -0.225677490234375, -0.1873321533203125, -0.14898681640625, -0.1106414794921875, -0.072296142578125, -0.0339508056640625, 0.00439453125, 0.0427398681640625, 0.081085205078125, 0.1194305419921875, 0.15777587890625, 0.1961212158203125, 0.234466552734375, 0.2728118896484375, 0.3111572265625, 0.3495025634765625, 0.387847900390625, 0.4261932373046875, 0.46453857421875, 0.5028839111328125, 0.541229248046875, 0.5795745849609375, 0.617919921875, 0.6562652587890625, 0.694610595703125, 0.7329559326171875, 0.77130126953125, 0.8096466064453125, 0.847991943359375, 0.8863372802734375, 0.9246826171875, 0.9630279541015625, 1.001373291015625, 1.0397186279296875, 1.07806396484375, 1.1164093017578125, 1.154754638671875, 1.1930999755859375, 1.2314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 8.0, 10.0, 15.0, 14.0, 18.0, 36.0, 43.0, 55.0, 73.0, 85.0, 101.0, 109.0, 97.0, 68.0, 56.0, 47.0, 34.0, 22.0, 23.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.31102752685546875, -0.3002777099609375, -0.28952789306640625, -0.278778076171875, -0.26802825927734375, -0.2572784423828125, -0.24652862548828125, -0.23577880859375, -0.22502899169921875, -0.2142791748046875, -0.20352935791015625, -0.192779541015625, -0.18202972412109375, -0.1712799072265625, -0.16053009033203125, -0.1497802734375, -0.13903045654296875, -0.1282806396484375, -0.11753082275390625, -0.106781005859375, -0.09603118896484375, -0.0852813720703125, -0.07453155517578125, -0.06378173828125, -0.05303192138671875, -0.0422821044921875, -0.03153228759765625, -0.020782470703125, -0.01003265380859375, 0.0007171630859375, 0.01146697998046875, 0.022216796875, 0.03296661376953125, 0.0437164306640625, 0.05446624755859375, 0.065216064453125, 0.07596588134765625, 0.0867156982421875, 0.09746551513671875, 0.10821533203125, 0.11896514892578125, 0.1297149658203125, 0.14046478271484375, 0.151214599609375, 0.16196441650390625, 0.1727142333984375, 0.18346405029296875, 0.1942138671875, 0.20496368408203125, 0.2157135009765625, 0.22646331787109375, 0.237213134765625, 0.24796295166015625, 0.2587127685546875, 0.26946258544921875, 0.28021240234375, 0.29096221923828125, 0.3017120361328125, 0.31246185302734375, 0.323211669921875, 0.33396148681640625, 0.3447113037109375, 0.35546112060546875, 0.3662109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 4.0, 7.0, 9.0, 13.0, 13.0, 23.0, 28.0, 31.0, 27.0, 43.0, 35.0, 36.0, 44.0, 52.0, 58.0, 46.0, 40.0, 54.0, 43.0, 43.0, 47.0, 51.0, 36.0, 21.0, 33.0, 20.0, 23.0, 21.0, 27.0, 10.0, 18.0, 8.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.046205520629883, -15.609572410583496, -15.17293930053711, -14.736307144165039, -14.299674034118652, -13.863040924072266, -13.426407814025879, -12.989774703979492, -12.553141593933105, -12.116508483886719, -11.679875373840332, -11.243242263793945, -10.806610107421875, -10.369976997375488, -9.933343887329102, -9.496710777282715, -9.060077667236328, -8.623444557189941, -8.186811447143555, -7.750178813934326, -7.3135457038879395, -6.876913070678711, -6.440279960632324, -6.0036468505859375, -5.567014694213867, -5.1303815841674805, -4.693748950958252, -4.257115840911865, -3.8204827308654785, -3.383849859237671, -2.9472169876098633, -2.5105838775634766, -2.07395076751709, -1.6373177766799927, -1.2006847858428955, -0.7640519142150879, -0.3274189233779907, 0.10921406745910645, 0.5458469390869141, 0.9824800491333008, 1.4191129207611084, 1.8557459115982056, 2.2923789024353027, 2.7290117740631104, 3.165644645690918, 3.6022777557373047, 4.038910865783691, 4.475543975830078, 4.912176609039307, 5.348809719085693, 5.785442352294922, 6.222075462341309, 6.658708572387695, 7.095341682434082, 7.5319743156433105, 7.968607425689697, 8.405240058898926, 8.841873168945312, 9.2785062789917, 9.715139389038086, 10.151771545410156, 10.588404655456543, 11.02503776550293, 11.461670875549316, 11.898303985595703]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 8.0, 10.0, 6.0, 17.0, 10.0, 14.0, 22.0, 14.0, 29.0, 25.0, 24.0, 50.0, 34.0, 28.0, 33.0, 45.0, 32.0, 42.0, 44.0, 42.0, 38.0, 45.0, 32.0, 37.0, 45.0, 33.0, 40.0, 26.0, 25.0, 16.0, 15.0, 28.0, 13.0, 14.0, 7.0, 12.0, 9.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.06932258605957, -16.576322555541992, -16.08332061767578, -15.590320587158203, -15.097320556640625, -14.60431957244873, -14.111318588256836, -13.618318557739258, -13.12531852722168, -12.632317543029785, -12.139317512512207, -11.646316528320312, -11.153316497802734, -10.66031551361084, -10.167314529418945, -9.674314498901367, -9.181313514709473, -8.688312530517578, -8.1953125, -7.7023115158081055, -7.209311485290527, -6.716310501098633, -6.2233099937438965, -5.73030948638916, -5.237308979034424, -4.7443084716796875, -4.251307964324951, -3.7583072185516357, -3.2653067111968994, -2.772306203842163, -2.2793054580688477, -1.7863049507141113, -1.293304443359375, -0.8003038763999939, -0.3073033094406128, 0.18569731712341309, 0.6786978244781494, 1.1716983318328857, 1.6646990776062012, 2.1576995849609375, 2.650700092315674, 3.14370059967041, 3.6367011070251465, 4.129701614379883, 4.622702598571777, 5.1157026290893555, 5.60870361328125, 6.101704120635986, 6.594704627990723, 7.087705135345459, 7.580705642700195, 8.07370662689209, 8.566706657409668, 9.059707641601562, 9.55270767211914, 10.045708656311035, 10.53870964050293, 11.031710624694824, 11.524710655212402, 12.017711639404297, 12.510711669921875, 13.00371265411377, 13.496713638305664, 13.989713668823242, 14.48271369934082]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 9.0, 29.0, 25.0, 38.0, 76.0, 120.0, 193.0, 369.0, 543.0, 968.0, 1515.0, 2446.0, 4088.0, 6318.0, 9849.0, 15018.0, 21761.0, 31579.0, 43762.0, 57790.0, 72770.0, 87434.0, 97207.0, 102918.0, 100266.0, 91741.0, 78130.0, 63228.0, 49130.0, 35730.0, 25133.0, 17024.0, 11355.0, 7354.0, 4787.0, 3096.0, 1901.0, 1163.0, 655.0, 418.0, 261.0, 152.0, 90.0, 52.0, 22.0, 18.0, 12.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3828125, -8.109619140625, -7.83642578125, -7.563232421875, -7.2900390625, -7.016845703125, -6.74365234375, -6.470458984375, -6.197265625, -5.924072265625, -5.65087890625, -5.377685546875, -5.1044921875, -4.831298828125, -4.55810546875, -4.284912109375, -4.01171875, -3.738525390625, -3.46533203125, -3.192138671875, -2.9189453125, -2.645751953125, -2.37255859375, -2.099365234375, -1.826171875, -1.552978515625, -1.27978515625, -1.006591796875, -0.7333984375, -0.460205078125, -0.18701171875, 0.086181640625, 0.359375, 0.632568359375, 0.90576171875, 1.178955078125, 1.4521484375, 1.725341796875, 1.99853515625, 2.271728515625, 2.544921875, 2.818115234375, 3.09130859375, 3.364501953125, 3.6376953125, 3.910888671875, 4.18408203125, 4.457275390625, 4.73046875, 5.003662109375, 5.27685546875, 5.550048828125, 5.8232421875, 6.096435546875, 6.36962890625, 6.642822265625, 6.916015625, 7.189208984375, 7.46240234375, 7.735595703125, 8.0087890625, 8.281982421875, 8.55517578125, 8.828369140625, 9.1015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 7.0, 12.0, 16.0, 18.0, 18.0, 23.0, 14.0, 23.0, 21.0, 26.0, 37.0, 33.0, 35.0, 25.0, 32.0, 40.0, 36.0, 43.0, 44.0, 36.0, 48.0, 37.0, 34.0, 32.0, 29.0, 31.0, 32.0, 23.0, 26.0, 19.0, 23.0, 20.0, 14.0, 14.0, 13.0, 10.0, 7.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.25, -15.78369140625, -15.3173828125, -14.85107421875, -14.384765625, -13.91845703125, -13.4521484375, -12.98583984375, -12.51953125, -12.05322265625, -11.5869140625, -11.12060546875, -10.654296875, -10.18798828125, -9.7216796875, -9.25537109375, -8.7890625, -8.32275390625, -7.8564453125, -7.39013671875, -6.923828125, -6.45751953125, -5.9912109375, -5.52490234375, -5.05859375, -4.59228515625, -4.1259765625, -3.65966796875, -3.193359375, -2.72705078125, -2.2607421875, -1.79443359375, -1.328125, -0.86181640625, -0.3955078125, 0.07080078125, 0.537109375, 1.00341796875, 1.4697265625, 1.93603515625, 2.40234375, 2.86865234375, 3.3349609375, 3.80126953125, 4.267578125, 4.73388671875, 5.2001953125, 5.66650390625, 6.1328125, 6.59912109375, 7.0654296875, 7.53173828125, 7.998046875, 8.46435546875, 8.9306640625, 9.39697265625, 9.86328125, 10.32958984375, 10.7958984375, 11.26220703125, 11.728515625, 12.19482421875, 12.6611328125, 13.12744140625, 13.59375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 9.0, 17.0, 19.0, 37.0, 49.0, 93.0, 146.0, 191.0, 342.0, 533.0, 865.0, 1312.0, 2120.0, 3281.0, 4903.0, 7664.0, 11376.0, 16651.0, 23854.0, 33380.0, 44608.0, 58309.0, 72653.0, 85343.0, 94591.0, 98220.0, 96130.0, 88195.0, 76560.0, 62063.0, 48195.0, 36100.0, 26079.0, 18168.0, 12606.0, 8435.0, 5495.0, 3622.0, 2276.0, 1501.0, 918.0, 602.0, 384.0, 247.0, 139.0, 100.0, 69.0, 35.0, 28.0, 16.0, 18.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.61328125, -7.34735107421875, -7.0814208984375, -6.81549072265625, -6.549560546875, -6.28363037109375, -6.0177001953125, -5.75177001953125, -5.48583984375, -5.21990966796875, -4.9539794921875, -4.68804931640625, -4.422119140625, -4.15618896484375, -3.8902587890625, -3.62432861328125, -3.3583984375, -3.09246826171875, -2.8265380859375, -2.56060791015625, -2.294677734375, -2.02874755859375, -1.7628173828125, -1.49688720703125, -1.23095703125, -0.96502685546875, -0.6990966796875, -0.43316650390625, -0.167236328125, 0.09869384765625, 0.3646240234375, 0.63055419921875, 0.896484375, 1.16241455078125, 1.4283447265625, 1.69427490234375, 1.960205078125, 2.22613525390625, 2.4920654296875, 2.75799560546875, 3.02392578125, 3.28985595703125, 3.5557861328125, 3.82171630859375, 4.087646484375, 4.35357666015625, 4.6195068359375, 4.88543701171875, 5.1513671875, 5.41729736328125, 5.6832275390625, 5.94915771484375, 6.215087890625, 6.48101806640625, 6.7469482421875, 7.01287841796875, 7.27880859375, 7.54473876953125, 7.8106689453125, 8.07659912109375, 8.342529296875, 8.60845947265625, 8.8743896484375, 9.14031982421875, 9.40625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 6.0, 8.0, 7.0, 7.0, 10.0, 15.0, 18.0, 22.0, 22.0, 26.0, 33.0, 33.0, 35.0, 42.0, 38.0, 36.0, 44.0, 43.0, 38.0, 51.0, 40.0, 40.0, 39.0, 34.0, 33.0, 25.0, 32.0, 26.0, 26.0, 29.0, 19.0, 25.0, 14.0, 10.0, 14.0, 11.0, 7.0, 9.0, 8.0, 7.0, 2.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1484375, -9.8438720703125, -9.539306640625, -9.2347412109375, -8.93017578125, -8.6256103515625, -8.321044921875, -8.0164794921875, -7.7119140625, -7.4073486328125, -7.102783203125, -6.7982177734375, -6.49365234375, -6.1890869140625, -5.884521484375, -5.5799560546875, -5.275390625, -4.9708251953125, -4.666259765625, -4.3616943359375, -4.05712890625, -3.7525634765625, -3.447998046875, -3.1434326171875, -2.8388671875, -2.5343017578125, -2.229736328125, -1.9251708984375, -1.62060546875, -1.3160400390625, -1.011474609375, -0.7069091796875, -0.40234375, -0.0977783203125, 0.206787109375, 0.5113525390625, 0.81591796875, 1.1204833984375, 1.425048828125, 1.7296142578125, 2.0341796875, 2.3387451171875, 2.643310546875, 2.9478759765625, 3.25244140625, 3.5570068359375, 3.861572265625, 4.1661376953125, 4.470703125, 4.7752685546875, 5.079833984375, 5.3843994140625, 5.68896484375, 5.9935302734375, 6.298095703125, 6.6026611328125, 6.9072265625, 7.2117919921875, 7.516357421875, 7.8209228515625, 8.12548828125, 8.4300537109375, 8.734619140625, 9.0391845703125, 9.34375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 10.0, 12.0, 17.0, 21.0, 39.0, 53.0, 81.0, 94.0, 136.0, 240.0, 330.0, 554.0, 814.0, 1171.0, 1721.0, 2707.0, 4142.0, 6397.0, 9902.0, 15016.0, 22667.0, 33365.0, 47435.0, 64978.0, 84821.0, 101114.0, 113110.0, 113838.0, 104824.0, 88963.0, 69706.0, 51440.0, 36072.0, 24876.0, 16535.0, 10753.0, 7040.0, 4685.0, 2908.0, 1969.0, 1314.0, 884.0, 577.0, 407.0, 278.0, 167.0, 129.0, 94.0, 60.0, 31.0, 27.0, 11.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.544921875, -3.430999755859375, -3.31707763671875, -3.203155517578125, -3.0892333984375, -2.975311279296875, -2.86138916015625, -2.747467041015625, -2.633544921875, -2.519622802734375, -2.40570068359375, -2.291778564453125, -2.1778564453125, -2.063934326171875, -1.95001220703125, -1.836090087890625, -1.72216796875, -1.608245849609375, -1.49432373046875, -1.380401611328125, -1.2664794921875, -1.152557373046875, -1.03863525390625, -0.924713134765625, -0.810791015625, -0.696868896484375, -0.58294677734375, -0.469024658203125, -0.3551025390625, -0.241180419921875, -0.12725830078125, -0.013336181640625, 0.1005859375, 0.214508056640625, 0.32843017578125, 0.442352294921875, 0.5562744140625, 0.670196533203125, 0.78411865234375, 0.898040771484375, 1.011962890625, 1.125885009765625, 1.23980712890625, 1.353729248046875, 1.4676513671875, 1.581573486328125, 1.69549560546875, 1.809417724609375, 1.92333984375, 2.037261962890625, 2.15118408203125, 2.265106201171875, 2.3790283203125, 2.492950439453125, 2.60687255859375, 2.720794677734375, 2.834716796875, 2.948638916015625, 3.06256103515625, 3.176483154296875, 3.2904052734375, 3.404327392578125, 3.51824951171875, 3.632171630859375, 3.74609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 3.0, 12.0, 8.0, 13.0, 14.0, 19.0, 16.0, 33.0, 33.0, 29.0, 29.0, 40.0, 37.0, 47.0, 42.0, 41.0, 41.0, 60.0, 47.0, 47.0, 59.0, 47.0, 41.0, 38.0, 35.0, 27.0, 27.0, 14.0, 18.0, 14.0, 12.0, 5.0, 10.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004107952117919922, -0.0003975033760070801, -0.00038421154022216797, -0.00037091970443725586, -0.00035762786865234375, -0.00034433603286743164, -0.00033104419708251953, -0.0003177523612976074, -0.0003044605255126953, -0.0002911686897277832, -0.0002778768539428711, -0.000264585018157959, -0.0002512931823730469, -0.00023800134658813477, -0.00022470951080322266, -0.00021141767501831055, -0.00019812583923339844, -0.00018483400344848633, -0.00017154216766357422, -0.0001582503318786621, -0.00014495849609375, -0.0001316666603088379, -0.00011837482452392578, -0.00010508298873901367, -9.179115295410156e-05, -7.849931716918945e-05, -6.520748138427734e-05, -5.1915645599365234e-05, -3.8623809814453125e-05, -2.5331974029541016e-05, -1.2040138244628906e-05, 1.2516975402832031e-06, 1.4543533325195312e-05, 2.7835369110107422e-05, 4.112720489501953e-05, 5.441904067993164e-05, 6.771087646484375e-05, 8.100271224975586e-05, 9.429454803466797e-05, 0.00010758638381958008, 0.00012087821960449219, 0.0001341700553894043, 0.0001474618911743164, 0.00016075372695922852, 0.00017404556274414062, 0.00018733739852905273, 0.00020062923431396484, 0.00021392107009887695, 0.00022721290588378906, 0.00024050474166870117, 0.0002537965774536133, 0.0002670884132385254, 0.0002803802490234375, 0.0002936720848083496, 0.0003069639205932617, 0.00032025575637817383, 0.00033354759216308594, 0.00034683942794799805, 0.00036013126373291016, 0.00037342309951782227, 0.0003867149353027344, 0.0004000067710876465, 0.0004132986068725586, 0.0004265904426574707, 0.0004398822784423828]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 14.0, 16.0, 20.0, 36.0, 40.0, 65.0, 123.0, 181.0, 270.0, 450.0, 691.0, 1192.0, 1962.0, 3275.0, 5631.0, 9747.0, 16952.0, 28700.0, 47109.0, 73240.0, 104569.0, 134081.0, 148176.0, 139843.0, 114055.0, 82659.0, 54179.0, 33605.0, 19805.0, 11565.0, 6562.0, 3825.0, 2283.0, 1356.0, 820.0, 534.0, 339.0, 192.0, 154.0, 70.0, 55.0, 42.0, 22.0, 17.0, 16.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.67816162109375, -4.5203857421875, -4.36260986328125, -4.204833984375, -4.04705810546875, -3.8892822265625, -3.73150634765625, -3.57373046875, -3.41595458984375, -3.2581787109375, -3.10040283203125, -2.942626953125, -2.78485107421875, -2.6270751953125, -2.46929931640625, -2.3115234375, -2.15374755859375, -1.9959716796875, -1.83819580078125, -1.680419921875, -1.52264404296875, -1.3648681640625, -1.20709228515625, -1.04931640625, -0.89154052734375, -0.7337646484375, -0.57598876953125, -0.418212890625, -0.26043701171875, -0.1026611328125, 0.05511474609375, 0.212890625, 0.37066650390625, 0.5284423828125, 0.68621826171875, 0.843994140625, 1.00177001953125, 1.1595458984375, 1.31732177734375, 1.47509765625, 1.63287353515625, 1.7906494140625, 1.94842529296875, 2.106201171875, 2.26397705078125, 2.4217529296875, 2.57952880859375, 2.7373046875, 2.89508056640625, 3.0528564453125, 3.21063232421875, 3.368408203125, 3.52618408203125, 3.6839599609375, 3.84173583984375, 3.99951171875, 4.15728759765625, 4.3150634765625, 4.47283935546875, 4.630615234375, 4.78839111328125, 4.9461669921875, 5.10394287109375, 5.26171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 15.0, 11.0, 24.0, 22.0, 26.0, 23.0, 28.0, 42.0, 59.0, 46.0, 68.0, 55.0, 69.0, 52.0, 44.0, 61.0, 69.0, 44.0, 38.0, 28.0, 27.0, 24.0, 27.0, 28.0, 18.0, 8.0, 5.0, 7.0, 4.0, 6.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8988189697265625, -1.835723876953125, -1.7726287841796875, -1.70953369140625, -1.6464385986328125, -1.583343505859375, -1.5202484130859375, -1.4571533203125, -1.3940582275390625, -1.330963134765625, -1.2678680419921875, -1.20477294921875, -1.1416778564453125, -1.078582763671875, -1.0154876708984375, -0.952392578125, -0.8892974853515625, -0.826202392578125, -0.7631072998046875, -0.70001220703125, -0.6369171142578125, -0.573822021484375, -0.5107269287109375, -0.4476318359375, -0.3845367431640625, -0.321441650390625, -0.2583465576171875, -0.19525146484375, -0.1321563720703125, -0.069061279296875, -0.0059661865234375, 0.05712890625, 0.1202239990234375, 0.183319091796875, 0.2464141845703125, 0.30950927734375, 0.3726043701171875, 0.435699462890625, 0.4987945556640625, 0.5618896484375, 0.6249847412109375, 0.688079833984375, 0.7511749267578125, 0.81427001953125, 0.8773651123046875, 0.940460205078125, 1.0035552978515625, 1.066650390625, 1.1297454833984375, 1.192840576171875, 1.2559356689453125, 1.31903076171875, 1.3821258544921875, 1.445220947265625, 1.5083160400390625, 1.5714111328125, 1.6345062255859375, 1.697601318359375, 1.7606964111328125, 1.82379150390625, 1.8868865966796875, 1.949981689453125, 2.0130767822265625, 2.076171875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 15.0, 13.0, 17.0, 16.0, 31.0, 22.0, 28.0, 22.0, 37.0, 32.0, 33.0, 39.0, 57.0, 45.0, 42.0, 47.0, 34.0, 41.0, 43.0, 43.0, 43.0, 21.0, 37.0, 22.0, 34.0, 22.0, 27.0, 24.0, 18.0, 9.0, 11.0, 10.0, 11.0, 11.0, 4.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.94345760345459, -12.551535606384277, -12.159614562988281, -11.767692565917969, -11.375770568847656, -10.98384952545166, -10.591927528381348, -10.200006484985352, -9.808084487915039, -9.416162490844727, -9.02424144744873, -8.632319450378418, -8.240398406982422, -7.848476409912109, -7.456554412841797, -7.064632892608643, -6.672711372375488, -6.280789852142334, -5.88886833190918, -5.496946334838867, -5.105024814605713, -4.713103294372559, -4.321181297302246, -3.929259777069092, -3.5373382568359375, -3.145416736602783, -2.75349497795105, -2.3615732192993164, -1.969651699066162, -1.5777300596237183, -1.1858084201812744, -0.793886661529541, -0.4019641876220703, -0.010042548179626465, 0.3818790912628174, 0.7738007307052612, 1.165722370147705, 1.557644009590149, 1.9495656490325928, 2.341487407684326, 2.7334089279174805, 3.1253304481506348, 3.517252206802368, 3.9091739654541016, 4.301095485687256, 4.69301700592041, 5.084939002990723, 5.476860523223877, 5.868782043457031, 6.2607035636901855, 6.65262508392334, 7.044547080993652, 7.436468601226807, 7.828390121459961, 8.220312118530273, 8.612234115600586, 9.004155158996582, 9.396077156066895, 9.78799819946289, 10.179920196533203, 10.571842193603516, 10.963763236999512, 11.355685234069824, 11.74760627746582, 12.139528274536133]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 10.0, 9.0, 9.0, 7.0, 4.0, 12.0, 9.0, 13.0, 17.0, 21.0, 21.0, 21.0, 33.0, 34.0, 36.0, 49.0, 39.0, 39.0, 45.0, 35.0, 49.0, 55.0, 45.0, 28.0, 51.0, 43.0, 32.0, 32.0, 30.0, 25.0, 25.0, 17.0, 17.0, 23.0, 16.0, 14.0, 15.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.820951461791992, -18.276235580444336, -17.731521606445312, -17.186805725097656, -16.64208984375, -16.097373962402344, -15.552659034729004, -15.007944107055664, -14.463228225708008, -13.918512344360352, -13.373797416687012, -12.829082489013672, -12.284366607666016, -11.73965072631836, -11.19493579864502, -10.65022087097168, -10.105504989624023, -9.560789108276367, -9.016074180603027, -8.471359252929688, -7.926643371582031, -7.381927967071533, -6.837212562561035, -6.292497158050537, -5.747781753540039, -5.203066349029541, -4.658350944519043, -4.113635540008545, -3.568920135498047, -3.024204730987549, -2.479489326477051, -1.9347739219665527, -1.3900585174560547, -0.8453431129455566, -0.3006277084350586, 0.24408769607543945, 0.7888031005859375, 1.3335185050964355, 1.8782339096069336, 2.4229493141174316, 2.9676647186279297, 3.5123801231384277, 4.057095527648926, 4.601810932159424, 5.146526336669922, 5.69124174118042, 6.235957145690918, 6.780672550201416, 7.325387954711914, 7.870103359222412, 8.41481876373291, 8.95953369140625, 9.504249572753906, 10.048965454101562, 10.593680381774902, 11.138395309448242, 11.683111190795898, 12.227827072143555, 12.772541999816895, 13.317256927490234, 13.86197280883789, 14.406688690185547, 14.951403617858887, 15.496118545532227, 16.040834426879883]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 11.0, 19.0, 32.0, 45.0, 61.0, 130.0, 171.0, 324.0, 520.0, 894.0, 1417.0, 2397.0, 3926.0, 6386.0, 10318.0, 16344.0, 25979.0, 41028.0, 62543.0, 93834.0, 137140.0, 192507.0, 255326.0, 324834.0, 384098.0, 424541.0, 432459.0, 408027.0, 356862.0, 292858.0, 224363.0, 164197.0, 114644.0, 77580.0, 51566.0, 32807.0, 20683.0, 13035.0, 8070.0, 4955.0, 2980.0, 1753.0, 1056.0, 626.0, 376.0, 227.0, 134.0, 75.0, 52.0, 31.0, 17.0, 12.0, 4.0, 4.0, 6.0, 1.0, 2.0], "bins": [-10.125, -9.8204345703125, -9.515869140625, -9.2113037109375, -8.90673828125, -8.6021728515625, -8.297607421875, -7.9930419921875, -7.6884765625, -7.3839111328125, -7.079345703125, -6.7747802734375, -6.47021484375, -6.1656494140625, -5.861083984375, -5.5565185546875, -5.251953125, -4.9473876953125, -4.642822265625, -4.3382568359375, -4.03369140625, -3.7291259765625, -3.424560546875, -3.1199951171875, -2.8154296875, -2.5108642578125, -2.206298828125, -1.9017333984375, -1.59716796875, -1.2926025390625, -0.988037109375, -0.6834716796875, -0.37890625, -0.0743408203125, 0.230224609375, 0.5347900390625, 0.83935546875, 1.1439208984375, 1.448486328125, 1.7530517578125, 2.0576171875, 2.3621826171875, 2.666748046875, 2.9713134765625, 3.27587890625, 3.5804443359375, 3.885009765625, 4.1895751953125, 4.494140625, 4.7987060546875, 5.103271484375, 5.4078369140625, 5.71240234375, 6.0169677734375, 6.321533203125, 6.6260986328125, 6.9306640625, 7.2352294921875, 7.539794921875, 7.8443603515625, 8.14892578125, 8.4534912109375, 8.758056640625, 9.0626220703125, 9.3671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 8.0, 9.0, 8.0, 10.0, 12.0, 17.0, 19.0, 26.0, 23.0, 27.0, 26.0, 32.0, 49.0, 45.0, 54.0, 40.0, 45.0, 51.0, 43.0, 50.0, 50.0, 40.0, 40.0, 34.0, 34.0, 28.0, 31.0, 30.0, 21.0, 21.0, 16.0, 17.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.578125, -15.11083984375, -14.6435546875, -14.17626953125, -13.708984375, -13.24169921875, -12.7744140625, -12.30712890625, -11.83984375, -11.37255859375, -10.9052734375, -10.43798828125, -9.970703125, -9.50341796875, -9.0361328125, -8.56884765625, -8.1015625, -7.63427734375, -7.1669921875, -6.69970703125, -6.232421875, -5.76513671875, -5.2978515625, -4.83056640625, -4.36328125, -3.89599609375, -3.4287109375, -2.96142578125, -2.494140625, -2.02685546875, -1.5595703125, -1.09228515625, -0.625, -0.15771484375, 0.3095703125, 0.77685546875, 1.244140625, 1.71142578125, 2.1787109375, 2.64599609375, 3.11328125, 3.58056640625, 4.0478515625, 4.51513671875, 4.982421875, 5.44970703125, 5.9169921875, 6.38427734375, 6.8515625, 7.31884765625, 7.7861328125, 8.25341796875, 8.720703125, 9.18798828125, 9.6552734375, 10.12255859375, 10.58984375, 11.05712890625, 11.5244140625, 11.99169921875, 12.458984375, 12.92626953125, 13.3935546875, 13.86083984375, 14.328125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 4.0, 18.0, 24.0, 48.0, 79.0, 166.0, 289.0, 465.0, 777.0, 1270.0, 2122.0, 3587.0, 5674.0, 9287.0, 14767.0, 22793.0, 35934.0, 52589.0, 76838.0, 108340.0, 147255.0, 191952.0, 242958.0, 290867.0, 331684.0, 362130.0, 371615.0, 362033.0, 334956.0, 292669.0, 245186.0, 195623.0, 148963.0, 109437.0, 78327.0, 54313.0, 35631.0, 23683.0, 15303.0, 9545.0, 5996.0, 3715.0, 2204.0, 1305.0, 766.0, 451.0, 298.0, 163.0, 73.0, 53.0, 29.0, 16.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0], "bins": [-9.1875, -8.905029296875, -8.62255859375, -8.340087890625, -8.0576171875, -7.775146484375, -7.49267578125, -7.210205078125, -6.927734375, -6.645263671875, -6.36279296875, -6.080322265625, -5.7978515625, -5.515380859375, -5.23291015625, -4.950439453125, -4.66796875, -4.385498046875, -4.10302734375, -3.820556640625, -3.5380859375, -3.255615234375, -2.97314453125, -2.690673828125, -2.408203125, -2.125732421875, -1.84326171875, -1.560791015625, -1.2783203125, -0.995849609375, -0.71337890625, -0.430908203125, -0.1484375, 0.134033203125, 0.41650390625, 0.698974609375, 0.9814453125, 1.263916015625, 1.54638671875, 1.828857421875, 2.111328125, 2.393798828125, 2.67626953125, 2.958740234375, 3.2412109375, 3.523681640625, 3.80615234375, 4.088623046875, 4.37109375, 4.653564453125, 4.93603515625, 5.218505859375, 5.5009765625, 5.783447265625, 6.06591796875, 6.348388671875, 6.630859375, 6.913330078125, 7.19580078125, 7.478271484375, 7.7607421875, 8.043212890625, 8.32568359375, 8.608154296875, 8.890625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 5.0, 20.0, 42.0, 33.0, 40.0, 45.0, 60.0, 75.0, 91.0, 103.0, 118.0, 131.0, 144.0, 159.0, 167.0, 196.0, 199.0, 203.0, 198.0, 196.0, 185.0, 213.0, 181.0, 189.0, 170.0, 161.0, 121.0, 121.0, 89.0, 75.0, 68.0, 56.0, 55.0, 30.0, 29.0, 19.0, 12.0, 21.0, 13.0, 8.0, 3.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33203125, -6.13909912109375, -5.9461669921875, -5.75323486328125, -5.560302734375, -5.36737060546875, -5.1744384765625, -4.98150634765625, -4.78857421875, -4.59564208984375, -4.4027099609375, -4.20977783203125, -4.016845703125, -3.82391357421875, -3.6309814453125, -3.43804931640625, -3.2451171875, -3.05218505859375, -2.8592529296875, -2.66632080078125, -2.473388671875, -2.28045654296875, -2.0875244140625, -1.89459228515625, -1.70166015625, -1.50872802734375, -1.3157958984375, -1.12286376953125, -0.929931640625, -0.73699951171875, -0.5440673828125, -0.35113525390625, -0.158203125, 0.03472900390625, 0.2276611328125, 0.42059326171875, 0.613525390625, 0.80645751953125, 0.9993896484375, 1.19232177734375, 1.38525390625, 1.57818603515625, 1.7711181640625, 1.96405029296875, 2.156982421875, 2.34991455078125, 2.5428466796875, 2.73577880859375, 2.9287109375, 3.12164306640625, 3.3145751953125, 3.50750732421875, 3.700439453125, 3.89337158203125, 4.0863037109375, 4.27923583984375, 4.47216796875, 4.66510009765625, 4.8580322265625, 5.05096435546875, 5.243896484375, 5.43682861328125, 5.6297607421875, 5.82269287109375, 6.015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 11.0, 20.0, 17.0, 27.0, 22.0, 32.0, 36.0, 31.0, 40.0, 47.0, 49.0, 58.0, 61.0, 53.0, 59.0, 69.0, 44.0, 50.0, 49.0, 34.0, 31.0, 23.0, 30.0, 23.0, 17.0, 17.0, 9.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.849138259887695, -17.3325138092041, -16.815887451171875, -16.29926300048828, -15.782638549804688, -15.266013145446777, -14.749387741088867, -14.232763290405273, -13.71613883972168, -13.19951343536377, -12.682888984680176, -12.166263580322266, -11.649639129638672, -11.133013725280762, -10.616388320922852, -10.099763870239258, -9.583138465881348, -9.066513061523438, -8.549888610839844, -8.033263206481934, -7.51663875579834, -7.00001335144043, -6.483388423919678, -5.966763496398926, -5.450138568878174, -4.933513641357422, -4.41688871383667, -3.900263547897339, -3.383638620376587, -2.867013692855835, -2.350388526916504, -1.833763599395752, -1.3171396255493164, -0.8005146384239197, -0.28388965129852295, 0.23273539543151855, 0.7493603229522705, 1.2659852504730225, 1.7826104164123535, 2.2992353439331055, 2.8158602714538574, 3.3324851989746094, 3.8491101264953613, 4.365735054016113, 4.882360458374023, 5.398984909057617, 5.915610313415527, 6.432235240936279, 6.948860168457031, 7.465485095977783, 7.982110023498535, 8.498735427856445, 9.015359878540039, 9.53198528289795, 10.04861068725586, 10.565235137939453, 11.081859588623047, 11.598484992980957, 12.11510944366455, 12.631734848022461, 13.148359298706055, 13.664984703063965, 14.181610107421875, 14.698234558105469, 15.214859962463379]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 4.0, 13.0, 13.0, 9.0, 8.0, 14.0, 13.0, 16.0, 22.0, 26.0, 23.0, 23.0, 38.0, 37.0, 38.0, 28.0, 41.0, 51.0, 36.0, 49.0, 52.0, 42.0, 35.0, 34.0, 43.0, 41.0, 41.0, 32.0, 26.0, 22.0, 25.0, 21.0, 17.0, 11.0, 14.0, 7.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.520597457885742, -17.01219940185547, -16.503801345825195, -15.995404243469238, -15.487007141113281, -14.978609085083008, -14.470211029052734, -13.961813926696777, -13.45341682434082, -12.945018768310547, -12.43662166595459, -11.928223609924316, -11.41982650756836, -10.911428451538086, -10.403030395507812, -9.894633293151855, -9.386235237121582, -8.877837181091309, -8.369440078735352, -7.861042022705078, -7.352644920349121, -6.844246864318848, -6.335849285125732, -5.827451705932617, -5.319054126739502, -4.810656547546387, -4.3022589683532715, -3.793861150741577, -3.285463571548462, -2.7770659923553467, -2.2686681747436523, -1.760270595550537, -1.2518720626831055, -0.7434744238853455, -0.23507678508758545, 0.27332091331481934, 0.7817184925079346, 1.2901160717010498, 1.7985138893127441, 2.3069114685058594, 2.8153090476989746, 3.32370662689209, 3.832104206085205, 4.34050178527832, 4.848899841308594, 5.357296943664551, 5.865694999694824, 6.3740925788879395, 6.882490158081055, 7.39088773727417, 7.899285316467285, 8.407683372497559, 8.916080474853516, 9.424478530883789, 9.932876586914062, 10.44127368927002, 10.949670791625977, 11.45806884765625, 11.966465950012207, 12.47486400604248, 12.983261108398438, 13.491659164428711, 14.000057220458984, 14.508454322814941, 15.016852378845215]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 11.0, 12.0, 16.0, 21.0, 34.0, 62.0, 78.0, 101.0, 181.0, 266.0, 473.0, 623.0, 987.0, 1500.0, 2429.0, 3863.0, 6007.0, 9354.0, 14721.0, 23120.0, 35171.0, 52889.0, 77819.0, 105966.0, 131225.0, 140111.0, 127246.0, 99663.0, 72788.0, 49868.0, 32812.0, 21427.0, 13697.0, 8657.0, 5470.0, 3551.0, 2293.0, 1410.0, 886.0, 610.0, 392.0, 258.0, 152.0, 103.0, 84.0, 47.0, 35.0, 26.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 1.0], "bins": [-2.466796875, -2.395111083984375, -2.32342529296875, -2.251739501953125, -2.1800537109375, -2.108367919921875, -2.03668212890625, -1.964996337890625, -1.893310546875, -1.821624755859375, -1.74993896484375, -1.678253173828125, -1.6065673828125, -1.534881591796875, -1.46319580078125, -1.391510009765625, -1.31982421875, -1.248138427734375, -1.17645263671875, -1.104766845703125, -1.0330810546875, -0.961395263671875, -0.88970947265625, -0.818023681640625, -0.746337890625, -0.674652099609375, -0.60296630859375, -0.531280517578125, -0.4595947265625, -0.387908935546875, -0.31622314453125, -0.244537353515625, -0.1728515625, -0.101165771484375, -0.02947998046875, 0.042205810546875, 0.1138916015625, 0.185577392578125, 0.25726318359375, 0.328948974609375, 0.400634765625, 0.472320556640625, 0.54400634765625, 0.615692138671875, 0.6873779296875, 0.759063720703125, 0.83074951171875, 0.902435302734375, 0.97412109375, 1.045806884765625, 1.11749267578125, 1.189178466796875, 1.2608642578125, 1.332550048828125, 1.40423583984375, 1.475921630859375, 1.547607421875, 1.619293212890625, 1.69097900390625, 1.762664794921875, 1.8343505859375, 1.906036376953125, 1.97772216796875, 2.049407958984375, 2.12109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 24.0, 13.0, 11.0, 11.0, 23.0, 19.0, 12.0, 21.0, 32.0, 38.0, 28.0, 29.0, 46.0, 39.0, 45.0, 41.0, 50.0, 38.0, 42.0, 53.0, 33.0, 47.0, 41.0, 36.0, 23.0, 30.0, 17.0, 17.0, 19.0, 15.0, 9.0, 13.0, 3.0, 8.0, 15.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.921875, -17.4102783203125, -16.898681640625, -16.3870849609375, -15.87548828125, -15.3638916015625, -14.852294921875, -14.3406982421875, -13.8291015625, -13.3175048828125, -12.805908203125, -12.2943115234375, -11.78271484375, -11.2711181640625, -10.759521484375, -10.2479248046875, -9.736328125, -9.2247314453125, -8.713134765625, -8.2015380859375, -7.68994140625, -7.1783447265625, -6.666748046875, -6.1551513671875, -5.6435546875, -5.1319580078125, -4.620361328125, -4.1087646484375, -3.59716796875, -3.0855712890625, -2.573974609375, -2.0623779296875, -1.55078125, -1.0391845703125, -0.527587890625, -0.0159912109375, 0.49560546875, 1.0072021484375, 1.518798828125, 2.0303955078125, 2.5419921875, 3.0535888671875, 3.565185546875, 4.0767822265625, 4.58837890625, 5.0999755859375, 5.611572265625, 6.1231689453125, 6.634765625, 7.1463623046875, 7.657958984375, 8.1695556640625, 8.68115234375, 9.1927490234375, 9.704345703125, 10.2159423828125, 10.7275390625, 11.2391357421875, 11.750732421875, 12.2623291015625, 12.77392578125, 13.2855224609375, 13.797119140625, 14.3087158203125, 14.8203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 12.0, 22.0, 36.0, 38.0, 65.0, 99.0, 128.0, 208.0, 309.0, 548.0, 736.0, 1163.0, 1884.0, 3067.0, 5113.0, 8172.0, 13570.0, 22052.0, 36114.0, 55542.0, 83828.0, 115551.0, 143144.0, 148353.0, 129375.0, 97445.0, 67563.0, 43583.0, 27439.0, 16783.0, 10426.0, 6132.0, 3801.0, 2287.0, 1452.0, 880.0, 565.0, 365.0, 249.0, 149.0, 102.0, 80.0, 41.0, 31.0, 19.0, 14.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.26953125, -2.19683837890625, -2.1241455078125, -2.05145263671875, -1.978759765625, -1.90606689453125, -1.8333740234375, -1.76068115234375, -1.68798828125, -1.61529541015625, -1.5426025390625, -1.46990966796875, -1.397216796875, -1.32452392578125, -1.2518310546875, -1.17913818359375, -1.1064453125, -1.03375244140625, -0.9610595703125, -0.88836669921875, -0.815673828125, -0.74298095703125, -0.6702880859375, -0.59759521484375, -0.52490234375, -0.45220947265625, -0.3795166015625, -0.30682373046875, -0.234130859375, -0.16143798828125, -0.0887451171875, -0.01605224609375, 0.056640625, 0.12933349609375, 0.2020263671875, 0.27471923828125, 0.347412109375, 0.42010498046875, 0.4927978515625, 0.56549072265625, 0.63818359375, 0.71087646484375, 0.7835693359375, 0.85626220703125, 0.928955078125, 1.00164794921875, 1.0743408203125, 1.14703369140625, 1.2197265625, 1.29241943359375, 1.3651123046875, 1.43780517578125, 1.510498046875, 1.58319091796875, 1.6558837890625, 1.72857666015625, 1.80126953125, 1.87396240234375, 1.9466552734375, 2.01934814453125, 2.092041015625, 2.16473388671875, 2.2374267578125, 2.31011962890625, 2.3828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 8.0, 12.0, 13.0, 5.0, 11.0, 10.0, 17.0, 17.0, 16.0, 21.0, 29.0, 33.0, 28.0, 33.0, 32.0, 32.0, 47.0, 31.0, 51.0, 36.0, 34.0, 32.0, 42.0, 30.0, 36.0, 40.0, 24.0, 33.0, 33.0, 21.0, 24.0, 20.0, 25.0, 20.0, 15.0, 16.0, 9.0, 10.0, 11.0, 10.0, 0.0, 6.0, 5.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-10.265625, -9.9615478515625, -9.657470703125, -9.3533935546875, -9.04931640625, -8.7452392578125, -8.441162109375, -8.1370849609375, -7.8330078125, -7.5289306640625, -7.224853515625, -6.9207763671875, -6.61669921875, -6.3126220703125, -6.008544921875, -5.7044677734375, -5.400390625, -5.0963134765625, -4.792236328125, -4.4881591796875, -4.18408203125, -3.8800048828125, -3.575927734375, -3.2718505859375, -2.9677734375, -2.6636962890625, -2.359619140625, -2.0555419921875, -1.75146484375, -1.4473876953125, -1.143310546875, -0.8392333984375, -0.53515625, -0.2310791015625, 0.072998046875, 0.3770751953125, 0.68115234375, 0.9852294921875, 1.289306640625, 1.5933837890625, 1.8974609375, 2.2015380859375, 2.505615234375, 2.8096923828125, 3.11376953125, 3.4178466796875, 3.721923828125, 4.0260009765625, 4.330078125, 4.6341552734375, 4.938232421875, 5.2423095703125, 5.54638671875, 5.8504638671875, 6.154541015625, 6.4586181640625, 6.7626953125, 7.0667724609375, 7.370849609375, 7.6749267578125, 7.97900390625, 8.2830810546875, 8.587158203125, 8.8912353515625, 9.1953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 7.0, 6.0, 9.0, 12.0, 24.0, 29.0, 44.0, 49.0, 79.0, 107.0, 172.0, 268.0, 381.0, 629.0, 1113.0, 1985.0, 3996.0, 8287.0, 18623.0, 47583.0, 127254.0, 283968.0, 308059.0, 148888.0, 56203.0, 21766.0, 9325.0, 4336.0, 2221.0, 1197.0, 689.0, 431.0, 276.0, 189.0, 111.0, 58.0, 55.0, 39.0, 21.0, 19.0, 11.0, 9.0, 11.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.49100494384765625, -0.4746856689453125, -0.45836639404296875, -0.442047119140625, -0.42572784423828125, -0.4094085693359375, -0.39308929443359375, -0.37677001953125, -0.36045074462890625, -0.3441314697265625, -0.32781219482421875, -0.311492919921875, -0.29517364501953125, -0.2788543701171875, -0.26253509521484375, -0.2462158203125, -0.22989654541015625, -0.2135772705078125, -0.19725799560546875, -0.180938720703125, -0.16461944580078125, -0.1483001708984375, -0.13198089599609375, -0.11566162109375, -0.09934234619140625, -0.0830230712890625, -0.06670379638671875, -0.050384521484375, -0.03406524658203125, -0.0177459716796875, -0.00142669677734375, 0.014892578125, 0.03121185302734375, 0.0475311279296875, 0.06385040283203125, 0.080169677734375, 0.09648895263671875, 0.1128082275390625, 0.12912750244140625, 0.14544677734375, 0.16176605224609375, 0.1780853271484375, 0.19440460205078125, 0.210723876953125, 0.22704315185546875, 0.2433624267578125, 0.25968170166015625, 0.2760009765625, 0.29232025146484375, 0.3086395263671875, 0.32495880126953125, 0.341278076171875, 0.35759735107421875, 0.3739166259765625, 0.39023590087890625, 0.40655517578125, 0.42287445068359375, 0.4391937255859375, 0.45551300048828125, 0.471832275390625, 0.48815155029296875, 0.5044708251953125, 0.5207901000976562, 0.537109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 9.0, 11.0, 17.0, 28.0, 27.0, 41.0, 44.0, 77.0, 95.0, 111.0, 98.0, 99.0, 87.0, 71.0, 41.0, 26.0, 28.0, 14.0, 11.0, 6.0, 11.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.053945541381836e-05, -8.772220462560654e-05, -8.490495383739471e-05, -8.208770304918289e-05, -7.927045226097107e-05, -7.645320147275925e-05, -7.363595068454742e-05, -7.08186998963356e-05, -6.800144910812378e-05, -6.518419831991196e-05, -6.236694753170013e-05, -5.954969674348831e-05, -5.673244595527649e-05, -5.391519516706467e-05, -5.1097944378852844e-05, -4.828069359064102e-05, -4.54634428024292e-05, -4.264619201421738e-05, -3.9828941226005554e-05, -3.701169043779373e-05, -3.419443964958191e-05, -3.137718886137009e-05, -2.8559938073158264e-05, -2.574268728494644e-05, -2.292543649673462e-05, -2.0108185708522797e-05, -1.7290934920310974e-05, -1.4473684132099152e-05, -1.1656433343887329e-05, -8.839182555675507e-06, -6.021931767463684e-06, -3.2046809792518616e-06, -3.8743019104003906e-07, 2.4298205971717834e-06, 5.247071385383606e-06, 8.064322173595428e-06, 1.0881572961807251e-05, 1.3698823750019073e-05, 1.6516074538230896e-05, 1.933332532644272e-05, 2.215057611465454e-05, 2.4967826902866364e-05, 2.7785077691078186e-05, 3.060232847929001e-05, 3.341957926750183e-05, 3.6236830055713654e-05, 3.9054080843925476e-05, 4.18713316321373e-05, 4.468858242034912e-05, 4.7505833208560944e-05, 5.0323083996772766e-05, 5.314033478498459e-05, 5.595758557319641e-05, 5.8774836361408234e-05, 6.159208714962006e-05, 6.440933793783188e-05, 6.72265887260437e-05, 7.004383951425552e-05, 7.286109030246735e-05, 7.567834109067917e-05, 7.849559187889099e-05, 8.131284266710281e-05, 8.413009345531464e-05, 8.694734424352646e-05, 8.976459503173828e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 9.0, 28.0, 31.0, 64.0, 64.0, 92.0, 121.0, 203.0, 269.0, 434.0, 550.0, 887.0, 1377.0, 2076.0, 3377.0, 5449.0, 9640.0, 17418.0, 33076.0, 67358.0, 136367.0, 241682.0, 244162.0, 138766.0, 68479.0, 34110.0, 17662.0, 9553.0, 5538.0, 3476.0, 2051.0, 1328.0, 899.0, 633.0, 390.0, 279.0, 185.0, 126.0, 86.0, 80.0, 42.0, 34.0, 26.0, 23.0, 17.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.875, -0.849273681640625, -0.82354736328125, -0.797821044921875, -0.7720947265625, -0.746368408203125, -0.72064208984375, -0.694915771484375, -0.669189453125, -0.643463134765625, -0.61773681640625, -0.592010498046875, -0.5662841796875, -0.540557861328125, -0.51483154296875, -0.489105224609375, -0.46337890625, -0.437652587890625, -0.41192626953125, -0.386199951171875, -0.3604736328125, -0.334747314453125, -0.30902099609375, -0.283294677734375, -0.257568359375, -0.231842041015625, -0.20611572265625, -0.180389404296875, -0.1546630859375, -0.128936767578125, -0.10321044921875, -0.077484130859375, -0.0517578125, -0.026031494140625, -0.00030517578125, 0.025421142578125, 0.0511474609375, 0.076873779296875, 0.10260009765625, 0.128326416015625, 0.154052734375, 0.179779052734375, 0.20550537109375, 0.231231689453125, 0.2569580078125, 0.282684326171875, 0.30841064453125, 0.334136962890625, 0.35986328125, 0.385589599609375, 0.41131591796875, 0.437042236328125, 0.4627685546875, 0.488494873046875, 0.51422119140625, 0.539947509765625, 0.565673828125, 0.591400146484375, 0.61712646484375, 0.642852783203125, 0.6685791015625, 0.694305419921875, 0.72003173828125, 0.745758056640625, 0.771484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 9.0, 12.0, 14.0, 12.0, 16.0, 17.0, 29.0, 30.0, 29.0, 36.0, 42.0, 50.0, 50.0, 49.0, 66.0, 64.0, 49.0, 54.0, 45.0, 44.0, 37.0, 32.0, 36.0, 19.0, 14.0, 22.0, 23.0, 16.0, 11.0, 6.0, 8.0, 11.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0], "bins": [-0.22265625, -0.21608352661132812, -0.20951080322265625, -0.20293807983398438, -0.1963653564453125, -0.18979263305664062, -0.18321990966796875, -0.17664718627929688, -0.170074462890625, -0.16350173950195312, -0.15692901611328125, -0.15035629272460938, -0.1437835693359375, -0.13721084594726562, -0.13063812255859375, -0.12406539916992188, -0.11749267578125, -0.11091995239257812, -0.10434722900390625, -0.09777450561523438, -0.0912017822265625, -0.08462905883789062, -0.07805633544921875, -0.07148361206054688, -0.064910888671875, -0.058338165283203125, -0.05176544189453125, -0.045192718505859375, -0.0386199951171875, -0.032047271728515625, -0.02547454833984375, -0.018901824951171875, -0.0123291015625, -0.005756378173828125, 0.00081634521484375, 0.007389068603515625, 0.0139617919921875, 0.020534515380859375, 0.02710723876953125, 0.033679962158203125, 0.040252685546875, 0.046825408935546875, 0.05339813232421875, 0.059970855712890625, 0.0665435791015625, 0.07311630249023438, 0.07968902587890625, 0.08626174926757812, 0.09283447265625, 0.09940719604492188, 0.10597991943359375, 0.11255264282226562, 0.1191253662109375, 0.12569808959960938, 0.13227081298828125, 0.13884353637695312, 0.145416259765625, 0.15198898315429688, 0.15856170654296875, 0.16513442993164062, 0.1717071533203125, 0.17827987670898438, 0.18485260009765625, 0.19142532348632812, 0.197998046875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 3.0, 9.0, 17.0, 13.0, 21.0, 28.0, 24.0, 32.0, 38.0, 33.0, 42.0, 42.0, 56.0, 62.0, 57.0, 59.0, 53.0, 65.0, 44.0, 51.0, 44.0, 34.0, 24.0, 29.0, 29.0, 22.0, 15.0, 16.0, 9.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.706798553466797, -17.189796447753906, -16.672792434692383, -16.155790328979492, -15.638788223266602, -15.121785163879395, -14.604782104492188, -14.087779998779297, -13.57077693939209, -13.053773880004883, -12.536771774291992, -12.019768714904785, -11.502765655517578, -10.985763549804688, -10.46876049041748, -9.951757431030273, -9.434755325317383, -8.917752265930176, -8.400750160217285, -7.883747100830078, -7.366744518280029, -6.8497419357299805, -6.332738876342773, -5.815736293792725, -5.298733711242676, -4.781731128692627, -4.264728546142578, -3.747725486755371, -3.2307229042053223, -2.7137203216552734, -2.1967175006866455, -1.6797146797180176, -1.162710189819336, -0.6457074880599976, -0.12870478630065918, 0.3882979154586792, 0.9053006172180176, 1.4223031997680664, 1.9393060207366943, 2.4563088417053223, 2.973311424255371, 3.49031400680542, 4.007316589355469, 4.524319648742676, 5.041322231292725, 5.558324813842773, 6.0753278732299805, 6.592330455780029, 7.109333038330078, 7.626335620880127, 8.143338203430176, 8.660341262817383, 9.177343368530273, 9.69434642791748, 10.211349487304688, 10.728351593017578, 11.245354652404785, 11.762357711791992, 12.279359817504883, 12.79636287689209, 13.313365936279297, 13.830368041992188, 14.347371101379395, 14.864374160766602, 15.381376266479492]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 4.0, 10.0, 11.0, 11.0, 7.0, 11.0, 12.0, 15.0, 15.0, 24.0, 24.0, 23.0, 27.0, 38.0, 39.0, 37.0, 26.0, 39.0, 49.0, 38.0, 53.0, 53.0, 36.0, 39.0, 31.0, 46.0, 41.0, 39.0, 32.0, 23.0, 23.0, 22.0, 22.0, 15.0, 13.0, 14.0, 7.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.27195930480957, -16.76767921447754, -16.263399124145508, -15.75911808013916, -15.254837036132812, -14.750556945800781, -14.24627685546875, -13.741995811462402, -13.237714767456055, -12.733434677124023, -12.229153633117676, -11.724873542785645, -11.220592498779297, -10.716312408447266, -10.212032318115234, -9.707751274108887, -9.203471183776855, -8.699191093444824, -8.194910049438477, -7.690629959106445, -7.186348915100098, -6.682068824768066, -6.177788257598877, -5.6735076904296875, -5.169227123260498, -4.664946556091309, -4.160665988922119, -3.656385660171509, -3.1521050930023193, -2.64782452583313, -2.1435441970825195, -1.63926362991333, -1.1349821090698242, -0.6307016015052795, -0.12642109394073486, 0.37785935401916504, 0.8821399211883545, 1.386420488357544, 1.8907008171081543, 2.3949813842773438, 2.899261951446533, 3.4035425186157227, 3.907823085784912, 4.412103652954102, 4.916383743286133, 5.4206647872924805, 5.924944877624512, 6.429225444793701, 6.933506011962891, 7.43778657913208, 7.9420671463012695, 8.4463472366333, 8.950628280639648, 9.45490837097168, 9.959188461303711, 10.463469505310059, 10.967750549316406, 11.472030639648438, 11.976311683654785, 12.480591773986816, 12.984872817993164, 13.489152908325195, 13.993432998657227, 14.497714042663574, 15.001994132995605]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 22.0, 28.0, 41.0, 82.0, 89.0, 171.0, 230.0, 386.0, 668.0, 1029.0, 1648.0, 2484.0, 3718.0, 6034.0, 8833.0, 13091.0, 19132.0, 26699.0, 36459.0, 48101.0, 60826.0, 73757.0, 84821.0, 92462.0, 94994.0, 92184.0, 84109.0, 72572.0, 59700.0, 47336.0, 35509.0, 25579.0, 18333.0, 12623.0, 8512.0, 5901.0, 3677.0, 2415.0, 1538.0, 1022.0, 651.0, 404.0, 245.0, 147.0, 111.0, 66.0, 36.0, 25.0, 15.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0], "bins": [-8.390625, -8.13983154296875, -7.8890380859375, -7.63824462890625, -7.387451171875, -7.13665771484375, -6.8858642578125, -6.63507080078125, -6.38427734375, -6.13348388671875, -5.8826904296875, -5.63189697265625, -5.381103515625, -5.13031005859375, -4.8795166015625, -4.62872314453125, -4.3779296875, -4.12713623046875, -3.8763427734375, -3.62554931640625, -3.374755859375, -3.12396240234375, -2.8731689453125, -2.62237548828125, -2.37158203125, -2.12078857421875, -1.8699951171875, -1.61920166015625, -1.368408203125, -1.11761474609375, -0.8668212890625, -0.61602783203125, -0.365234375, -0.11444091796875, 0.1363525390625, 0.38714599609375, 0.637939453125, 0.88873291015625, 1.1395263671875, 1.39031982421875, 1.64111328125, 1.89190673828125, 2.1427001953125, 2.39349365234375, 2.644287109375, 2.89508056640625, 3.1458740234375, 3.39666748046875, 3.6474609375, 3.89825439453125, 4.1490478515625, 4.39984130859375, 4.650634765625, 4.90142822265625, 5.1522216796875, 5.40301513671875, 5.65380859375, 5.90460205078125, 6.1553955078125, 6.40618896484375, 6.656982421875, 6.90777587890625, 7.1585693359375, 7.40936279296875, 7.66015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 0.0, 3.0, 6.0, 12.0, 7.0, 8.0, 13.0, 19.0, 17.0, 16.0, 15.0, 27.0, 22.0, 28.0, 28.0, 40.0, 31.0, 44.0, 43.0, 52.0, 43.0, 40.0, 53.0, 34.0, 43.0, 41.0, 34.0, 41.0, 24.0, 38.0, 31.0, 27.0, 21.0, 22.0, 11.0, 14.0, 12.0, 10.0, 7.0, 5.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.200927734375, -15.68310546875, -15.165283203125, -14.6474609375, -14.129638671875, -13.61181640625, -13.093994140625, -12.576171875, -12.058349609375, -11.54052734375, -11.022705078125, -10.5048828125, -9.987060546875, -9.46923828125, -8.951416015625, -8.43359375, -7.915771484375, -7.39794921875, -6.880126953125, -6.3623046875, -5.844482421875, -5.32666015625, -4.808837890625, -4.291015625, -3.773193359375, -3.25537109375, -2.737548828125, -2.2197265625, -1.701904296875, -1.18408203125, -0.666259765625, -0.1484375, 0.369384765625, 0.88720703125, 1.405029296875, 1.9228515625, 2.440673828125, 2.95849609375, 3.476318359375, 3.994140625, 4.511962890625, 5.02978515625, 5.547607421875, 6.0654296875, 6.583251953125, 7.10107421875, 7.618896484375, 8.13671875, 8.654541015625, 9.17236328125, 9.690185546875, 10.2080078125, 10.725830078125, 11.24365234375, 11.761474609375, 12.279296875, 12.797119140625, 13.31494140625, 13.832763671875, 14.3505859375, 14.868408203125, 15.38623046875, 15.904052734375, 16.421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 9.0, 16.0, 26.0, 44.0, 62.0, 123.0, 187.0, 352.0, 583.0, 934.0, 1553.0, 2629.0, 4262.0, 6725.0, 10608.0, 16497.0, 24861.0, 36316.0, 50237.0, 66804.0, 84756.0, 98129.0, 106625.0, 108138.0, 100517.0, 87807.0, 70753.0, 53868.0, 39042.0, 26969.0, 17868.0, 11712.0, 7427.0, 4790.0, 2958.0, 1765.0, 1041.0, 617.0, 396.0, 235.0, 135.0, 73.0, 52.0, 24.0, 12.0, 13.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.0830078125, -8.791015625, -8.4990234375, -8.20703125, -7.9150390625, -7.623046875, -7.3310546875, -7.0390625, -6.7470703125, -6.455078125, -6.1630859375, -5.87109375, -5.5791015625, -5.287109375, -4.9951171875, -4.703125, -4.4111328125, -4.119140625, -3.8271484375, -3.53515625, -3.2431640625, -2.951171875, -2.6591796875, -2.3671875, -2.0751953125, -1.783203125, -1.4912109375, -1.19921875, -0.9072265625, -0.615234375, -0.3232421875, -0.03125, 0.2607421875, 0.552734375, 0.8447265625, 1.13671875, 1.4287109375, 1.720703125, 2.0126953125, 2.3046875, 2.5966796875, 2.888671875, 3.1806640625, 3.47265625, 3.7646484375, 4.056640625, 4.3486328125, 4.640625, 4.9326171875, 5.224609375, 5.5166015625, 5.80859375, 6.1005859375, 6.392578125, 6.6845703125, 6.9765625, 7.2685546875, 7.560546875, 7.8525390625, 8.14453125, 8.4365234375, 8.728515625, 9.0205078125, 9.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 11.0, 15.0, 23.0, 21.0, 24.0, 27.0, 39.0, 43.0, 36.0, 32.0, 44.0, 49.0, 43.0, 45.0, 32.0, 41.0, 32.0, 41.0, 43.0, 39.0, 34.0, 29.0, 36.0, 32.0, 23.0, 26.0, 19.0, 18.0, 11.0, 21.0, 18.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -11.048828125, -10.69921875, -10.349609375, -10.0, -9.650390625, -9.30078125, -8.951171875, -8.6015625, -8.251953125, -7.90234375, -7.552734375, -7.203125, -6.853515625, -6.50390625, -6.154296875, -5.8046875, -5.455078125, -5.10546875, -4.755859375, -4.40625, -4.056640625, -3.70703125, -3.357421875, -3.0078125, -2.658203125, -2.30859375, -1.958984375, -1.609375, -1.259765625, -0.91015625, -0.560546875, -0.2109375, 0.138671875, 0.48828125, 0.837890625, 1.1875, 1.537109375, 1.88671875, 2.236328125, 2.5859375, 2.935546875, 3.28515625, 3.634765625, 3.984375, 4.333984375, 4.68359375, 5.033203125, 5.3828125, 5.732421875, 6.08203125, 6.431640625, 6.78125, 7.130859375, 7.48046875, 7.830078125, 8.1796875, 8.529296875, 8.87890625, 9.228515625, 9.578125, 9.927734375, 10.27734375, 10.626953125, 10.9765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 14.0, 9.0, 26.0, 37.0, 69.0, 92.0, 184.0, 288.0, 600.0, 1011.0, 1629.0, 2833.0, 4962.0, 8573.0, 14464.0, 23983.0, 37318.0, 56368.0, 79681.0, 103234.0, 120714.0, 127692.0, 121830.0, 103809.0, 81547.0, 57865.0, 38808.0, 24686.0, 15114.0, 8796.0, 5265.0, 2973.0, 1733.0, 968.0, 557.0, 359.0, 189.0, 112.0, 72.0, 36.0, 23.0, 13.0, 8.0, 6.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.25, -4.130401611328125, -4.01080322265625, -3.891204833984375, -3.7716064453125, -3.652008056640625, -3.53240966796875, -3.412811279296875, -3.293212890625, -3.173614501953125, -3.05401611328125, -2.934417724609375, -2.8148193359375, -2.695220947265625, -2.57562255859375, -2.456024169921875, -2.33642578125, -2.216827392578125, -2.09722900390625, -1.977630615234375, -1.8580322265625, -1.738433837890625, -1.61883544921875, -1.499237060546875, -1.379638671875, -1.260040283203125, -1.14044189453125, -1.020843505859375, -0.9012451171875, -0.781646728515625, -0.66204833984375, -0.542449951171875, -0.4228515625, -0.303253173828125, -0.18365478515625, -0.064056396484375, 0.0555419921875, 0.175140380859375, 0.29473876953125, 0.414337158203125, 0.533935546875, 0.653533935546875, 0.77313232421875, 0.892730712890625, 1.0123291015625, 1.131927490234375, 1.25152587890625, 1.371124267578125, 1.49072265625, 1.610321044921875, 1.72991943359375, 1.849517822265625, 1.9691162109375, 2.088714599609375, 2.20831298828125, 2.327911376953125, 2.447509765625, 2.567108154296875, 2.68670654296875, 2.806304931640625, 2.9259033203125, 3.045501708984375, 3.16510009765625, 3.284698486328125, 3.404296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 4.0, 9.0, 10.0, 11.0, 11.0, 19.0, 26.0, 19.0, 23.0, 33.0, 24.0, 33.0, 37.0, 39.0, 44.0, 42.0, 48.0, 42.0, 53.0, 42.0, 41.0, 31.0, 35.0, 43.0, 22.0, 29.0, 28.0, 22.0, 28.0, 22.0, 23.0, 16.0, 13.0, 9.0, 12.0, 9.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003452301025390625, -0.00033386796712875366, -0.0003225058317184448, -0.000311143696308136, -0.00029978156089782715, -0.0002884194254875183, -0.00027705729007720947, -0.00026569515466690063, -0.0002543330192565918, -0.00024297088384628296, -0.00023160874843597412, -0.00022024661302566528, -0.00020888447761535645, -0.0001975223422050476, -0.00018616020679473877, -0.00017479807138442993, -0.0001634359359741211, -0.00015207380056381226, -0.00014071166515350342, -0.00012934952974319458, -0.00011798739433288574, -0.0001066252589225769, -9.526312351226807e-05, -8.390098810195923e-05, -7.253885269165039e-05, -6.117671728134155e-05, -4.9814581871032715e-05, -3.845244646072388e-05, -2.709031105041504e-05, -1.57281756401062e-05, -4.366040229797363e-06, 6.996095180511475e-06, 1.8358230590820312e-05, 2.972036600112915e-05, 4.108250141143799e-05, 5.2444636821746826e-05, 6.380677223205566e-05, 7.51689076423645e-05, 8.653104305267334e-05, 9.789317846298218e-05, 0.00010925531387329102, 0.00012061744928359985, 0.0001319795846939087, 0.00014334172010421753, 0.00015470385551452637, 0.0001660659909248352, 0.00017742812633514404, 0.00018879026174545288, 0.00020015239715576172, 0.00021151453256607056, 0.0002228766679763794, 0.00023423880338668823, 0.00024560093879699707, 0.0002569630742073059, 0.00026832520961761475, 0.0002796873450279236, 0.0002910494804382324, 0.00030241161584854126, 0.0003137737512588501, 0.00032513588666915894, 0.0003364980220794678, 0.0003478601574897766, 0.00035922229290008545, 0.0003705844283103943, 0.0003819465637207031]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 28.0, 23.0, 51.0, 82.0, 126.0, 226.0, 394.0, 640.0, 1109.0, 2092.0, 3587.0, 6393.0, 10830.0, 17864.0, 29482.0, 46154.0, 68897.0, 94677.0, 118792.0, 132755.0, 131173.0, 115499.0, 90913.0, 65362.0, 43974.0, 27667.0, 16451.0, 9973.0, 5556.0, 3315.0, 1879.0, 1089.0, 627.0, 342.0, 201.0, 113.0, 85.0, 52.0, 24.0, 13.0, 11.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.24609375, -4.11309814453125, -3.9801025390625, -3.84710693359375, -3.714111328125, -3.58111572265625, -3.4481201171875, -3.31512451171875, -3.18212890625, -3.04913330078125, -2.9161376953125, -2.78314208984375, -2.650146484375, -2.51715087890625, -2.3841552734375, -2.25115966796875, -2.1181640625, -1.98516845703125, -1.8521728515625, -1.71917724609375, -1.586181640625, -1.45318603515625, -1.3201904296875, -1.18719482421875, -1.05419921875, -0.92120361328125, -0.7882080078125, -0.65521240234375, -0.522216796875, -0.38922119140625, -0.2562255859375, -0.12322998046875, 0.009765625, 0.14276123046875, 0.2757568359375, 0.40875244140625, 0.541748046875, 0.67474365234375, 0.8077392578125, 0.94073486328125, 1.07373046875, 1.20672607421875, 1.3397216796875, 1.47271728515625, 1.605712890625, 1.73870849609375, 1.8717041015625, 2.00469970703125, 2.1376953125, 2.27069091796875, 2.4036865234375, 2.53668212890625, 2.669677734375, 2.80267333984375, 2.9356689453125, 3.06866455078125, 3.20166015625, 3.33465576171875, 3.4676513671875, 3.60064697265625, 3.733642578125, 3.86663818359375, 3.9996337890625, 4.13262939453125, 4.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 13.0, 15.0, 22.0, 27.0, 30.0, 30.0, 20.0, 43.0, 37.0, 51.0, 37.0, 50.0, 45.0, 52.0, 56.0, 42.0, 51.0, 46.0, 38.0, 24.0, 28.0, 29.0, 26.0, 21.0, 18.0, 19.0, 16.0, 13.0, 12.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5214385986328125, -1.471588134765625, -1.4217376708984375, -1.37188720703125, -1.3220367431640625, -1.272186279296875, -1.2223358154296875, -1.1724853515625, -1.1226348876953125, -1.072784423828125, -1.0229339599609375, -0.97308349609375, -0.9232330322265625, -0.873382568359375, -0.8235321044921875, -0.773681640625, -0.7238311767578125, -0.673980712890625, -0.6241302490234375, -0.57427978515625, -0.5244293212890625, -0.474578857421875, -0.4247283935546875, -0.3748779296875, -0.3250274658203125, -0.275177001953125, -0.2253265380859375, -0.17547607421875, -0.1256256103515625, -0.075775146484375, -0.0259246826171875, 0.02392578125, 0.0737762451171875, 0.123626708984375, 0.1734771728515625, 0.22332763671875, 0.2731781005859375, 0.323028564453125, 0.3728790283203125, 0.4227294921875, 0.4725799560546875, 0.522430419921875, 0.5722808837890625, 0.62213134765625, 0.6719818115234375, 0.721832275390625, 0.7716827392578125, 0.821533203125, 0.8713836669921875, 0.921234130859375, 0.9710845947265625, 1.02093505859375, 1.0707855224609375, 1.120635986328125, 1.1704864501953125, 1.2203369140625, 1.2701873779296875, 1.320037841796875, 1.3698883056640625, 1.41973876953125, 1.4695892333984375, 1.519439697265625, 1.5692901611328125, 1.619140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 13.0, 10.0, 21.0, 27.0, 36.0, 17.0, 43.0, 46.0, 47.0, 41.0, 53.0, 60.0, 69.0, 63.0, 68.0, 63.0, 44.0, 46.0, 35.0, 37.0, 31.0, 28.0, 29.0, 20.0, 8.0, 9.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5992431640625, -18.036405563354492, -17.473567962646484, -16.910730361938477, -16.34789276123047, -15.785055160522461, -15.222217559814453, -14.659379959106445, -14.096542358398438, -13.53370475769043, -12.970867156982422, -12.408029556274414, -11.845191955566406, -11.282354354858398, -10.71951675415039, -10.156679153442383, -9.593842506408691, -9.031004905700684, -8.468167304992676, -7.905329704284668, -7.34249210357666, -6.779654502868652, -6.216817378997803, -5.653979778289795, -5.091142177581787, -4.528304576873779, -3.9654669761657715, -3.4026296138763428, -2.839792013168335, -2.276954412460327, -1.7141170501708984, -1.1512794494628906, -0.5884418487548828, -0.025604307651519775, 0.5372332334518433, 1.1000707149505615, 1.6629083156585693, 2.225745916366577, 2.788583278656006, 3.3514208793640137, 3.9142584800720215, 4.477096080780029, 5.039933681488037, 5.602770805358887, 6.1656084060668945, 6.728446006774902, 7.29128360748291, 7.854121208190918, 8.416958808898926, 8.979796409606934, 9.542634010314941, 10.10547161102295, 10.668309211730957, 11.231146812438965, 11.793983459472656, 12.356821060180664, 12.919658660888672, 13.48249626159668, 14.045333862304688, 14.608171463012695, 15.171009063720703, 15.733846664428711, 16.29668426513672, 16.859521865844727, 17.422359466552734]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 7.0, 13.0, 4.0, 5.0, 14.0, 18.0, 18.0, 16.0, 13.0, 23.0, 29.0, 27.0, 35.0, 34.0, 50.0, 51.0, 48.0, 47.0, 46.0, 54.0, 48.0, 39.0, 51.0, 32.0, 40.0, 45.0, 31.0, 24.0, 36.0, 21.0, 14.0, 7.0, 20.0, 13.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.871850967407227, -17.271791458129883, -16.67173194885254, -16.071670532226562, -15.471611022949219, -14.871551513671875, -14.271492004394531, -13.671432495117188, -13.071372032165527, -12.471312522888184, -11.871252059936523, -11.27119255065918, -10.671133041381836, -10.071072578430176, -9.471013069152832, -8.870952606201172, -8.270893096923828, -7.670833110809326, -7.070773124694824, -6.4707136154174805, -5.8706536293029785, -5.270593643188477, -4.670534133911133, -4.070474147796631, -3.470414161682129, -2.870354175567627, -2.270294427871704, -1.6702345609664917, -1.0701746940612793, -0.47011470794677734, 0.1299450397491455, 0.7300047874450684, 1.3300666809082031, 1.9301265478134155, 2.530186414718628, 3.130246162414551, 3.7303061485290527, 4.330366134643555, 4.930425643920898, 5.5304856300354, 6.130545616149902, 6.730605602264404, 7.330665588378906, 7.93072509765625, 8.530784606933594, 9.130845069885254, 9.730904579162598, 10.330965042114258, 10.931024551391602, 11.531084060668945, 12.131144523620605, 12.73120403289795, 13.33126449584961, 13.931324005126953, 14.531383514404297, 15.13144302368164, 15.7315034866333, 16.33156394958496, 16.931623458862305, 17.53168296813965, 18.131742477416992, 18.73180389404297, 19.331863403320312, 19.931922912597656, 20.531982421875]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 17.0, 26.0, 37.0, 90.0, 130.0, 187.0, 328.0, 594.0, 925.0, 1619.0, 2498.0, 4162.0, 6696.0, 10928.0, 17160.0, 27099.0, 41124.0, 62619.0, 91985.0, 132055.0, 179879.0, 237172.0, 297296.0, 352547.0, 390698.0, 406870.0, 395603.0, 360604.0, 307524.0, 248377.0, 190261.0, 138978.0, 97723.0, 67057.0, 45006.0, 29376.0, 18832.0, 11915.0, 7392.0, 4375.0, 2604.0, 1613.0, 949.0, 583.0, 343.0, 178.0, 113.0, 70.0, 33.0, 27.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.859375, -9.556884765625, -9.25439453125, -8.951904296875, -8.6494140625, -8.346923828125, -8.04443359375, -7.741943359375, -7.439453125, -7.136962890625, -6.83447265625, -6.531982421875, -6.2294921875, -5.927001953125, -5.62451171875, -5.322021484375, -5.01953125, -4.717041015625, -4.41455078125, -4.112060546875, -3.8095703125, -3.507080078125, -3.20458984375, -2.902099609375, -2.599609375, -2.297119140625, -1.99462890625, -1.692138671875, -1.3896484375, -1.087158203125, -0.78466796875, -0.482177734375, -0.1796875, 0.122802734375, 0.42529296875, 0.727783203125, 1.0302734375, 1.332763671875, 1.63525390625, 1.937744140625, 2.240234375, 2.542724609375, 2.84521484375, 3.147705078125, 3.4501953125, 3.752685546875, 4.05517578125, 4.357666015625, 4.66015625, 4.962646484375, 5.26513671875, 5.567626953125, 5.8701171875, 6.172607421875, 6.47509765625, 6.777587890625, 7.080078125, 7.382568359375, 7.68505859375, 7.987548828125, 8.2900390625, 8.592529296875, 8.89501953125, 9.197509765625, 9.5]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 4.0, 6.0, 4.0, 7.0, 6.0, 9.0, 8.0, 13.0, 15.0, 20.0, 25.0, 29.0, 20.0, 48.0, 31.0, 35.0, 47.0, 47.0, 64.0, 45.0, 50.0, 50.0, 39.0, 44.0, 45.0, 42.0, 42.0, 32.0, 20.0, 33.0, 21.0, 23.0, 22.0, 7.0, 13.0, 8.0, 12.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.339111328125, -13.85009765625, -13.361083984375, -12.8720703125, -12.383056640625, -11.89404296875, -11.405029296875, -10.916015625, -10.427001953125, -9.93798828125, -9.448974609375, -8.9599609375, -8.470947265625, -7.98193359375, -7.492919921875, -7.00390625, -6.514892578125, -6.02587890625, -5.536865234375, -5.0478515625, -4.558837890625, -4.06982421875, -3.580810546875, -3.091796875, -2.602783203125, -2.11376953125, -1.624755859375, -1.1357421875, -0.646728515625, -0.15771484375, 0.331298828125, 0.8203125, 1.309326171875, 1.79833984375, 2.287353515625, 2.7763671875, 3.265380859375, 3.75439453125, 4.243408203125, 4.732421875, 5.221435546875, 5.71044921875, 6.199462890625, 6.6884765625, 7.177490234375, 7.66650390625, 8.155517578125, 8.64453125, 9.133544921875, 9.62255859375, 10.111572265625, 10.6005859375, 11.089599609375, 11.57861328125, 12.067626953125, 12.556640625, 13.045654296875, 13.53466796875, 14.023681640625, 14.5126953125, 15.001708984375, 15.49072265625, 15.979736328125, 16.46875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 10.0, 13.0, 26.0, 32.0, 79.0, 117.0, 238.0, 371.0, 589.0, 998.0, 1865.0, 2979.0, 5077.0, 8205.0, 13124.0, 21008.0, 32613.0, 48783.0, 72960.0, 102716.0, 142112.0, 186394.0, 237821.0, 286686.0, 330217.0, 360527.0, 373490.0, 366472.0, 340812.0, 299855.0, 252942.0, 201233.0, 155105.0, 113235.0, 80920.0, 55397.0, 36789.0, 23795.0, 15153.0, 9340.0, 5759.0, 3373.0, 2181.0, 1205.0, 726.0, 403.0, 239.0, 135.0, 69.0, 56.0, 28.0, 12.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.8671875, -9.56494140625, -9.2626953125, -8.96044921875, -8.658203125, -8.35595703125, -8.0537109375, -7.75146484375, -7.44921875, -7.14697265625, -6.8447265625, -6.54248046875, -6.240234375, -5.93798828125, -5.6357421875, -5.33349609375, -5.03125, -4.72900390625, -4.4267578125, -4.12451171875, -3.822265625, -3.52001953125, -3.2177734375, -2.91552734375, -2.61328125, -2.31103515625, -2.0087890625, -1.70654296875, -1.404296875, -1.10205078125, -0.7998046875, -0.49755859375, -0.1953125, 0.10693359375, 0.4091796875, 0.71142578125, 1.013671875, 1.31591796875, 1.6181640625, 1.92041015625, 2.22265625, 2.52490234375, 2.8271484375, 3.12939453125, 3.431640625, 3.73388671875, 4.0361328125, 4.33837890625, 4.640625, 4.94287109375, 5.2451171875, 5.54736328125, 5.849609375, 6.15185546875, 6.4541015625, 6.75634765625, 7.05859375, 7.36083984375, 7.6630859375, 7.96533203125, 8.267578125, 8.56982421875, 8.8720703125, 9.17431640625, 9.4765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 11.0, 12.0, 14.0, 23.0, 23.0, 30.0, 59.0, 60.0, 59.0, 72.0, 97.0, 79.0, 111.0, 141.0, 143.0, 160.0, 175.0, 179.0, 197.0, 181.0, 191.0, 201.0, 185.0, 177.0, 191.0, 155.0, 169.0, 150.0, 108.0, 102.0, 100.0, 97.0, 64.0, 67.0, 55.0, 46.0, 41.0, 30.0, 24.0, 21.0, 14.0, 8.0, 7.0, 10.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 3.0], "bins": [-6.37890625, -6.1907958984375, -6.002685546875, -5.8145751953125, -5.62646484375, -5.4383544921875, -5.250244140625, -5.0621337890625, -4.8740234375, -4.6859130859375, -4.497802734375, -4.3096923828125, -4.12158203125, -3.9334716796875, -3.745361328125, -3.5572509765625, -3.369140625, -3.1810302734375, -2.992919921875, -2.8048095703125, -2.61669921875, -2.4285888671875, -2.240478515625, -2.0523681640625, -1.8642578125, -1.6761474609375, -1.488037109375, -1.2999267578125, -1.11181640625, -0.9237060546875, -0.735595703125, -0.5474853515625, -0.359375, -0.1712646484375, 0.016845703125, 0.2049560546875, 0.39306640625, 0.5811767578125, 0.769287109375, 0.9573974609375, 1.1455078125, 1.3336181640625, 1.521728515625, 1.7098388671875, 1.89794921875, 2.0860595703125, 2.274169921875, 2.4622802734375, 2.650390625, 2.8385009765625, 3.026611328125, 3.2147216796875, 3.40283203125, 3.5909423828125, 3.779052734375, 3.9671630859375, 4.1552734375, 4.3433837890625, 4.531494140625, 4.7196044921875, 4.90771484375, 5.0958251953125, 5.283935546875, 5.4720458984375, 5.66015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 5.0, 14.0, 8.0, 21.0, 16.0, 17.0, 25.0, 36.0, 28.0, 35.0, 40.0, 43.0, 39.0, 51.0, 52.0, 57.0, 47.0, 52.0, 56.0, 34.0, 53.0, 50.0, 31.0, 25.0, 32.0, 25.0, 18.0, 11.0, 19.0, 9.0, 16.0, 7.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.374584197998047, -14.856935501098633, -14.339285850524902, -13.821637153625488, -13.303987503051758, -12.786338806152344, -12.26869010925293, -11.7510404586792, -11.233390808105469, -10.715742111206055, -10.198092460632324, -9.68044376373291, -9.16279411315918, -8.645145416259766, -8.127496719360352, -7.609847068786621, -7.092198371887207, -6.574549198150635, -6.0569000244140625, -5.539251327514648, -5.021601676940918, -4.503952980041504, -3.9863038063049316, -3.4686546325683594, -2.951005458831787, -2.433356285095215, -1.9157072305679321, -1.3980581760406494, -0.8804090023040771, -0.3627598285675049, 0.15488910675048828, 0.6725382804870605, 1.1901874542236328, 1.707836627960205, 2.2254858016967773, 2.7431347370147705, 3.2607839107513428, 3.778433084487915, 4.296082019805908, 4.8137311935424805, 5.331380367279053, 5.849029541015625, 6.366678714752197, 6.8843278884887695, 7.401976585388184, 7.919626235961914, 8.437274932861328, 8.954923629760742, 9.472573280334473, 9.990221977233887, 10.507871627807617, 11.025520324707031, 11.543169975280762, 12.060818672180176, 12.578468322753906, 13.09611701965332, 13.613765716552734, 14.131414413452148, 14.649064064025879, 15.166712760925293, 15.684362411499023, 16.202011108398438, 16.71965980529785, 17.237308502197266, 17.754959106445312]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 4.0, 12.0, 12.0, 18.0, 10.0, 13.0, 12.0, 23.0, 27.0, 29.0, 41.0, 39.0, 32.0, 39.0, 53.0, 42.0, 54.0, 44.0, 49.0, 54.0, 48.0, 43.0, 33.0, 38.0, 37.0, 35.0, 26.0, 15.0, 18.0, 20.0, 17.0, 12.0, 12.0, 8.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.725248336791992, -17.14628791809082, -16.56732749938965, -15.988367080688477, -15.409406661987305, -14.830446243286133, -14.251485824584961, -13.672525405883789, -13.093564987182617, -12.514604568481445, -11.935644149780273, -11.356683731079102, -10.77772331237793, -10.198762893676758, -9.619802474975586, -9.040842056274414, -8.461881637573242, -7.88292121887207, -7.303960800170898, -6.725000381469727, -6.146039962768555, -5.567079544067383, -4.988119125366211, -4.409158706665039, -3.830198287963867, -3.2512378692626953, -2.6722774505615234, -2.0933170318603516, -1.5143566131591797, -0.9353961944580078, -0.35643577575683594, 0.22252464294433594, 0.8014850616455078, 1.3804454803466797, 1.9594058990478516, 2.5383663177490234, 3.1173267364501953, 3.696287155151367, 4.275247573852539, 4.854207992553711, 5.433168411254883, 6.012128829956055, 6.591089248657227, 7.170049667358398, 7.74901008605957, 8.327970504760742, 8.906930923461914, 9.485891342163086, 10.064851760864258, 10.64381217956543, 11.222772598266602, 11.801733016967773, 12.380693435668945, 12.959653854370117, 13.538614273071289, 14.117574691772461, 14.696535110473633, 15.275495529174805, 15.854455947875977, 16.43341636657715, 17.01237678527832, 17.591337203979492, 18.170297622680664, 18.749258041381836, 19.328218460083008]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 9.0, 9.0, 23.0, 28.0, 39.0, 72.0, 129.0, 209.0, 316.0, 460.0, 720.0, 1153.0, 1849.0, 2802.0, 4400.0, 7222.0, 11705.0, 18266.0, 29523.0, 46542.0, 72185.0, 105084.0, 140463.0, 156603.0, 141083.0, 106570.0, 73533.0, 47459.0, 29954.0, 18923.0, 11584.0, 7224.0, 4650.0, 2770.0, 1767.0, 1153.0, 744.0, 493.0, 293.0, 198.0, 129.0, 95.0, 49.0, 25.0, 20.0, 11.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.63763427734375, -2.5565185546875, -2.47540283203125, -2.394287109375, -2.31317138671875, -2.2320556640625, -2.15093994140625, -2.06982421875, -1.98870849609375, -1.9075927734375, -1.82647705078125, -1.745361328125, -1.66424560546875, -1.5831298828125, -1.50201416015625, -1.4208984375, -1.33978271484375, -1.2586669921875, -1.17755126953125, -1.096435546875, -1.01531982421875, -0.9342041015625, -0.85308837890625, -0.77197265625, -0.69085693359375, -0.6097412109375, -0.52862548828125, -0.447509765625, -0.36639404296875, -0.2852783203125, -0.20416259765625, -0.123046875, -0.04193115234375, 0.0391845703125, 0.12030029296875, 0.201416015625, 0.28253173828125, 0.3636474609375, 0.44476318359375, 0.52587890625, 0.60699462890625, 0.6881103515625, 0.76922607421875, 0.850341796875, 0.93145751953125, 1.0125732421875, 1.09368896484375, 1.1748046875, 1.25592041015625, 1.3370361328125, 1.41815185546875, 1.499267578125, 1.58038330078125, 1.6614990234375, 1.74261474609375, 1.82373046875, 1.90484619140625, 1.9859619140625, 2.06707763671875, 2.148193359375, 2.22930908203125, 2.3104248046875, 2.39154052734375, 2.47265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 6.0, 9.0, 7.0, 8.0, 14.0, 14.0, 18.0, 19.0, 21.0, 30.0, 32.0, 37.0, 35.0, 48.0, 41.0, 43.0, 50.0, 51.0, 44.0, 43.0, 47.0, 58.0, 36.0, 35.0, 33.0, 30.0, 27.0, 20.0, 33.0, 28.0, 12.0, 16.0, 10.0, 7.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.235595703125, -16.64306640625, -16.050537109375, -15.4580078125, -14.865478515625, -14.27294921875, -13.680419921875, -13.087890625, -12.495361328125, -11.90283203125, -11.310302734375, -10.7177734375, -10.125244140625, -9.53271484375, -8.940185546875, -8.34765625, -7.755126953125, -7.16259765625, -6.570068359375, -5.9775390625, -5.385009765625, -4.79248046875, -4.199951171875, -3.607421875, -3.014892578125, -2.42236328125, -1.829833984375, -1.2373046875, -0.644775390625, -0.05224609375, 0.540283203125, 1.1328125, 1.725341796875, 2.31787109375, 2.910400390625, 3.5029296875, 4.095458984375, 4.68798828125, 5.280517578125, 5.873046875, 6.465576171875, 7.05810546875, 7.650634765625, 8.2431640625, 8.835693359375, 9.42822265625, 10.020751953125, 10.61328125, 11.205810546875, 11.79833984375, 12.390869140625, 12.9833984375, 13.575927734375, 14.16845703125, 14.760986328125, 15.353515625, 15.946044921875, 16.53857421875, 17.131103515625, 17.7236328125, 18.316162109375, 18.90869140625, 19.501220703125, 20.09375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 9.0, 13.0, 30.0, 33.0, 62.0, 78.0, 94.0, 168.0, 277.0, 374.0, 580.0, 943.0, 1417.0, 2203.0, 3224.0, 4977.0, 7682.0, 11988.0, 18282.0, 28983.0, 43959.0, 64437.0, 90665.0, 117510.0, 136148.0, 135174.0, 114243.0, 86526.0, 61511.0, 41110.0, 27008.0, 17240.0, 11104.0, 7167.0, 4586.0, 2941.0, 1964.0, 1262.0, 871.0, 574.0, 377.0, 244.0, 169.0, 92.0, 97.0, 44.0, 42.0, 21.0, 14.0, 13.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0], "bins": [-2.431640625, -2.3577880859375, -2.283935546875, -2.2100830078125, -2.13623046875, -2.0623779296875, -1.988525390625, -1.9146728515625, -1.8408203125, -1.7669677734375, -1.693115234375, -1.6192626953125, -1.54541015625, -1.4715576171875, -1.397705078125, -1.3238525390625, -1.25, -1.1761474609375, -1.102294921875, -1.0284423828125, -0.95458984375, -0.8807373046875, -0.806884765625, -0.7330322265625, -0.6591796875, -0.5853271484375, -0.511474609375, -0.4376220703125, -0.36376953125, -0.2899169921875, -0.216064453125, -0.1422119140625, -0.068359375, 0.0054931640625, 0.079345703125, 0.1531982421875, 0.22705078125, 0.3009033203125, 0.374755859375, 0.4486083984375, 0.5224609375, 0.5963134765625, 0.670166015625, 0.7440185546875, 0.81787109375, 0.8917236328125, 0.965576171875, 1.0394287109375, 1.11328125, 1.1871337890625, 1.260986328125, 1.3348388671875, 1.40869140625, 1.4825439453125, 1.556396484375, 1.6302490234375, 1.7041015625, 1.7779541015625, 1.851806640625, 1.9256591796875, 1.99951171875, 2.0733642578125, 2.147216796875, 2.2210693359375, 2.294921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 10.0, 7.0, 10.0, 3.0, 11.0, 13.0, 10.0, 13.0, 21.0, 26.0, 24.0, 25.0, 33.0, 19.0, 24.0, 36.0, 27.0, 42.0, 40.0, 29.0, 42.0, 29.0, 37.0, 37.0, 21.0, 47.0, 43.0, 30.0, 38.0, 36.0, 22.0, 27.0, 19.0, 20.0, 18.0, 16.0, 20.0, 7.0, 11.0, 4.0, 10.0, 9.0, 6.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.451904296875, -9.13818359375, -8.824462890625, -8.5107421875, -8.197021484375, -7.88330078125, -7.569580078125, -7.255859375, -6.942138671875, -6.62841796875, -6.314697265625, -6.0009765625, -5.687255859375, -5.37353515625, -5.059814453125, -4.74609375, -4.432373046875, -4.11865234375, -3.804931640625, -3.4912109375, -3.177490234375, -2.86376953125, -2.550048828125, -2.236328125, -1.922607421875, -1.60888671875, -1.295166015625, -0.9814453125, -0.667724609375, -0.35400390625, -0.040283203125, 0.2734375, 0.587158203125, 0.90087890625, 1.214599609375, 1.5283203125, 1.842041015625, 2.15576171875, 2.469482421875, 2.783203125, 3.096923828125, 3.41064453125, 3.724365234375, 4.0380859375, 4.351806640625, 4.66552734375, 4.979248046875, 5.29296875, 5.606689453125, 5.92041015625, 6.234130859375, 6.5478515625, 6.861572265625, 7.17529296875, 7.489013671875, 7.802734375, 8.116455078125, 8.43017578125, 8.743896484375, 9.0576171875, 9.371337890625, 9.68505859375, 9.998779296875, 10.3125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 14.0, 18.0, 12.0, 31.0, 34.0, 36.0, 52.0, 56.0, 86.0, 92.0, 94.0, 155.0, 178.0, 210.0, 296.0, 410.0, 560.0, 836.0, 1239.0, 2233.0, 4446.0, 11282.0, 34994.0, 133127.0, 384414.0, 327399.0, 99560.0, 27387.0, 9319.0, 3884.0, 2006.0, 1125.0, 777.0, 513.0, 378.0, 288.0, 214.0, 162.0, 156.0, 104.0, 92.0, 62.0, 44.0, 41.0, 28.0, 25.0, 16.0, 14.0, 12.0, 14.0, 3.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.7333984375, -0.7104034423828125, -0.687408447265625, -0.6644134521484375, -0.64141845703125, -0.6184234619140625, -0.595428466796875, -0.5724334716796875, -0.5494384765625, -0.5264434814453125, -0.503448486328125, -0.4804534912109375, -0.45745849609375, -0.4344635009765625, -0.411468505859375, -0.3884735107421875, -0.365478515625, -0.3424835205078125, -0.319488525390625, -0.2964935302734375, -0.27349853515625, -0.2505035400390625, -0.227508544921875, -0.2045135498046875, -0.1815185546875, -0.1585235595703125, -0.135528564453125, -0.1125335693359375, -0.08953857421875, -0.0665435791015625, -0.043548583984375, -0.0205535888671875, 0.00244140625, 0.0254364013671875, 0.048431396484375, 0.0714263916015625, 0.09442138671875, 0.1174163818359375, 0.140411376953125, 0.1634063720703125, 0.1864013671875, 0.2093963623046875, 0.232391357421875, 0.2553863525390625, 0.27838134765625, 0.3013763427734375, 0.324371337890625, 0.3473663330078125, 0.370361328125, 0.3933563232421875, 0.416351318359375, 0.4393463134765625, 0.46234130859375, 0.4853363037109375, 0.508331298828125, 0.5313262939453125, 0.5543212890625, 0.5773162841796875, 0.600311279296875, 0.6233062744140625, 0.64630126953125, 0.6692962646484375, 0.692291259765625, 0.7152862548828125, 0.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 18.0, 37.0, 35.0, 53.0, 73.0, 107.0, 107.0, 114.0, 122.0, 87.0, 81.0, 50.0, 28.0, 17.0, 20.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.908884435892105e-05, -7.628090679645538e-05, -7.347296923398972e-05, -7.066503167152405e-05, -6.785709410905838e-05, -6.504915654659271e-05, -6.224121898412704e-05, -5.943328142166138e-05, -5.662534385919571e-05, -5.381740629673004e-05, -5.1009468734264374e-05, -4.8201531171798706e-05, -4.539359360933304e-05, -4.258565604686737e-05, -3.97777184844017e-05, -3.6969780921936035e-05, -3.416184335947037e-05, -3.13539057970047e-05, -2.8545968234539032e-05, -2.5738030672073364e-05, -2.2930093109607697e-05, -2.012215554714203e-05, -1.731421798467636e-05, -1.4506280422210693e-05, -1.1698342859745026e-05, -8.890405297279358e-06, -6.08246773481369e-06, -3.2745301723480225e-06, -4.6659260988235474e-07, 2.341344952583313e-06, 5.149282515048981e-06, 7.957220077514648e-06, 1.0765157639980316e-05, 1.3573095202445984e-05, 1.638103276491165e-05, 1.918897032737732e-05, 2.1996907889842987e-05, 2.4804845452308655e-05, 2.7612783014774323e-05, 3.042072057723999e-05, 3.322865813970566e-05, 3.6036595702171326e-05, 3.8844533264636993e-05, 4.165247082710266e-05, 4.446040838956833e-05, 4.7268345952033997e-05, 5.0076283514499664e-05, 5.288422107696533e-05, 5.5692158639431e-05, 5.850009620189667e-05, 6.130803376436234e-05, 6.4115971326828e-05, 6.692390888929367e-05, 6.973184645175934e-05, 7.2539784014225e-05, 7.534772157669067e-05, 7.815565913915634e-05, 8.096359670162201e-05, 8.377153426408768e-05, 8.657947182655334e-05, 8.938740938901901e-05, 9.219534695148468e-05, 9.500328451395035e-05, 9.781122207641602e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 21.0, 25.0, 30.0, 47.0, 53.0, 86.0, 120.0, 162.0, 233.0, 349.0, 493.0, 752.0, 1140.0, 1896.0, 3049.0, 5352.0, 9559.0, 17340.0, 34266.0, 68869.0, 138628.0, 237377.0, 239910.0, 141206.0, 70877.0, 35108.0, 17952.0, 9640.0, 5298.0, 3162.0, 1856.0, 1237.0, 780.0, 512.0, 362.0, 249.0, 160.0, 110.0, 80.0, 53.0, 34.0, 43.0, 20.0, 10.0, 8.0, 12.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74658203125, -0.721710205078125, -0.69683837890625, -0.671966552734375, -0.6470947265625, -0.622222900390625, -0.59735107421875, -0.572479248046875, -0.547607421875, -0.522735595703125, -0.49786376953125, -0.472991943359375, -0.4481201171875, -0.423248291015625, -0.39837646484375, -0.373504638671875, -0.3486328125, -0.323760986328125, -0.29888916015625, -0.274017333984375, -0.2491455078125, -0.224273681640625, -0.19940185546875, -0.174530029296875, -0.149658203125, -0.124786376953125, -0.09991455078125, -0.075042724609375, -0.0501708984375, -0.025299072265625, -0.00042724609375, 0.024444580078125, 0.04931640625, 0.074188232421875, 0.09906005859375, 0.123931884765625, 0.1488037109375, 0.173675537109375, 0.19854736328125, 0.223419189453125, 0.248291015625, 0.273162841796875, 0.29803466796875, 0.322906494140625, 0.3477783203125, 0.372650146484375, 0.39752197265625, 0.422393798828125, 0.447265625, 0.472137451171875, 0.49700927734375, 0.521881103515625, 0.5467529296875, 0.571624755859375, 0.59649658203125, 0.621368408203125, 0.646240234375, 0.671112060546875, 0.69598388671875, 0.720855712890625, 0.7457275390625, 0.770599365234375, 0.79547119140625, 0.820343017578125, 0.84521484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 0.0, 2.0, 2.0, 10.0, 4.0, 10.0, 6.0, 16.0, 6.0, 20.0, 23.0, 22.0, 40.0, 41.0, 44.0, 65.0, 55.0, 65.0, 81.0, 76.0, 57.0, 69.0, 48.0, 38.0, 42.0, 31.0, 24.0, 21.0, 13.0, 10.0, 14.0, 4.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24787521362304688, -0.23818206787109375, -0.22848892211914062, -0.2187957763671875, -0.20910263061523438, -0.19940948486328125, -0.18971633911132812, -0.180023193359375, -0.17033004760742188, -0.16063690185546875, -0.15094375610351562, -0.1412506103515625, -0.13155746459960938, -0.12186431884765625, -0.11217117309570312, -0.10247802734375, -0.09278488159179688, -0.08309173583984375, -0.07339859008789062, -0.0637054443359375, -0.054012298583984375, -0.04431915283203125, -0.034626007080078125, -0.024932861328125, -0.015239715576171875, -0.00554656982421875, 0.004146575927734375, 0.0138397216796875, 0.023532867431640625, 0.03322601318359375, 0.042919158935546875, 0.0526123046875, 0.062305450439453125, 0.07199859619140625, 0.08169174194335938, 0.0913848876953125, 0.10107803344726562, 0.11077117919921875, 0.12046432495117188, 0.130157470703125, 0.13985061645507812, 0.14954376220703125, 0.15923690795898438, 0.1689300537109375, 0.17862319946289062, 0.18831634521484375, 0.19800949096679688, 0.20770263671875, 0.21739578247070312, 0.22708892822265625, 0.23678207397460938, 0.2464752197265625, 0.2561683654785156, 0.26586151123046875, 0.2755546569824219, 0.285247802734375, 0.2949409484863281, 0.30463409423828125, 0.3143272399902344, 0.3240203857421875, 0.3337135314941406, 0.34340667724609375, 0.3530998229980469, 0.36279296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 14.0, 12.0, 18.0, 20.0, 15.0, 26.0, 36.0, 35.0, 38.0, 35.0, 50.0, 33.0, 53.0, 53.0, 56.0, 45.0, 57.0, 51.0, 38.0, 53.0, 47.0, 23.0, 27.0, 30.0, 25.0, 18.0, 13.0, 14.0, 15.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.235774040222168, -14.71944522857666, -14.203116416931152, -13.686787605285645, -13.170458793640137, -12.654129981994629, -12.137802124023438, -11.62147331237793, -11.105144500732422, -10.588815689086914, -10.072486877441406, -9.556158065795898, -9.03982925415039, -8.523500442504883, -8.007171630859375, -7.490843296051025, -6.974514007568359, -6.458185195922852, -5.941856384277344, -5.425527572631836, -4.909198760986328, -4.39286994934082, -3.8765416145324707, -3.360212802886963, -2.843883991241455, -2.3275551795959473, -1.811226487159729, -1.2948977947235107, -0.7785689830780029, -0.2622401714324951, 0.2540884017944336, 0.7704172134399414, 1.2867469787597656, 1.8030757904052734, 2.3194046020507812, 2.83573317527771, 3.3520619869232178, 3.8683907985687256, 4.384719371795654, 4.901048183441162, 5.41737699508667, 5.933705806732178, 6.4500346183776855, 6.966362953186035, 7.482691764831543, 7.999020576477051, 8.515349388122559, 9.031678199768066, 9.548007011413574, 10.064335823059082, 10.58066463470459, 11.096993446350098, 11.613322257995605, 12.129651069641113, 12.645978927612305, 13.162307739257812, 13.67863655090332, 14.194965362548828, 14.711294174194336, 15.227622985839844, 15.743951797485352, 16.26028060913086, 16.776609420776367, 17.292938232421875, 17.809267044067383]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 13.0, 10.0, 19.0, 10.0, 12.0, 13.0, 26.0, 23.0, 27.0, 45.0, 35.0, 35.0, 40.0, 49.0, 43.0, 54.0, 49.0, 45.0, 55.0, 43.0, 43.0, 33.0, 37.0, 38.0, 32.0, 27.0, 20.0, 18.0, 20.0, 16.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.608219146728516, -17.03321647644043, -16.458213806152344, -15.883211135864258, -15.308208465576172, -14.733205795288086, -14.158204078674316, -13.58320140838623, -13.008198738098145, -12.433196067810059, -11.858193397521973, -11.283190727233887, -10.708189010620117, -10.133186340332031, -9.558183670043945, -8.98318099975586, -8.408178329467773, -7.8331756591796875, -7.258172988891602, -6.683170795440674, -6.108168125152588, -5.533165454864502, -4.958163261413574, -4.383160591125488, -3.8081579208374023, -3.2331552505493164, -2.6581528186798096, -2.0831503868103027, -1.5081477165222168, -0.9331450462341309, -0.358142614364624, 0.2168598175048828, 0.7918643951416016, 1.366866946220398, 1.9418694972991943, 2.516871929168701, 3.091874599456787, 3.666877269744873, 4.241879463195801, 4.816882133483887, 5.391884803771973, 5.966887474060059, 6.5418901443481445, 7.116892337799072, 7.691895008087158, 8.266897201538086, 8.841899871826172, 9.416902542114258, 9.991905212402344, 10.56690788269043, 11.141910552978516, 11.716913223266602, 12.291915893554688, 12.866918563842773, 13.441920280456543, 14.016922950744629, 14.591925621032715, 15.1669282913208, 15.741930961608887, 16.316932678222656, 16.891935348510742, 17.466938018798828, 18.041940689086914, 18.616943359375, 19.191946029663086]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 13.0, 17.0, 31.0, 49.0, 84.0, 138.0, 213.0, 367.0, 560.0, 956.0, 1445.0, 2313.0, 3618.0, 5623.0, 8311.0, 12238.0, 18150.0, 25494.0, 35163.0, 46850.0, 59776.0, 72305.0, 84396.0, 92681.0, 95212.0, 92784.0, 85785.0, 73866.0, 61221.0, 48493.0, 36882.0, 26671.0, 18923.0, 13032.0, 8888.0, 5769.0, 3754.0, 2346.0, 1565.0, 996.0, 645.0, 366.0, 226.0, 126.0, 88.0, 44.0, 27.0, 21.0, 18.0, 7.0, 6.0, 2.0, 2.0, 1.0], "bins": [-8.6875, -8.4361572265625, -8.184814453125, -7.9334716796875, -7.68212890625, -7.4307861328125, -7.179443359375, -6.9281005859375, -6.6767578125, -6.4254150390625, -6.174072265625, -5.9227294921875, -5.67138671875, -5.4200439453125, -5.168701171875, -4.9173583984375, -4.666015625, -4.4146728515625, -4.163330078125, -3.9119873046875, -3.66064453125, -3.4093017578125, -3.157958984375, -2.9066162109375, -2.6552734375, -2.4039306640625, -2.152587890625, -1.9012451171875, -1.64990234375, -1.3985595703125, -1.147216796875, -0.8958740234375, -0.64453125, -0.3931884765625, -0.141845703125, 0.1094970703125, 0.36083984375, 0.6121826171875, 0.863525390625, 1.1148681640625, 1.3662109375, 1.6175537109375, 1.868896484375, 2.1202392578125, 2.37158203125, 2.6229248046875, 2.874267578125, 3.1256103515625, 3.376953125, 3.6282958984375, 3.879638671875, 4.1309814453125, 4.38232421875, 4.6336669921875, 4.885009765625, 5.1363525390625, 5.3876953125, 5.6390380859375, 5.890380859375, 6.1417236328125, 6.39306640625, 6.6444091796875, 6.895751953125, 7.1470947265625, 7.3984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 11.0, 7.0, 4.0, 8.0, 9.0, 13.0, 20.0, 13.0, 13.0, 28.0, 25.0, 26.0, 25.0, 34.0, 37.0, 46.0, 34.0, 38.0, 55.0, 35.0, 54.0, 43.0, 40.0, 42.0, 42.0, 36.0, 38.0, 29.0, 36.0, 24.0, 21.0, 16.0, 27.0, 13.0, 10.0, 12.0, 10.0, 8.0, 8.0, 2.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.28564453125, -15.7275390625, -15.16943359375, -14.611328125, -14.05322265625, -13.4951171875, -12.93701171875, -12.37890625, -11.82080078125, -11.2626953125, -10.70458984375, -10.146484375, -9.58837890625, -9.0302734375, -8.47216796875, -7.9140625, -7.35595703125, -6.7978515625, -6.23974609375, -5.681640625, -5.12353515625, -4.5654296875, -4.00732421875, -3.44921875, -2.89111328125, -2.3330078125, -1.77490234375, -1.216796875, -0.65869140625, -0.1005859375, 0.45751953125, 1.015625, 1.57373046875, 2.1318359375, 2.68994140625, 3.248046875, 3.80615234375, 4.3642578125, 4.92236328125, 5.48046875, 6.03857421875, 6.5966796875, 7.15478515625, 7.712890625, 8.27099609375, 8.8291015625, 9.38720703125, 9.9453125, 10.50341796875, 11.0615234375, 11.61962890625, 12.177734375, 12.73583984375, 13.2939453125, 13.85205078125, 14.41015625, 14.96826171875, 15.5263671875, 16.08447265625, 16.642578125, 17.20068359375, 17.7587890625, 18.31689453125, 18.875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 11.0, 13.0, 19.0, 34.0, 74.0, 87.0, 173.0, 311.0, 479.0, 748.0, 1238.0, 2001.0, 3271.0, 5259.0, 8056.0, 12437.0, 18639.0, 27236.0, 38219.0, 52054.0, 67030.0, 81631.0, 94071.0, 101823.0, 102506.0, 96026.0, 84469.0, 69714.0, 54453.0, 40656.0, 28941.0, 19737.0, 13453.0, 8806.0, 5614.0, 3533.0, 2147.0, 1407.0, 841.0, 542.0, 316.0, 191.0, 111.0, 73.0, 41.0, 24.0, 16.0, 14.0, 9.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.71875, -9.4417724609375, -9.164794921875, -8.8878173828125, -8.61083984375, -8.3338623046875, -8.056884765625, -7.7799072265625, -7.5029296875, -7.2259521484375, -6.948974609375, -6.6719970703125, -6.39501953125, -6.1180419921875, -5.841064453125, -5.5640869140625, -5.287109375, -5.0101318359375, -4.733154296875, -4.4561767578125, -4.17919921875, -3.9022216796875, -3.625244140625, -3.3482666015625, -3.0712890625, -2.7943115234375, -2.517333984375, -2.2403564453125, -1.96337890625, -1.6864013671875, -1.409423828125, -1.1324462890625, -0.85546875, -0.5784912109375, -0.301513671875, -0.0245361328125, 0.25244140625, 0.5294189453125, 0.806396484375, 1.0833740234375, 1.3603515625, 1.6373291015625, 1.914306640625, 2.1912841796875, 2.46826171875, 2.7452392578125, 3.022216796875, 3.2991943359375, 3.576171875, 3.8531494140625, 4.130126953125, 4.4071044921875, 4.68408203125, 4.9610595703125, 5.238037109375, 5.5150146484375, 5.7919921875, 6.0689697265625, 6.345947265625, 6.6229248046875, 6.89990234375, 7.1768798828125, 7.453857421875, 7.7308349609375, 8.0078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 7.0, 13.0, 14.0, 16.0, 17.0, 22.0, 26.0, 18.0, 23.0, 38.0, 36.0, 32.0, 51.0, 45.0, 50.0, 42.0, 37.0, 37.0, 50.0, 44.0, 44.0, 49.0, 41.0, 34.0, 18.0, 31.0, 25.0, 20.0, 20.0, 21.0, 20.0, 15.0, 8.0, 7.0, 10.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.896484375, -10.55078125, -10.205078125, -9.859375, -9.513671875, -9.16796875, -8.822265625, -8.4765625, -8.130859375, -7.78515625, -7.439453125, -7.09375, -6.748046875, -6.40234375, -6.056640625, -5.7109375, -5.365234375, -5.01953125, -4.673828125, -4.328125, -3.982421875, -3.63671875, -3.291015625, -2.9453125, -2.599609375, -2.25390625, -1.908203125, -1.5625, -1.216796875, -0.87109375, -0.525390625, -0.1796875, 0.166015625, 0.51171875, 0.857421875, 1.203125, 1.548828125, 1.89453125, 2.240234375, 2.5859375, 2.931640625, 3.27734375, 3.623046875, 3.96875, 4.314453125, 4.66015625, 5.005859375, 5.3515625, 5.697265625, 6.04296875, 6.388671875, 6.734375, 7.080078125, 7.42578125, 7.771484375, 8.1171875, 8.462890625, 8.80859375, 9.154296875, 9.5, 9.845703125, 10.19140625, 10.537109375, 10.8828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 14.0, 25.0, 52.0, 74.0, 113.0, 183.0, 288.0, 474.0, 768.0, 1292.0, 1981.0, 3080.0, 5082.0, 8177.0, 12622.0, 19392.0, 29477.0, 41516.0, 57425.0, 75010.0, 91465.0, 103860.0, 109592.0, 106993.0, 95929.0, 80514.0, 62869.0, 46381.0, 32674.0, 22172.0, 14251.0, 9205.0, 5943.0, 3629.0, 2268.0, 1407.0, 877.0, 547.0, 332.0, 214.0, 141.0, 74.0, 50.0, 41.0, 27.0, 23.0, 12.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.45703125, -3.357269287109375, -3.25750732421875, -3.157745361328125, -3.0579833984375, -2.958221435546875, -2.85845947265625, -2.758697509765625, -2.658935546875, -2.559173583984375, -2.45941162109375, -2.359649658203125, -2.2598876953125, -2.160125732421875, -2.06036376953125, -1.960601806640625, -1.86083984375, -1.761077880859375, -1.66131591796875, -1.561553955078125, -1.4617919921875, -1.362030029296875, -1.26226806640625, -1.162506103515625, -1.062744140625, -0.962982177734375, -0.86322021484375, -0.763458251953125, -0.6636962890625, -0.563934326171875, -0.46417236328125, -0.364410400390625, -0.2646484375, -0.164886474609375, -0.06512451171875, 0.034637451171875, 0.1343994140625, 0.234161376953125, 0.33392333984375, 0.433685302734375, 0.533447265625, 0.633209228515625, 0.73297119140625, 0.832733154296875, 0.9324951171875, 1.032257080078125, 1.13201904296875, 1.231781005859375, 1.33154296875, 1.431304931640625, 1.53106689453125, 1.630828857421875, 1.7305908203125, 1.830352783203125, 1.93011474609375, 2.029876708984375, 2.129638671875, 2.229400634765625, 2.32916259765625, 2.428924560546875, 2.5286865234375, 2.628448486328125, 2.72821044921875, 2.827972412109375, 2.927734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 10.0, 10.0, 16.0, 12.0, 17.0, 20.0, 27.0, 26.0, 40.0, 34.0, 52.0, 52.0, 54.0, 44.0, 46.0, 54.0, 43.0, 66.0, 54.0, 46.0, 33.0, 43.0, 29.0, 36.0, 19.0, 23.0, 17.0, 16.0, 13.0, 11.0, 7.0, 4.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003731250762939453, -0.00035999715328216553, -0.00034686923027038574, -0.00033374130725860596, -0.00032061338424682617, -0.0003074854612350464, -0.0002943575382232666, -0.0002812296152114868, -0.00026810169219970703, -0.00025497376918792725, -0.00024184584617614746, -0.00022871792316436768, -0.0002155900001525879, -0.0002024620771408081, -0.00018933415412902832, -0.00017620623111724854, -0.00016307830810546875, -0.00014995038509368896, -0.00013682246208190918, -0.0001236945390701294, -0.00011056661605834961, -9.743869304656982e-05, -8.431077003479004e-05, -7.118284702301025e-05, -5.805492401123047e-05, -4.4927000999450684e-05, -3.17990779876709e-05, -1.8671154975891113e-05, -5.543231964111328e-06, 7.584691047668457e-06, 2.0712614059448242e-05, 3.384053707122803e-05, 4.696846008300781e-05, 6.00963830947876e-05, 7.322430610656738e-05, 8.635222911834717e-05, 9.948015213012695e-05, 0.00011260807514190674, 0.00012573599815368652, 0.0001388639211654663, 0.0001519918441772461, 0.00016511976718902588, 0.00017824769020080566, 0.00019137561321258545, 0.00020450353622436523, 0.00021763145923614502, 0.0002307593822479248, 0.0002438873052597046, 0.0002570152282714844, 0.00027014315128326416, 0.00028327107429504395, 0.00029639899730682373, 0.0003095269203186035, 0.0003226548433303833, 0.0003357827663421631, 0.00034891068935394287, 0.00036203861236572266, 0.00037516653537750244, 0.0003882944583892822, 0.000401422381401062, 0.0004145503044128418, 0.0004276782274246216, 0.00044080615043640137, 0.00045393407344818115, 0.00046706199645996094]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 9.0, 18.0, 33.0, 69.0, 76.0, 128.0, 191.0, 330.0, 496.0, 866.0, 1416.0, 2398.0, 4015.0, 6724.0, 11014.0, 17838.0, 28873.0, 44328.0, 63711.0, 87031.0, 109280.0, 122514.0, 125235.0, 115357.0, 95393.0, 72011.0, 50617.0, 33786.0, 21419.0, 13298.0, 8033.0, 4678.0, 3012.0, 1646.0, 1082.0, 623.0, 358.0, 208.0, 169.0, 100.0, 52.0, 28.0, 34.0, 22.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.86328125, -3.7393798828125, -3.615478515625, -3.4915771484375, -3.36767578125, -3.2437744140625, -3.119873046875, -2.9959716796875, -2.8720703125, -2.7481689453125, -2.624267578125, -2.5003662109375, -2.37646484375, -2.2525634765625, -2.128662109375, -2.0047607421875, -1.880859375, -1.7569580078125, -1.633056640625, -1.5091552734375, -1.38525390625, -1.2613525390625, -1.137451171875, -1.0135498046875, -0.8896484375, -0.7657470703125, -0.641845703125, -0.5179443359375, -0.39404296875, -0.2701416015625, -0.146240234375, -0.0223388671875, 0.1015625, 0.2254638671875, 0.349365234375, 0.4732666015625, 0.59716796875, 0.7210693359375, 0.844970703125, 0.9688720703125, 1.0927734375, 1.2166748046875, 1.340576171875, 1.4644775390625, 1.58837890625, 1.7122802734375, 1.836181640625, 1.9600830078125, 2.083984375, 2.2078857421875, 2.331787109375, 2.4556884765625, 2.57958984375, 2.7034912109375, 2.827392578125, 2.9512939453125, 3.0751953125, 3.1990966796875, 3.322998046875, 3.4468994140625, 3.57080078125, 3.6947021484375, 3.818603515625, 3.9425048828125, 4.06640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 9.0, 8.0, 16.0, 15.0, 20.0, 26.0, 22.0, 31.0, 47.0, 40.0, 49.0, 58.0, 49.0, 51.0, 60.0, 63.0, 66.0, 43.0, 60.0, 53.0, 39.0, 32.0, 33.0, 29.0, 14.0, 17.0, 12.0, 5.0, 14.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.439453125, -2.377777099609375, -2.31610107421875, -2.254425048828125, -2.1927490234375, -2.131072998046875, -2.06939697265625, -2.007720947265625, -1.946044921875, -1.884368896484375, -1.82269287109375, -1.761016845703125, -1.6993408203125, -1.637664794921875, -1.57598876953125, -1.514312744140625, -1.45263671875, -1.390960693359375, -1.32928466796875, -1.267608642578125, -1.2059326171875, -1.144256591796875, -1.08258056640625, -1.020904541015625, -0.959228515625, -0.897552490234375, -0.83587646484375, -0.774200439453125, -0.7125244140625, -0.650848388671875, -0.58917236328125, -0.527496337890625, -0.4658203125, -0.404144287109375, -0.34246826171875, -0.280792236328125, -0.2191162109375, -0.157440185546875, -0.09576416015625, -0.034088134765625, 0.027587890625, 0.089263916015625, 0.15093994140625, 0.212615966796875, 0.2742919921875, 0.335968017578125, 0.39764404296875, 0.459320068359375, 0.52099609375, 0.582672119140625, 0.64434814453125, 0.706024169921875, 0.7677001953125, 0.829376220703125, 0.89105224609375, 0.952728271484375, 1.014404296875, 1.076080322265625, 1.13775634765625, 1.199432373046875, 1.2611083984375, 1.322784423828125, 1.38446044921875, 1.446136474609375, 1.5078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 19.0, 16.0, 15.0, 27.0, 25.0, 37.0, 37.0, 34.0, 25.0, 40.0, 39.0, 45.0, 50.0, 48.0, 44.0, 52.0, 40.0, 52.0, 44.0, 38.0, 34.0, 26.0, 27.0, 22.0, 26.0, 23.0, 14.0, 11.0, 11.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.720953941345215, -14.254154205322266, -13.787353515625, -13.32055377960205, -12.853754043579102, -12.386953353881836, -11.920153617858887, -11.453353881835938, -10.986553192138672, -10.519753456115723, -10.052952766418457, -9.586153030395508, -9.119353294372559, -8.65255355834961, -8.185752868652344, -7.7189531326293945, -7.252153396606445, -6.785353183746338, -6.318553447723389, -5.851753234863281, -5.384953498840332, -4.918153285980225, -4.451353073120117, -3.984553098678589, -3.5177531242370605, -3.0509531497955322, -2.584153175354004, -2.1173529624938965, -1.6505529880523682, -1.1837530136108398, -0.7169528007507324, -0.2501528263092041, 0.21664714813232422, 0.6834471821784973, 1.1502472162246704, 1.6170473098754883, 2.0838472843170166, 2.550647258758545, 3.0174474716186523, 3.4842474460601807, 3.951047420501709, 4.417847633361816, 4.884647369384766, 5.351447582244873, 5.8182477951049805, 6.28504753112793, 6.751847743988037, 7.2186479568481445, 7.685447692871094, 8.152247428894043, 8.619048118591309, 9.085847854614258, 9.552647590637207, 10.019447326660156, 10.486248016357422, 10.953047752380371, 11.41984748840332, 11.88664722442627, 12.353447914123535, 12.820247650146484, 13.287047386169434, 13.753847122192383, 14.220647811889648, 14.687447547912598, 15.154248237609863]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 7.0, 7.0, 6.0, 7.0, 14.0, 9.0, 17.0, 18.0, 13.0, 21.0, 34.0, 32.0, 28.0, 37.0, 38.0, 47.0, 54.0, 64.0, 30.0, 49.0, 56.0, 43.0, 54.0, 47.0, 37.0, 25.0, 28.0, 26.0, 17.0, 26.0, 31.0, 13.0, 18.0, 16.0, 8.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.77967071533203, -17.148536682128906, -16.517404556274414, -15.886271476745605, -15.255138397216797, -14.624004364013672, -13.992871284484863, -13.361738204956055, -12.730605125427246, -12.099472045898438, -11.468338966369629, -10.83720588684082, -10.206071853637695, -9.574939727783203, -8.943805694580078, -8.31267261505127, -7.681539535522461, -7.050406455993652, -6.419273376464844, -5.788139820098877, -5.157006740570068, -4.52587366104126, -3.894740343093872, -3.2636070251464844, -2.632473945617676, -2.001340866088867, -1.3702075481414795, -0.7390743494033813, -0.1079411506652832, 0.5231919288635254, 1.154325246810913, 1.7854585647583008, 2.4165916442871094, 3.047724723815918, 3.6788580417633057, 4.309991359710693, 4.941124439239502, 5.5722575187683105, 6.203391075134277, 6.834524154663086, 7.4656572341918945, 8.096790313720703, 8.727923393249512, 9.35905647277832, 9.990190505981445, 10.621322631835938, 11.252456665039062, 11.883589744567871, 12.51472282409668, 13.145855903625488, 13.776988983154297, 14.408122062683105, 15.039255142211914, 15.670389175415039, 16.30152130126953, 16.932655334472656, 17.56378936767578, 18.194923400878906, 18.8260555267334, 19.457189559936523, 20.088321685791016, 20.71945571899414, 21.350587844848633, 21.981721878051758, 22.61285400390625]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 17.0, 15.0, 43.0, 93.0, 128.0, 254.0, 400.0, 739.0, 1259.0, 2130.0, 3587.0, 6121.0, 9847.0, 16083.0, 25238.0, 39372.0, 60384.0, 89104.0, 127647.0, 176091.0, 231642.0, 291078.0, 345135.0, 386214.0, 404904.0, 396291.0, 363837.0, 312891.0, 256054.0, 197169.0, 145344.0, 104094.0, 71348.0, 47318.0, 30959.0, 19903.0, 12267.0, 7693.0, 4668.0, 2823.0, 1629.0, 1002.0, 623.0, 360.0, 209.0, 111.0, 70.0, 47.0, 33.0, 8.0, 5.0, 2.0, 0.0, 1.0, 3.0], "bins": [-11.125, -10.794921875, -10.46484375, -10.134765625, -9.8046875, -9.474609375, -9.14453125, -8.814453125, -8.484375, -8.154296875, -7.82421875, -7.494140625, -7.1640625, -6.833984375, -6.50390625, -6.173828125, -5.84375, -5.513671875, -5.18359375, -4.853515625, -4.5234375, -4.193359375, -3.86328125, -3.533203125, -3.203125, -2.873046875, -2.54296875, -2.212890625, -1.8828125, -1.552734375, -1.22265625, -0.892578125, -0.5625, -0.232421875, 0.09765625, 0.427734375, 0.7578125, 1.087890625, 1.41796875, 1.748046875, 2.078125, 2.408203125, 2.73828125, 3.068359375, 3.3984375, 3.728515625, 4.05859375, 4.388671875, 4.71875, 5.048828125, 5.37890625, 5.708984375, 6.0390625, 6.369140625, 6.69921875, 7.029296875, 7.359375, 7.689453125, 8.01953125, 8.349609375, 8.6796875, 9.009765625, 9.33984375, 9.669921875, 10.0]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 4.0, 10.0, 8.0, 14.0, 17.0, 15.0, 11.0, 15.0, 36.0, 19.0, 39.0, 35.0, 32.0, 43.0, 49.0, 55.0, 41.0, 48.0, 55.0, 53.0, 49.0, 37.0, 36.0, 39.0, 38.0, 29.0, 31.0, 11.0, 28.0, 21.0, 21.0, 10.0, 12.0, 10.0, 7.0, 4.0, 3.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.609375, -15.087890625, -14.56640625, -14.044921875, -13.5234375, -13.001953125, -12.48046875, -11.958984375, -11.4375, -10.916015625, -10.39453125, -9.873046875, -9.3515625, -8.830078125, -8.30859375, -7.787109375, -7.265625, -6.744140625, -6.22265625, -5.701171875, -5.1796875, -4.658203125, -4.13671875, -3.615234375, -3.09375, -2.572265625, -2.05078125, -1.529296875, -1.0078125, -0.486328125, 0.03515625, 0.556640625, 1.078125, 1.599609375, 2.12109375, 2.642578125, 3.1640625, 3.685546875, 4.20703125, 4.728515625, 5.25, 5.771484375, 6.29296875, 6.814453125, 7.3359375, 7.857421875, 8.37890625, 8.900390625, 9.421875, 9.943359375, 10.46484375, 10.986328125, 11.5078125, 12.029296875, 12.55078125, 13.072265625, 13.59375, 14.115234375, 14.63671875, 15.158203125, 15.6796875, 16.201171875, 16.72265625, 17.244140625, 17.765625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 24.0, 32.0, 70.0, 99.0, 201.0, 391.0, 604.0, 1066.0, 1876.0, 3216.0, 5871.0, 9526.0, 15517.0, 25198.0, 39398.0, 60128.0, 88556.0, 125151.0, 171395.0, 222625.0, 276698.0, 325164.0, 363913.0, 383450.0, 382102.0, 359446.0, 320340.0, 270123.0, 217317.0, 164764.0, 120209.0, 85311.0, 57335.0, 37200.0, 23760.0, 14856.0, 8947.0, 5242.0, 3060.0, 1718.0, 1069.0, 563.0, 335.0, 185.0, 102.0, 59.0, 34.0, 10.0, 11.0, 6.0, 5.0, 1.0], "bins": [-12.328125, -11.985107421875, -11.64208984375, -11.299072265625, -10.9560546875, -10.613037109375, -10.27001953125, -9.927001953125, -9.583984375, -9.240966796875, -8.89794921875, -8.554931640625, -8.2119140625, -7.868896484375, -7.52587890625, -7.182861328125, -6.83984375, -6.496826171875, -6.15380859375, -5.810791015625, -5.4677734375, -5.124755859375, -4.78173828125, -4.438720703125, -4.095703125, -3.752685546875, -3.40966796875, -3.066650390625, -2.7236328125, -2.380615234375, -2.03759765625, -1.694580078125, -1.3515625, -1.008544921875, -0.66552734375, -0.322509765625, 0.0205078125, 0.363525390625, 0.70654296875, 1.049560546875, 1.392578125, 1.735595703125, 2.07861328125, 2.421630859375, 2.7646484375, 3.107666015625, 3.45068359375, 3.793701171875, 4.13671875, 4.479736328125, 4.82275390625, 5.165771484375, 5.5087890625, 5.851806640625, 6.19482421875, 6.537841796875, 6.880859375, 7.223876953125, 7.56689453125, 7.909912109375, 8.2529296875, 8.595947265625, 8.93896484375, 9.281982421875, 9.625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 10.0, 11.0, 15.0, 16.0, 24.0, 34.0, 29.0, 29.0, 58.0, 60.0, 87.0, 107.0, 101.0, 129.0, 138.0, 133.0, 153.0, 160.0, 166.0, 188.0, 183.0, 212.0, 193.0, 213.0, 154.0, 168.0, 176.0, 146.0, 156.0, 137.0, 109.0, 96.0, 82.0, 80.0, 71.0, 43.0, 30.0, 36.0, 25.0, 23.0, 23.0, 12.0, 15.0, 8.0, 5.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.29461669921875, -6.0892333984375, -5.88385009765625, -5.678466796875, -5.47308349609375, -5.2677001953125, -5.06231689453125, -4.85693359375, -4.65155029296875, -4.4461669921875, -4.24078369140625, -4.035400390625, -3.83001708984375, -3.6246337890625, -3.41925048828125, -3.2138671875, -3.00848388671875, -2.8031005859375, -2.59771728515625, -2.392333984375, -2.18695068359375, -1.9815673828125, -1.77618408203125, -1.57080078125, -1.36541748046875, -1.1600341796875, -0.95465087890625, -0.749267578125, -0.54388427734375, -0.3385009765625, -0.13311767578125, 0.072265625, 0.27764892578125, 0.4830322265625, 0.68841552734375, 0.893798828125, 1.09918212890625, 1.3045654296875, 1.50994873046875, 1.71533203125, 1.92071533203125, 2.1260986328125, 2.33148193359375, 2.536865234375, 2.74224853515625, 2.9476318359375, 3.15301513671875, 3.3583984375, 3.56378173828125, 3.7691650390625, 3.97454833984375, 4.179931640625, 4.38531494140625, 4.5906982421875, 4.79608154296875, 5.00146484375, 5.20684814453125, 5.4122314453125, 5.61761474609375, 5.822998046875, 6.02838134765625, 6.2337646484375, 6.43914794921875, 6.64453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 8.0, 9.0, 9.0, 15.0, 21.0, 30.0, 23.0, 23.0, 41.0, 35.0, 36.0, 42.0, 44.0, 42.0, 47.0, 61.0, 42.0, 45.0, 45.0, 48.0, 41.0, 29.0, 35.0, 32.0, 28.0, 31.0, 17.0, 29.0, 14.0, 14.0, 15.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.612018585205078, -17.076082229614258, -16.540143966674805, -16.004207611083984, -15.468269348144531, -14.932332992553711, -14.396395683288574, -13.860458374023438, -13.3245210647583, -12.788583755493164, -12.252646446228027, -11.71670913696289, -11.18077278137207, -10.644834518432617, -10.108898162841797, -9.57296085357666, -9.037023544311523, -8.501086235046387, -7.96514892578125, -7.4292120933532715, -6.893274784088135, -6.357337474822998, -5.8214006423950195, -5.285463333129883, -4.749526023864746, -4.213588714599609, -3.6776516437530518, -3.141714572906494, -2.6057772636413574, -2.0698399543762207, -1.533902883529663, -0.9979658126831055, -0.46203041076660156, 0.0739067792892456, 0.6098439693450928, 1.14578115940094, 1.681718349456787, 2.217655658721924, 2.7535927295684814, 3.289529800415039, 3.825467109680176, 4.3614044189453125, 4.897341728210449, 5.433278560638428, 5.9692158699035645, 6.505153179168701, 7.04109001159668, 7.577027320861816, 8.112964630126953, 8.64890193939209, 9.184839248657227, 9.720776557922363, 10.2567138671875, 10.79265022277832, 11.328587532043457, 11.864524841308594, 12.40046215057373, 12.936399459838867, 13.472336769104004, 14.00827407836914, 14.544210433959961, 15.080148696899414, 15.616085052490234, 16.152023315429688, 16.687959671020508]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 3.0, 7.0, 9.0, 11.0, 14.0, 21.0, 25.0, 27.0, 30.0, 32.0, 32.0, 38.0, 43.0, 49.0, 39.0, 42.0, 53.0, 59.0, 52.0, 55.0, 47.0, 42.0, 33.0, 39.0, 42.0, 26.0, 24.0, 18.0, 20.0, 17.0, 11.0, 7.0, 7.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.404544830322266, -18.736053466796875, -18.067562103271484, -17.399070739746094, -16.730579376220703, -16.062088012695312, -15.393597602844238, -14.725106239318848, -14.056614875793457, -13.388123512268066, -12.719632148742676, -12.051141738891602, -11.382650375366211, -10.71415901184082, -10.04566764831543, -9.377176284790039, -8.708684921264648, -8.040193557739258, -7.371702194213867, -6.703211307525635, -6.034719944000244, -5.3662285804748535, -4.697737693786621, -4.0292463302612305, -3.36075496673584, -2.692263603210449, -2.0237724781036377, -1.3552813529968262, -0.6867899894714355, -0.018298625946044922, 0.6501922607421875, 1.3186836242675781, 1.987173080444336, 2.6556644439697266, 3.324155569076538, 3.9926466941833496, 4.66113805770874, 5.329629421234131, 5.998120307922363, 6.666611671447754, 7.3351030349731445, 8.003594398498535, 8.672085762023926, 9.340576171875, 10.00906753540039, 10.677558898925781, 11.346050262451172, 12.014541625976562, 12.683032989501953, 13.351524353027344, 14.020015716552734, 14.688507080078125, 15.356998443603516, 16.025489807128906, 16.693981170654297, 17.362472534179688, 18.030963897705078, 18.69945526123047, 19.36794662475586, 20.03643798828125, 20.70492935180664, 21.37342071533203, 22.041912078857422, 22.710403442382812, 23.37889289855957]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 18.0, 36.0, 36.0, 52.0, 76.0, 134.0, 220.0, 339.0, 502.0, 822.0, 1313.0, 1917.0, 2989.0, 4796.0, 7474.0, 12010.0, 18644.0, 29426.0, 45755.0, 69854.0, 101362.0, 132664.0, 150358.0, 139694.0, 109386.0, 77183.0, 51500.0, 32880.0, 20900.0, 13149.0, 8241.0, 5334.0, 3443.0, 2153.0, 1406.0, 871.0, 586.0, 348.0, 235.0, 155.0, 106.0, 68.0, 48.0, 22.0, 12.0, 10.0, 9.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.55072021484375, -2.4725341796875, -2.39434814453125, -2.316162109375, -2.23797607421875, -2.1597900390625, -2.08160400390625, -2.00341796875, -1.92523193359375, -1.8470458984375, -1.76885986328125, -1.690673828125, -1.61248779296875, -1.5343017578125, -1.45611572265625, -1.3779296875, -1.29974365234375, -1.2215576171875, -1.14337158203125, -1.065185546875, -0.98699951171875, -0.9088134765625, -0.83062744140625, -0.75244140625, -0.67425537109375, -0.5960693359375, -0.51788330078125, -0.439697265625, -0.36151123046875, -0.2833251953125, -0.20513916015625, -0.126953125, -0.04876708984375, 0.0294189453125, 0.10760498046875, 0.185791015625, 0.26397705078125, 0.3421630859375, 0.42034912109375, 0.49853515625, 0.57672119140625, 0.6549072265625, 0.73309326171875, 0.811279296875, 0.88946533203125, 0.9676513671875, 1.04583740234375, 1.1240234375, 1.20220947265625, 1.2803955078125, 1.35858154296875, 1.436767578125, 1.51495361328125, 1.5931396484375, 1.67132568359375, 1.74951171875, 1.82769775390625, 1.9058837890625, 1.98406982421875, 2.062255859375, 2.14044189453125, 2.2186279296875, 2.29681396484375, 2.375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 7.0, 3.0, 6.0, 11.0, 18.0, 22.0, 18.0, 16.0, 27.0, 34.0, 35.0, 36.0, 35.0, 32.0, 26.0, 28.0, 57.0, 61.0, 53.0, 36.0, 52.0, 48.0, 45.0, 41.0, 32.0, 30.0, 32.0, 26.0, 18.0, 27.0, 14.0, 19.0, 10.0, 6.0, 13.0, 6.0, 0.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.71875, -19.0908203125, -18.462890625, -17.8349609375, -17.20703125, -16.5791015625, -15.951171875, -15.3232421875, -14.6953125, -14.0673828125, -13.439453125, -12.8115234375, -12.18359375, -11.5556640625, -10.927734375, -10.2998046875, -9.671875, -9.0439453125, -8.416015625, -7.7880859375, -7.16015625, -6.5322265625, -5.904296875, -5.2763671875, -4.6484375, -4.0205078125, -3.392578125, -2.7646484375, -2.13671875, -1.5087890625, -0.880859375, -0.2529296875, 0.375, 1.0029296875, 1.630859375, 2.2587890625, 2.88671875, 3.5146484375, 4.142578125, 4.7705078125, 5.3984375, 6.0263671875, 6.654296875, 7.2822265625, 7.91015625, 8.5380859375, 9.166015625, 9.7939453125, 10.421875, 11.0498046875, 11.677734375, 12.3056640625, 12.93359375, 13.5615234375, 14.189453125, 14.8173828125, 15.4453125, 16.0732421875, 16.701171875, 17.3291015625, 17.95703125, 18.5849609375, 19.212890625, 19.8408203125, 20.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 14.0, 24.0, 41.0, 58.0, 109.0, 186.0, 251.0, 428.0, 643.0, 1173.0, 1754.0, 2914.0, 4720.0, 7662.0, 12766.0, 20998.0, 33836.0, 53282.0, 80444.0, 113255.0, 142361.0, 150591.0, 132480.0, 100865.0, 69997.0, 44984.0, 28104.0, 17318.0, 10493.0, 6395.0, 3956.0, 2406.0, 1496.0, 906.0, 612.0, 340.0, 256.0, 148.0, 104.0, 62.0, 43.0, 19.0, 22.0, 7.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.7216796875, -2.634765625, -2.5478515625, -2.4609375, -2.3740234375, -2.287109375, -2.2001953125, -2.11328125, -2.0263671875, -1.939453125, -1.8525390625, -1.765625, -1.6787109375, -1.591796875, -1.5048828125, -1.41796875, -1.3310546875, -1.244140625, -1.1572265625, -1.0703125, -0.9833984375, -0.896484375, -0.8095703125, -0.72265625, -0.6357421875, -0.548828125, -0.4619140625, -0.375, -0.2880859375, -0.201171875, -0.1142578125, -0.02734375, 0.0595703125, 0.146484375, 0.2333984375, 0.3203125, 0.4072265625, 0.494140625, 0.5810546875, 0.66796875, 0.7548828125, 0.841796875, 0.9287109375, 1.015625, 1.1025390625, 1.189453125, 1.2763671875, 1.36328125, 1.4501953125, 1.537109375, 1.6240234375, 1.7109375, 1.7978515625, 1.884765625, 1.9716796875, 2.05859375, 2.1455078125, 2.232421875, 2.3193359375, 2.40625, 2.4931640625, 2.580078125, 2.6669921875, 2.75390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 11.0, 8.0, 25.0, 18.0, 21.0, 28.0, 25.0, 42.0, 39.0, 39.0, 34.0, 46.0, 35.0, 36.0, 44.0, 38.0, 58.0, 42.0, 50.0, 53.0, 32.0, 33.0, 41.0, 29.0, 21.0, 13.0, 18.0, 20.0, 14.0, 14.0, 11.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8515625, -11.423583984375, -10.99560546875, -10.567626953125, -10.1396484375, -9.711669921875, -9.28369140625, -8.855712890625, -8.427734375, -7.999755859375, -7.57177734375, -7.143798828125, -6.7158203125, -6.287841796875, -5.85986328125, -5.431884765625, -5.00390625, -4.575927734375, -4.14794921875, -3.719970703125, -3.2919921875, -2.864013671875, -2.43603515625, -2.008056640625, -1.580078125, -1.152099609375, -0.72412109375, -0.296142578125, 0.1318359375, 0.559814453125, 0.98779296875, 1.415771484375, 1.84375, 2.271728515625, 2.69970703125, 3.127685546875, 3.5556640625, 3.983642578125, 4.41162109375, 4.839599609375, 5.267578125, 5.695556640625, 6.12353515625, 6.551513671875, 6.9794921875, 7.407470703125, 7.83544921875, 8.263427734375, 8.69140625, 9.119384765625, 9.54736328125, 9.975341796875, 10.4033203125, 10.831298828125, 11.25927734375, 11.687255859375, 12.115234375, 12.543212890625, 12.97119140625, 13.399169921875, 13.8271484375, 14.255126953125, 14.68310546875, 15.111083984375, 15.5390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 19.0, 25.0, 24.0, 38.0, 72.0, 87.0, 99.0, 182.0, 267.0, 383.0, 618.0, 963.0, 1486.0, 2481.0, 4180.0, 7021.0, 12280.0, 21670.0, 38974.0, 68937.0, 116190.0, 175531.0, 200601.0, 159245.0, 100852.0, 58696.0, 32836.0, 18763.0, 10530.0, 6023.0, 3502.0, 2177.0, 1337.0, 826.0, 533.0, 331.0, 222.0, 162.0, 100.0, 75.0, 67.0, 37.0, 40.0, 17.0, 10.0, 14.0, 6.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.30859375, -0.29986572265625, -0.2911376953125, -0.28240966796875, -0.273681640625, -0.26495361328125, -0.2562255859375, -0.24749755859375, -0.23876953125, -0.23004150390625, -0.2213134765625, -0.21258544921875, -0.203857421875, -0.19512939453125, -0.1864013671875, -0.17767333984375, -0.1689453125, -0.16021728515625, -0.1514892578125, -0.14276123046875, -0.134033203125, -0.12530517578125, -0.1165771484375, -0.10784912109375, -0.09912109375, -0.09039306640625, -0.0816650390625, -0.07293701171875, -0.064208984375, -0.05548095703125, -0.0467529296875, -0.03802490234375, -0.029296875, -0.02056884765625, -0.0118408203125, -0.00311279296875, 0.005615234375, 0.01434326171875, 0.0230712890625, 0.03179931640625, 0.04052734375, 0.04925537109375, 0.0579833984375, 0.06671142578125, 0.075439453125, 0.08416748046875, 0.0928955078125, 0.10162353515625, 0.1103515625, 0.11907958984375, 0.1278076171875, 0.13653564453125, 0.145263671875, 0.15399169921875, 0.1627197265625, 0.17144775390625, 0.18017578125, 0.18890380859375, 0.1976318359375, 0.20635986328125, 0.215087890625, 0.22381591796875, 0.2325439453125, 0.24127197265625, 0.25]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 17.0, 9.0, 15.0, 19.0, 27.0, 34.0, 41.0, 30.0, 40.0, 50.0, 61.0, 59.0, 51.0, 46.0, 54.0, 45.0, 56.0, 57.0, 40.0, 37.0, 27.0, 29.0, 31.0, 27.0, 20.0, 18.0, 10.0, 8.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.319287836551666e-05, -4.198029637336731e-05, -4.0767714381217957e-05, -3.9555132389068604e-05, -3.834255039691925e-05, -3.71299684047699e-05, -3.5917386412620544e-05, -3.470480442047119e-05, -3.349222242832184e-05, -3.2279640436172485e-05, -3.106705844402313e-05, -2.985447645187378e-05, -2.8641894459724426e-05, -2.7429312467575073e-05, -2.621673047542572e-05, -2.5004148483276367e-05, -2.3791566491127014e-05, -2.257898449897766e-05, -2.1366402506828308e-05, -2.0153820514678955e-05, -1.8941238522529602e-05, -1.772865653038025e-05, -1.6516074538230896e-05, -1.5303492546081543e-05, -1.409091055393219e-05, -1.2878328561782837e-05, -1.1665746569633484e-05, -1.0453164577484131e-05, -9.240582585334778e-06, -8.028000593185425e-06, -6.815418601036072e-06, -5.602836608886719e-06, -4.390254616737366e-06, -3.1776726245880127e-06, -1.9650906324386597e-06, -7.525086402893066e-07, 4.600733518600464e-07, 1.6726553440093994e-06, 2.8852373361587524e-06, 4.0978193283081055e-06, 5.3104013204574585e-06, 6.5229833126068115e-06, 7.735565304756165e-06, 8.948147296905518e-06, 1.016072928905487e-05, 1.1373311281204224e-05, 1.2585893273353577e-05, 1.379847526550293e-05, 1.5011057257652283e-05, 1.6223639249801636e-05, 1.743622124195099e-05, 1.8648803234100342e-05, 1.9861385226249695e-05, 2.1073967218399048e-05, 2.22865492105484e-05, 2.3499131202697754e-05, 2.4711713194847107e-05, 2.592429518699646e-05, 2.7136877179145813e-05, 2.8349459171295166e-05, 2.956204116344452e-05, 3.077462315559387e-05, 3.1987205147743225e-05, 3.319978713989258e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 8.0, 11.0, 14.0, 15.0, 22.0, 40.0, 61.0, 81.0, 109.0, 174.0, 248.0, 328.0, 502.0, 789.0, 1305.0, 2162.0, 3487.0, 6412.0, 12354.0, 24739.0, 53296.0, 114416.0, 222790.0, 274244.0, 171004.0, 82197.0, 37733.0, 18222.0, 9222.0, 4917.0, 2781.0, 1752.0, 1034.0, 673.0, 428.0, 308.0, 221.0, 129.0, 95.0, 62.0, 51.0, 35.0, 27.0, 17.0, 14.0, 8.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-0.7900390625, -0.7676467895507812, -0.7452545166015625, -0.7228622436523438, -0.700469970703125, -0.6780776977539062, -0.6556854248046875, -0.6332931518554688, -0.61090087890625, -0.5885086059570312, -0.5661163330078125, -0.5437240600585938, -0.521331787109375, -0.49893951416015625, -0.4765472412109375, -0.45415496826171875, -0.4317626953125, -0.40937042236328125, -0.3869781494140625, -0.36458587646484375, -0.342193603515625, -0.31980133056640625, -0.2974090576171875, -0.27501678466796875, -0.25262451171875, -0.23023223876953125, -0.2078399658203125, -0.18544769287109375, -0.163055419921875, -0.14066314697265625, -0.1182708740234375, -0.09587860107421875, -0.073486328125, -0.05109405517578125, -0.0287017822265625, -0.00630950927734375, 0.016082763671875, 0.03847503662109375, 0.0608673095703125, 0.08325958251953125, 0.10565185546875, 0.12804412841796875, 0.1504364013671875, 0.17282867431640625, 0.195220947265625, 0.21761322021484375, 0.2400054931640625, 0.26239776611328125, 0.2847900390625, 0.30718231201171875, 0.3295745849609375, 0.35196685791015625, 0.374359130859375, 0.39675140380859375, 0.4191436767578125, 0.44153594970703125, 0.46392822265625, 0.48632049560546875, 0.5087127685546875, 0.5311050415039062, 0.553497314453125, 0.5758895874023438, 0.5982818603515625, 0.6206741333007812, 0.64306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 22.0, 23.0, 27.0, 36.0, 55.0, 64.0, 73.0, 83.0, 107.0, 92.0, 71.0, 51.0, 41.0, 42.0, 32.0, 23.0, 23.0, 23.0, 4.0, 17.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.420654296875, -0.4088172912597656, -0.39698028564453125, -0.3851432800292969, -0.3733062744140625, -0.3614692687988281, -0.34963226318359375, -0.3377952575683594, -0.325958251953125, -0.3141212463378906, -0.30228424072265625, -0.2904472351074219, -0.2786102294921875, -0.2667732238769531, -0.25493621826171875, -0.24309921264648438, -0.23126220703125, -0.21942520141601562, -0.20758819580078125, -0.19575119018554688, -0.1839141845703125, -0.17207717895507812, -0.16024017333984375, -0.14840316772460938, -0.136566162109375, -0.12472915649414062, -0.11289215087890625, -0.10105514526367188, -0.0892181396484375, -0.07738113403320312, -0.06554412841796875, -0.053707122802734375, -0.0418701171875, -0.030033111572265625, -0.01819610595703125, -0.006359100341796875, 0.0054779052734375, 0.017314910888671875, 0.02915191650390625, 0.040988922119140625, 0.052825927734375, 0.06466293334960938, 0.07649993896484375, 0.08833694458007812, 0.1001739501953125, 0.11201095581054688, 0.12384796142578125, 0.13568496704101562, 0.14752197265625, 0.15935897827148438, 0.17119598388671875, 0.18303298950195312, 0.1948699951171875, 0.20670700073242188, 0.21854400634765625, 0.23038101196289062, 0.242218017578125, 0.2540550231933594, 0.26589202880859375, 0.2777290344238281, 0.2895660400390625, 0.3014030456542969, 0.31324005126953125, 0.3250770568847656, 0.3369140625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 8.0, 10.0, 11.0, 14.0, 26.0, 24.0, 22.0, 31.0, 40.0, 32.0, 36.0, 51.0, 43.0, 45.0, 57.0, 49.0, 49.0, 43.0, 47.0, 46.0, 41.0, 22.0, 35.0, 35.0, 29.0, 25.0, 27.0, 18.0, 15.0, 16.0, 9.0, 10.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.778034210205078, -17.23383903503418, -16.68964385986328, -16.145448684692383, -15.601253509521484, -15.057058334350586, -14.512862205505371, -13.968667030334473, -13.424471855163574, -12.880276679992676, -12.336081504821777, -11.791886329650879, -11.247690200805664, -10.703495025634766, -10.159299850463867, -9.615104675292969, -9.07090950012207, -8.526714324951172, -7.982519149780273, -7.438323497772217, -6.894128322601318, -6.34993314743042, -5.805737495422363, -5.261542320251465, -4.717347145080566, -4.173151969909668, -3.6289565563201904, -3.084761142730713, -2.5405659675598145, -1.996370792388916, -1.4521753787994385, -0.9079799652099609, -0.3637847900390625, 0.1804105043411255, 0.7246057987213135, 1.2688010931015015, 1.8129963874816895, 2.357191562652588, 2.9013869762420654, 3.445582389831543, 3.9897775650024414, 4.53397274017334, 5.078167915344238, 5.622363567352295, 6.166558742523193, 6.710753917694092, 7.254949569702148, 7.799144744873047, 8.343339920043945, 8.887535095214844, 9.431730270385742, 9.97592544555664, 10.520120620727539, 11.064315795898438, 11.608511924743652, 12.15270709991455, 12.69690227508545, 13.241097450256348, 13.785292625427246, 14.329487800598145, 14.87368392944336, 15.417879104614258, 15.962074279785156, 16.506269454956055, 17.050464630126953]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 3.0, 6.0, 10.0, 11.0, 13.0, 22.0, 24.0, 26.0, 31.0, 32.0, 33.0, 34.0, 44.0, 51.0, 35.0, 46.0, 50.0, 59.0, 50.0, 55.0, 51.0, 41.0, 34.0, 40.0, 40.0, 25.0, 27.0, 20.0, 17.0, 20.0, 10.0, 6.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.389698028564453, -18.723114013671875, -18.05653190612793, -17.38994789123535, -16.723365783691406, -16.056781768798828, -15.390199661254883, -14.723615646362305, -14.05703353881836, -13.390450477600098, -12.723867416381836, -12.057284355163574, -11.390701293945312, -10.72411823272705, -10.057535171508789, -9.390951156616211, -8.72436809539795, -8.057785034179688, -7.391201972961426, -6.724618911743164, -6.058035850524902, -5.391452789306641, -4.724869251251221, -4.058286190032959, -3.3917031288146973, -2.7251200675964355, -2.058537006378174, -1.391953706741333, -0.7253706455230713, -0.05878758430480957, 0.6077957153320312, 1.274378776550293, 1.9409618377685547, 2.6075448989868164, 3.274127960205078, 3.940711259841919, 4.607294082641602, 5.273877143859863, 5.940460681915283, 6.607043743133545, 7.273626804351807, 7.940209865570068, 8.606793403625488, 9.27337646484375, 9.939959526062012, 10.606542587280273, 11.273125648498535, 11.939708709716797, 12.606291770935059, 13.27287483215332, 13.939457893371582, 14.606040954589844, 15.272624015808105, 15.939207077026367, 16.605791091918945, 17.27237319946289, 17.93895721435547, 18.605541229248047, 19.272123336791992, 19.93870735168457, 20.605289459228516, 21.271873474121094, 21.93845558166504, 22.605039596557617, 23.271621704101562]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 28.0, 34.0, 44.0, 69.0, 131.0, 209.0, 390.0, 608.0, 968.0, 1511.0, 2444.0, 3918.0, 5841.0, 8979.0, 13574.0, 19417.0, 27345.0, 37418.0, 49109.0, 61328.0, 75089.0, 85624.0, 92832.0, 93954.0, 91100.0, 83682.0, 72807.0, 59037.0, 46500.0, 35527.0, 25664.0, 18017.0, 12371.0, 8100.0, 5395.0, 3512.0, 2289.0, 1377.0, 888.0, 517.0, 351.0, 211.0, 129.0, 77.0, 46.0, 34.0, 13.0, 19.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.96875, -7.7149658203125, -7.461181640625, -7.2073974609375, -6.95361328125, -6.6998291015625, -6.446044921875, -6.1922607421875, -5.9384765625, -5.6846923828125, -5.430908203125, -5.1771240234375, -4.92333984375, -4.6695556640625, -4.415771484375, -4.1619873046875, -3.908203125, -3.6544189453125, -3.400634765625, -3.1468505859375, -2.89306640625, -2.6392822265625, -2.385498046875, -2.1317138671875, -1.8779296875, -1.6241455078125, -1.370361328125, -1.1165771484375, -0.86279296875, -0.6090087890625, -0.355224609375, -0.1014404296875, 0.15234375, 0.4061279296875, 0.659912109375, 0.9136962890625, 1.16748046875, 1.4212646484375, 1.675048828125, 1.9288330078125, 2.1826171875, 2.4364013671875, 2.690185546875, 2.9439697265625, 3.19775390625, 3.4515380859375, 3.705322265625, 3.9591064453125, 4.212890625, 4.4666748046875, 4.720458984375, 4.9742431640625, 5.22802734375, 5.4818115234375, 5.735595703125, 5.9893798828125, 6.2431640625, 6.4969482421875, 6.750732421875, 7.0045166015625, 7.25830078125, 7.5120849609375, 7.765869140625, 8.0196533203125, 8.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 5.0, 10.0, 11.0, 16.0, 17.0, 26.0, 18.0, 21.0, 30.0, 35.0, 28.0, 38.0, 37.0, 43.0, 44.0, 43.0, 45.0, 48.0, 49.0, 43.0, 55.0, 40.0, 47.0, 31.0, 36.0, 30.0, 20.0, 25.0, 20.0, 16.0, 12.0, 8.0, 8.0, 6.0, 10.0, 5.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.849853515625, -15.21533203125, -14.580810546875, -13.9462890625, -13.311767578125, -12.67724609375, -12.042724609375, -11.408203125, -10.773681640625, -10.13916015625, -9.504638671875, -8.8701171875, -8.235595703125, -7.60107421875, -6.966552734375, -6.33203125, -5.697509765625, -5.06298828125, -4.428466796875, -3.7939453125, -3.159423828125, -2.52490234375, -1.890380859375, -1.255859375, -0.621337890625, 0.01318359375, 0.647705078125, 1.2822265625, 1.916748046875, 2.55126953125, 3.185791015625, 3.8203125, 4.454833984375, 5.08935546875, 5.723876953125, 6.3583984375, 6.992919921875, 7.62744140625, 8.261962890625, 8.896484375, 9.531005859375, 10.16552734375, 10.800048828125, 11.4345703125, 12.069091796875, 12.70361328125, 13.338134765625, 13.97265625, 14.607177734375, 15.24169921875, 15.876220703125, 16.5107421875, 17.145263671875, 17.77978515625, 18.414306640625, 19.048828125, 19.683349609375, 20.31787109375, 20.952392578125, 21.5869140625, 22.221435546875, 22.85595703125, 23.490478515625, 24.125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 12.0, 12.0, 16.0, 37.0, 43.0, 62.0, 121.0, 219.0, 333.0, 500.0, 843.0, 1340.0, 2176.0, 3276.0, 5130.0, 7725.0, 11416.0, 16601.0, 24223.0, 33270.0, 44278.0, 57490.0, 70214.0, 82341.0, 91493.0, 95068.0, 93965.0, 87583.0, 76528.0, 63553.0, 50346.0, 38632.0, 28371.0, 20185.0, 13924.0, 9632.0, 6234.0, 4058.0, 2644.0, 1709.0, 1123.0, 693.0, 437.0, 259.0, 189.0, 97.0, 59.0, 37.0, 23.0, 19.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-8.6953125, -8.4298095703125, -8.164306640625, -7.8988037109375, -7.63330078125, -7.3677978515625, -7.102294921875, -6.8367919921875, -6.5712890625, -6.3057861328125, -6.040283203125, -5.7747802734375, -5.50927734375, -5.2437744140625, -4.978271484375, -4.7127685546875, -4.447265625, -4.1817626953125, -3.916259765625, -3.6507568359375, -3.38525390625, -3.1197509765625, -2.854248046875, -2.5887451171875, -2.3232421875, -2.0577392578125, -1.792236328125, -1.5267333984375, -1.26123046875, -0.9957275390625, -0.730224609375, -0.4647216796875, -0.19921875, 0.0662841796875, 0.331787109375, 0.5972900390625, 0.86279296875, 1.1282958984375, 1.393798828125, 1.6593017578125, 1.9248046875, 2.1903076171875, 2.455810546875, 2.7213134765625, 2.98681640625, 3.2523193359375, 3.517822265625, 3.7833251953125, 4.048828125, 4.3143310546875, 4.579833984375, 4.8453369140625, 5.11083984375, 5.3763427734375, 5.641845703125, 5.9073486328125, 6.1728515625, 6.4383544921875, 6.703857421875, 6.9693603515625, 7.23486328125, 7.5003662109375, 7.765869140625, 8.0313720703125, 8.296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 26.0, 8.0, 16.0, 18.0, 10.0, 24.0, 27.0, 30.0, 28.0, 37.0, 36.0, 37.0, 49.0, 44.0, 36.0, 52.0, 34.0, 29.0, 31.0, 35.0, 34.0, 27.0, 33.0, 42.0, 24.0, 22.0, 27.0, 17.0, 16.0, 17.0, 17.0, 10.0, 10.0, 15.0, 12.0, 8.0, 9.0, 3.0, 8.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.374267578125, -10.02978515625, -9.685302734375, -9.3408203125, -8.996337890625, -8.65185546875, -8.307373046875, -7.962890625, -7.618408203125, -7.27392578125, -6.929443359375, -6.5849609375, -6.240478515625, -5.89599609375, -5.551513671875, -5.20703125, -4.862548828125, -4.51806640625, -4.173583984375, -3.8291015625, -3.484619140625, -3.14013671875, -2.795654296875, -2.451171875, -2.106689453125, -1.76220703125, -1.417724609375, -1.0732421875, -0.728759765625, -0.38427734375, -0.039794921875, 0.3046875, 0.649169921875, 0.99365234375, 1.338134765625, 1.6826171875, 2.027099609375, 2.37158203125, 2.716064453125, 3.060546875, 3.405029296875, 3.74951171875, 4.093994140625, 4.4384765625, 4.782958984375, 5.12744140625, 5.471923828125, 5.81640625, 6.160888671875, 6.50537109375, 6.849853515625, 7.1943359375, 7.538818359375, 7.88330078125, 8.227783203125, 8.572265625, 8.916748046875, 9.26123046875, 9.605712890625, 9.9501953125, 10.294677734375, 10.63916015625, 10.983642578125, 11.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 19.0, 16.0, 29.0, 57.0, 72.0, 136.0, 214.0, 345.0, 598.0, 946.0, 1704.0, 3070.0, 5357.0, 9297.0, 16023.0, 26991.0, 41715.0, 62129.0, 84717.0, 107090.0, 122046.0, 127091.0, 117501.0, 100355.0, 76594.0, 54493.0, 35942.0, 22599.0, 13288.0, 7819.0, 4421.0, 2530.0, 1449.0, 767.0, 454.0, 264.0, 157.0, 89.0, 58.0, 37.0, 23.0, 23.0, 6.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.609344482421875, -3.48626708984375, -3.363189697265625, -3.2401123046875, -3.117034912109375, -2.99395751953125, -2.870880126953125, -2.747802734375, -2.624725341796875, -2.50164794921875, -2.378570556640625, -2.2554931640625, -2.132415771484375, -2.00933837890625, -1.886260986328125, -1.76318359375, -1.640106201171875, -1.51702880859375, -1.393951416015625, -1.2708740234375, -1.147796630859375, -1.02471923828125, -0.901641845703125, -0.778564453125, -0.655487060546875, -0.53240966796875, -0.409332275390625, -0.2862548828125, -0.163177490234375, -0.04010009765625, 0.082977294921875, 0.2060546875, 0.329132080078125, 0.45220947265625, 0.575286865234375, 0.6983642578125, 0.821441650390625, 0.94451904296875, 1.067596435546875, 1.190673828125, 1.313751220703125, 1.43682861328125, 1.559906005859375, 1.6829833984375, 1.806060791015625, 1.92913818359375, 2.052215576171875, 2.17529296875, 2.298370361328125, 2.42144775390625, 2.544525146484375, 2.6676025390625, 2.790679931640625, 2.91375732421875, 3.036834716796875, 3.159912109375, 3.282989501953125, 3.40606689453125, 3.529144287109375, 3.6522216796875, 3.775299072265625, 3.89837646484375, 4.021453857421875, 4.14453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 14.0, 11.0, 16.0, 19.0, 28.0, 42.0, 39.0, 52.0, 53.0, 62.0, 65.0, 57.0, 65.0, 58.0, 54.0, 57.0, 61.0, 36.0, 37.0, 31.0, 29.0, 24.0, 21.0, 20.0, 15.0, 2.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000537872314453125, -0.0005202814936637878, -0.0005026906728744507, -0.0004850998520851135, -0.00046750903129577637, -0.0004499182105064392, -0.00043232738971710205, -0.0004147365689277649, -0.00039714574813842773, -0.0003795549273490906, -0.0003619641065597534, -0.00034437328577041626, -0.0003267824649810791, -0.00030919164419174194, -0.0002916008234024048, -0.0002740100026130676, -0.00025641918182373047, -0.0002388283610343933, -0.00022123754024505615, -0.000203646719455719, -0.00018605589866638184, -0.00016846507787704468, -0.00015087425708770752, -0.00013328343629837036, -0.0001156926155090332, -9.810179471969604e-05, -8.051097393035889e-05, -6.292015314102173e-05, -4.532933235168457e-05, -2.7738511562347412e-05, -1.0147690773010254e-05, 7.443130016326904e-06, 2.5033950805664062e-05, 4.262477159500122e-05, 6.021559238433838e-05, 7.780641317367554e-05, 9.53972339630127e-05, 0.00011298805475234985, 0.000130578875541687, 0.00014816969633102417, 0.00016576051712036133, 0.00018335133790969849, 0.00020094215869903564, 0.0002185329794883728, 0.00023612380027770996, 0.0002537146210670471, 0.0002713054418563843, 0.00028889626264572144, 0.0003064870834350586, 0.00032407790422439575, 0.0003416687250137329, 0.00035925954580307007, 0.0003768503665924072, 0.0003944411873817444, 0.00041203200817108154, 0.0004296228289604187, 0.00044721364974975586, 0.000464804470539093, 0.0004823952913284302, 0.0004999861121177673, 0.0005175769329071045, 0.0005351677536964417, 0.0005527585744857788, 0.000570349395275116, 0.0005879402160644531]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 13.0, 20.0, 41.0, 62.0, 93.0, 148.0, 235.0, 375.0, 569.0, 1106.0, 1796.0, 3079.0, 5498.0, 9192.0, 15419.0, 25951.0, 41219.0, 62180.0, 86327.0, 110643.0, 126919.0, 130879.0, 120563.0, 98900.0, 74602.0, 50875.0, 32745.0, 20291.0, 11754.0, 7118.0, 4030.0, 2368.0, 1363.0, 829.0, 522.0, 297.0, 187.0, 121.0, 78.0, 45.0, 36.0, 17.0, 14.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.87457275390625, -3.7374267578125, -3.60028076171875, -3.463134765625, -3.32598876953125, -3.1888427734375, -3.05169677734375, -2.91455078125, -2.77740478515625, -2.6402587890625, -2.50311279296875, -2.365966796875, -2.22882080078125, -2.0916748046875, -1.95452880859375, -1.8173828125, -1.68023681640625, -1.5430908203125, -1.40594482421875, -1.268798828125, -1.13165283203125, -0.9945068359375, -0.85736083984375, -0.72021484375, -0.58306884765625, -0.4459228515625, -0.30877685546875, -0.171630859375, -0.03448486328125, 0.1026611328125, 0.23980712890625, 0.376953125, 0.51409912109375, 0.6512451171875, 0.78839111328125, 0.925537109375, 1.06268310546875, 1.1998291015625, 1.33697509765625, 1.47412109375, 1.61126708984375, 1.7484130859375, 1.88555908203125, 2.022705078125, 2.15985107421875, 2.2969970703125, 2.43414306640625, 2.5712890625, 2.70843505859375, 2.8455810546875, 2.98272705078125, 3.119873046875, 3.25701904296875, 3.3941650390625, 3.53131103515625, 3.66845703125, 3.80560302734375, 3.9427490234375, 4.07989501953125, 4.217041015625, 4.35418701171875, 4.4913330078125, 4.62847900390625, 4.765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 9.0, 15.0, 27.0, 24.0, 31.0, 28.0, 40.0, 46.0, 33.0, 54.0, 47.0, 51.0, 54.0, 49.0, 45.0, 50.0, 55.0, 39.0, 33.0, 30.0, 33.0, 25.0, 24.0, 19.0, 17.0, 15.0, 19.0, 6.0, 15.0, 10.0, 7.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6351470947265625, -1.575958251953125, -1.5167694091796875, -1.45758056640625, -1.3983917236328125, -1.339202880859375, -1.2800140380859375, -1.2208251953125, -1.1616363525390625, -1.102447509765625, -1.0432586669921875, -0.98406982421875, -0.9248809814453125, -0.865692138671875, -0.8065032958984375, -0.747314453125, -0.6881256103515625, -0.628936767578125, -0.5697479248046875, -0.51055908203125, -0.4513702392578125, -0.392181396484375, -0.3329925537109375, -0.2738037109375, -0.2146148681640625, -0.155426025390625, -0.0962371826171875, -0.03704833984375, 0.0221405029296875, 0.081329345703125, 0.1405181884765625, 0.19970703125, 0.2588958740234375, 0.318084716796875, 0.3772735595703125, 0.43646240234375, 0.4956512451171875, 0.554840087890625, 0.6140289306640625, 0.6732177734375, 0.7324066162109375, 0.791595458984375, 0.8507843017578125, 0.90997314453125, 0.9691619873046875, 1.028350830078125, 1.0875396728515625, 1.146728515625, 1.2059173583984375, 1.265106201171875, 1.3242950439453125, 1.38348388671875, 1.4426727294921875, 1.501861572265625, 1.5610504150390625, 1.6202392578125, 1.6794281005859375, 1.738616943359375, 1.7978057861328125, 1.85699462890625, 1.9161834716796875, 1.975372314453125, 2.0345611572265625, 2.09375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 6.0, 7.0, 12.0, 13.0, 26.0, 17.0, 21.0, 32.0, 27.0, 34.0, 35.0, 42.0, 48.0, 33.0, 50.0, 60.0, 48.0, 35.0, 42.0, 53.0, 34.0, 44.0, 31.0, 32.0, 42.0, 29.0, 24.0, 14.0, 14.0, 18.0, 8.0, 17.0, 10.0, 7.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.086942672729492, -17.560914993286133, -17.034887313842773, -16.508859634399414, -15.982831954956055, -15.456804275512695, -14.930777549743652, -14.404749870300293, -13.878722190856934, -13.352694511413574, -12.826666831970215, -12.300639152526855, -11.774612426757812, -11.248584747314453, -10.722557067871094, -10.196529388427734, -9.670501708984375, -9.144474029541016, -8.618446350097656, -8.092418670654297, -7.566391468048096, -7.040363788604736, -6.514336585998535, -5.988308906555176, -5.462281227111816, -4.936253547668457, -4.410225868225098, -3.8841986656188965, -3.358170986175537, -2.8321433067321777, -2.3061158657073975, -1.7800884246826172, -1.2540626525878906, -0.7280350923538208, -0.20200753211975098, 0.32402002811431885, 0.8500475883483887, 1.376075267791748, 1.9021027088165283, 2.4281301498413086, 2.954157829284668, 3.4801855087280273, 4.006213188171387, 4.532240390777588, 5.058268070220947, 5.584295749664307, 6.110322952270508, 6.636350631713867, 7.162378311157227, 7.688405990600586, 8.214433670043945, 8.740461349487305, 9.266489028930664, 9.792516708374023, 10.318543434143066, 10.844571113586426, 11.370598793029785, 11.896626472473145, 12.422654151916504, 12.948681831359863, 13.474708557128906, 14.000736236572266, 14.526763916015625, 15.052791595458984, 15.578819274902344]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 5.0, 10.0, 13.0, 17.0, 17.0, 26.0, 24.0, 25.0, 33.0, 34.0, 39.0, 40.0, 48.0, 40.0, 47.0, 56.0, 59.0, 41.0, 50.0, 37.0, 50.0, 38.0, 41.0, 32.0, 22.0, 32.0, 26.0, 17.0, 11.0, 14.0, 8.0, 13.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.4061222076416, -21.68741226196289, -20.96870231628418, -20.24999237060547, -19.531280517578125, -18.812570571899414, -18.093860626220703, -17.375150680541992, -16.65644073486328, -15.93773078918457, -15.219019889831543, -14.500309944152832, -13.781599044799805, -13.062889099121094, -12.344179153442383, -11.625469207763672, -10.906757354736328, -10.188047409057617, -9.46933650970459, -8.750626564025879, -8.031915664672852, -7.313205718994141, -6.59449577331543, -5.8757853507995605, -5.157074928283691, -4.438364505767822, -3.7196543216705322, -3.000944137573242, -2.282233715057373, -1.563523292541504, -0.844813346862793, -0.12610292434692383, 0.5926094055175781, 1.3113197088241577, 2.0300300121307373, 2.7487401962280273, 3.4674506187438965, 4.186161041259766, 4.904870986938477, 5.623581409454346, 6.342291831970215, 7.061002254486084, 7.779712677001953, 8.498422622680664, 9.217132568359375, 9.935843467712402, 10.654553413391113, 11.37326431274414, 12.091974258422852, 12.810684204101562, 13.52939510345459, 14.2481050491333, 14.966815948486328, 15.685525894165039, 16.40423583984375, 17.12294578552246, 17.841655731201172, 18.560365676879883, 19.279075622558594, 19.997787475585938, 20.71649742126465, 21.43520736694336, 22.15391731262207, 22.87262725830078, 23.591339111328125]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 16.0, 29.0, 44.0, 88.0, 154.0, 236.0, 390.0, 582.0, 1015.0, 1723.0, 2680.0, 4361.0, 6782.0, 10669.0, 16837.0, 25305.0, 38028.0, 55033.0, 78360.0, 108239.0, 145426.0, 189166.0, 236433.0, 281995.0, 322045.0, 350568.0, 360728.0, 353185.0, 329240.0, 292441.0, 245553.0, 199344.0, 155027.0, 116065.0, 84697.0, 60077.0, 41899.0, 28030.0, 18461.0, 12079.0, 7854.0, 4947.0, 3190.0, 2047.0, 1206.0, 766.0, 488.0, 281.0, 204.0, 104.0, 69.0, 41.0, 24.0, 19.0, 4.0, 3.0, 4.0], "bins": [-11.4296875, -11.08984375, -10.75, -10.41015625, -10.0703125, -9.73046875, -9.390625, -9.05078125, -8.7109375, -8.37109375, -8.03125, -7.69140625, -7.3515625, -7.01171875, -6.671875, -6.33203125, -5.9921875, -5.65234375, -5.3125, -4.97265625, -4.6328125, -4.29296875, -3.953125, -3.61328125, -3.2734375, -2.93359375, -2.59375, -2.25390625, -1.9140625, -1.57421875, -1.234375, -0.89453125, -0.5546875, -0.21484375, 0.125, 0.46484375, 0.8046875, 1.14453125, 1.484375, 1.82421875, 2.1640625, 2.50390625, 2.84375, 3.18359375, 3.5234375, 3.86328125, 4.203125, 4.54296875, 4.8828125, 5.22265625, 5.5625, 5.90234375, 6.2421875, 6.58203125, 6.921875, 7.26171875, 7.6015625, 7.94140625, 8.28125, 8.62109375, 8.9609375, 9.30078125, 9.640625, 9.98046875, 10.3203125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 2.0, 6.0, 7.0, 14.0, 17.0, 17.0, 14.0, 16.0, 42.0, 44.0, 42.0, 42.0, 42.0, 44.0, 48.0, 35.0, 44.0, 61.0, 63.0, 36.0, 57.0, 48.0, 33.0, 34.0, 29.0, 21.0, 26.0, 27.0, 22.0, 9.0, 12.0, 14.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.591796875, -19.94921875, -19.306640625, -18.6640625, -18.021484375, -17.37890625, -16.736328125, -16.09375, -15.451171875, -14.80859375, -14.166015625, -13.5234375, -12.880859375, -12.23828125, -11.595703125, -10.953125, -10.310546875, -9.66796875, -9.025390625, -8.3828125, -7.740234375, -7.09765625, -6.455078125, -5.8125, -5.169921875, -4.52734375, -3.884765625, -3.2421875, -2.599609375, -1.95703125, -1.314453125, -0.671875, -0.029296875, 0.61328125, 1.255859375, 1.8984375, 2.541015625, 3.18359375, 3.826171875, 4.46875, 5.111328125, 5.75390625, 6.396484375, 7.0390625, 7.681640625, 8.32421875, 8.966796875, 9.609375, 10.251953125, 10.89453125, 11.537109375, 12.1796875, 12.822265625, 13.46484375, 14.107421875, 14.75, 15.392578125, 16.03515625, 16.677734375, 17.3203125, 17.962890625, 18.60546875, 19.248046875, 19.890625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 6.0, 24.0, 21.0, 33.0, 76.0, 122.0, 190.0, 325.0, 591.0, 950.0, 1641.0, 2668.0, 4399.0, 7004.0, 11076.0, 17258.0, 26425.0, 39756.0, 57988.0, 82266.0, 113210.0, 150238.0, 192727.0, 236756.0, 279876.0, 314764.0, 340602.0, 351359.0, 344318.0, 322604.0, 289513.0, 247816.0, 202009.0, 159017.0, 120904.0, 88762.0, 63078.0, 43311.0, 29126.0, 19319.0, 12215.0, 7700.0, 4890.0, 2881.0, 1810.0, 1099.0, 628.0, 390.0, 222.0, 148.0, 66.0, 43.0, 33.0, 11.0, 12.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-11.484375, -11.12109375, -10.7578125, -10.39453125, -10.03125, -9.66796875, -9.3046875, -8.94140625, -8.578125, -8.21484375, -7.8515625, -7.48828125, -7.125, -6.76171875, -6.3984375, -6.03515625, -5.671875, -5.30859375, -4.9453125, -4.58203125, -4.21875, -3.85546875, -3.4921875, -3.12890625, -2.765625, -2.40234375, -2.0390625, -1.67578125, -1.3125, -0.94921875, -0.5859375, -0.22265625, 0.140625, 0.50390625, 0.8671875, 1.23046875, 1.59375, 1.95703125, 2.3203125, 2.68359375, 3.046875, 3.41015625, 3.7734375, 4.13671875, 4.5, 4.86328125, 5.2265625, 5.58984375, 5.953125, 6.31640625, 6.6796875, 7.04296875, 7.40625, 7.76953125, 8.1328125, 8.49609375, 8.859375, 9.22265625, 9.5859375, 9.94921875, 10.3125, 10.67578125, 11.0390625, 11.40234375, 11.765625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 14.0, 30.0, 21.0, 28.0, 30.0, 46.0, 54.0, 65.0, 68.0, 101.0, 102.0, 104.0, 154.0, 173.0, 163.0, 169.0, 210.0, 210.0, 206.0, 215.0, 188.0, 203.0, 194.0, 156.0, 185.0, 165.0, 111.0, 133.0, 107.0, 90.0, 83.0, 61.0, 46.0, 42.0, 45.0, 23.0, 15.0, 14.0, 13.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.953125, -7.6968994140625, -7.440673828125, -7.1844482421875, -6.92822265625, -6.6719970703125, -6.415771484375, -6.1595458984375, -5.9033203125, -5.6470947265625, -5.390869140625, -5.1346435546875, -4.87841796875, -4.6221923828125, -4.365966796875, -4.1097412109375, -3.853515625, -3.5972900390625, -3.341064453125, -3.0848388671875, -2.82861328125, -2.5723876953125, -2.316162109375, -2.0599365234375, -1.8037109375, -1.5474853515625, -1.291259765625, -1.0350341796875, -0.77880859375, -0.5225830078125, -0.266357421875, -0.0101318359375, 0.24609375, 0.5023193359375, 0.758544921875, 1.0147705078125, 1.27099609375, 1.5272216796875, 1.783447265625, 2.0396728515625, 2.2958984375, 2.5521240234375, 2.808349609375, 3.0645751953125, 3.32080078125, 3.5770263671875, 3.833251953125, 4.0894775390625, 4.345703125, 4.6019287109375, 4.858154296875, 5.1143798828125, 5.37060546875, 5.6268310546875, 5.883056640625, 6.1392822265625, 6.3955078125, 6.6517333984375, 6.907958984375, 7.1641845703125, 7.42041015625, 7.6766357421875, 7.932861328125, 8.1890869140625, 8.4453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 13.0, 14.0, 17.0, 23.0, 24.0, 25.0, 43.0, 29.0, 36.0, 34.0, 58.0, 48.0, 53.0, 35.0, 48.0, 45.0, 34.0, 39.0, 55.0, 45.0, 46.0, 37.0, 21.0, 22.0, 22.0, 22.0, 17.0, 16.0, 20.0, 8.0, 3.0, 8.0, 7.0, 0.0, 7.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.027252197265625, -19.412723541259766, -18.798194885253906, -18.183666229248047, -17.569137573242188, -16.954608917236328, -16.34008026123047, -15.725553512573242, -15.111024856567383, -14.496496200561523, -13.881967544555664, -13.267438888549805, -12.652911186218262, -12.038382530212402, -11.423853874206543, -10.809326171875, -10.194796562194824, -9.580267906188965, -8.965739250183105, -8.351211547851562, -7.736682891845703, -7.122154235839844, -6.507625579833984, -5.893097400665283, -5.278568744659424, -4.6640400886535645, -4.049511909484863, -3.434983253479004, -2.8204548358917236, -2.2059264183044434, -1.591397762298584, -0.9768695831298828, -0.36234092712402344, 0.2521875500679016, 0.8667160272598267, 1.4812445640563965, 2.0957729816436768, 2.710301399230957, 3.3248300552368164, 3.9393582344055176, 4.553886890411377, 5.168415546417236, 5.7829437255859375, 6.397472381591797, 7.012001037597656, 7.626529216766357, 8.241058349609375, 8.855586051940918, 9.470114707946777, 10.084643363952637, 10.699172019958496, 11.313699722290039, 11.928228378295898, 12.542757034301758, 13.157285690307617, 13.771814346313477, 14.386343002319336, 15.000871658325195, 15.615400314331055, 16.229928970336914, 16.844457626342773, 17.458984375, 18.07351303100586, 18.68804168701172, 19.302570343017578]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 14.0, 10.0, 11.0, 15.0, 12.0, 25.0, 19.0, 21.0, 27.0, 23.0, 33.0, 32.0, 38.0, 44.0, 50.0, 44.0, 51.0, 52.0, 46.0, 51.0, 45.0, 38.0, 31.0, 37.0, 22.0, 33.0, 23.0, 26.0, 19.0, 26.0, 21.0, 7.0, 13.0, 6.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.068527221679688, -19.354019165039062, -18.639509201049805, -17.92500114440918, -17.210491180419922, -16.495983123779297, -15.781474113464355, -15.066965103149414, -14.352456092834473, -13.637947082519531, -12.92343807220459, -12.208929061889648, -11.494421005249023, -10.779911041259766, -10.06540298461914, -9.3508939743042, -8.636384963989258, -7.921875953674316, -7.207366943359375, -6.492858409881592, -5.77834939956665, -5.063840389251709, -4.349331855773926, -3.6348228454589844, -2.920313835144043, -2.2058048248291016, -1.4912960529327393, -0.776787281036377, -0.06227827072143555, 0.6522307395935059, 1.366739273071289, 2.0812482833862305, 2.795755386352539, 3.5102643966674805, 4.224773406982422, 4.939281940460205, 5.6537909507751465, 6.368299961090088, 7.082808494567871, 7.7973175048828125, 8.511826515197754, 9.226335525512695, 9.940844535827637, 10.655353546142578, 11.369861602783203, 12.084371566772461, 12.798879623413086, 13.513388633728027, 14.227897644042969, 14.94240665435791, 15.656915664672852, 16.371423721313477, 17.085933685302734, 17.80044174194336, 18.514949798583984, 19.229459762573242, 19.9439697265625, 20.658477783203125, 21.372987747192383, 22.087495803833008, 22.802005767822266, 23.51651382446289, 24.231021881103516, 24.945531845092773, 25.6600399017334]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 11.0, 20.0, 22.0, 44.0, 79.0, 132.0, 214.0, 408.0, 658.0, 1142.0, 1883.0, 3282.0, 5854.0, 10440.0, 18940.0, 33288.0, 58428.0, 97039.0, 144974.0, 180940.0, 172413.0, 128302.0, 81032.0, 47649.0, 26782.0, 14970.0, 8389.0, 4777.0, 2684.0, 1524.0, 867.0, 552.0, 304.0, 203.0, 116.0, 73.0, 39.0, 18.0, 25.0, 12.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.0184326171875, -2.909912109375, -2.8013916015625, -2.69287109375, -2.5843505859375, -2.475830078125, -2.3673095703125, -2.2587890625, -2.1502685546875, -2.041748046875, -1.9332275390625, -1.82470703125, -1.7161865234375, -1.607666015625, -1.4991455078125, -1.390625, -1.2821044921875, -1.173583984375, -1.0650634765625, -0.95654296875, -0.8480224609375, -0.739501953125, -0.6309814453125, -0.5224609375, -0.4139404296875, -0.305419921875, -0.1968994140625, -0.08837890625, 0.0201416015625, 0.128662109375, 0.2371826171875, 0.345703125, 0.4542236328125, 0.562744140625, 0.6712646484375, 0.77978515625, 0.8883056640625, 0.996826171875, 1.1053466796875, 1.2138671875, 1.3223876953125, 1.430908203125, 1.5394287109375, 1.64794921875, 1.7564697265625, 1.864990234375, 1.9735107421875, 2.08203125, 2.1905517578125, 2.299072265625, 2.4075927734375, 2.51611328125, 2.6246337890625, 2.733154296875, 2.8416748046875, 2.9501953125, 3.0587158203125, 3.167236328125, 3.2757568359375, 3.38427734375, 3.4927978515625, 3.601318359375, 3.7098388671875, 3.818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 8.0, 13.0, 17.0, 16.0, 25.0, 18.0, 23.0, 25.0, 30.0, 34.0, 29.0, 41.0, 41.0, 39.0, 41.0, 55.0, 49.0, 58.0, 41.0, 34.0, 35.0, 36.0, 23.0, 34.0, 32.0, 30.0, 18.0, 28.0, 20.0, 19.0, 10.0, 13.0, 7.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.28955078125, -19.5634765625, -18.83740234375, -18.111328125, -17.38525390625, -16.6591796875, -15.93310546875, -15.20703125, -14.48095703125, -13.7548828125, -13.02880859375, -12.302734375, -11.57666015625, -10.8505859375, -10.12451171875, -9.3984375, -8.67236328125, -7.9462890625, -7.22021484375, -6.494140625, -5.76806640625, -5.0419921875, -4.31591796875, -3.58984375, -2.86376953125, -2.1376953125, -1.41162109375, -0.685546875, 0.04052734375, 0.7666015625, 1.49267578125, 2.21875, 2.94482421875, 3.6708984375, 4.39697265625, 5.123046875, 5.84912109375, 6.5751953125, 7.30126953125, 8.02734375, 8.75341796875, 9.4794921875, 10.20556640625, 10.931640625, 11.65771484375, 12.3837890625, 13.10986328125, 13.8359375, 14.56201171875, 15.2880859375, 16.01416015625, 16.740234375, 17.46630859375, 18.1923828125, 18.91845703125, 19.64453125, 20.37060546875, 21.0966796875, 21.82275390625, 22.548828125, 23.27490234375, 24.0009765625, 24.72705078125, 25.453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 13.0, 9.0, 18.0, 42.0, 58.0, 90.0, 154.0, 196.0, 320.0, 404.0, 676.0, 1103.0, 1510.0, 2449.0, 3477.0, 5676.0, 8292.0, 12620.0, 18986.0, 27648.0, 40783.0, 57939.0, 78922.0, 101194.0, 118747.0, 124217.0, 114380.0, 95073.0, 72195.0, 51801.0, 36123.0, 24705.0, 16438.0, 11062.0, 7205.0, 4831.0, 3085.0, 2063.0, 1349.0, 936.0, 588.0, 413.0, 261.0, 184.0, 120.0, 80.0, 43.0, 28.0, 16.0, 11.0, 9.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.547637939453125, -2.46636962890625, -2.385101318359375, -2.3038330078125, -2.222564697265625, -2.14129638671875, -2.060028076171875, -1.978759765625, -1.897491455078125, -1.81622314453125, -1.734954833984375, -1.6536865234375, -1.572418212890625, -1.49114990234375, -1.409881591796875, -1.32861328125, -1.247344970703125, -1.16607666015625, -1.084808349609375, -1.0035400390625, -0.922271728515625, -0.84100341796875, -0.759735107421875, -0.678466796875, -0.597198486328125, -0.51593017578125, -0.434661865234375, -0.3533935546875, -0.272125244140625, -0.19085693359375, -0.109588623046875, -0.0283203125, 0.052947998046875, 0.13421630859375, 0.215484619140625, 0.2967529296875, 0.378021240234375, 0.45928955078125, 0.540557861328125, 0.621826171875, 0.703094482421875, 0.78436279296875, 0.865631103515625, 0.9468994140625, 1.028167724609375, 1.10943603515625, 1.190704345703125, 1.27197265625, 1.353240966796875, 1.43450927734375, 1.515777587890625, 1.5970458984375, 1.678314208984375, 1.75958251953125, 1.840850830078125, 1.922119140625, 2.003387451171875, 2.08465576171875, 2.165924072265625, 2.2471923828125, 2.328460693359375, 2.40972900390625, 2.490997314453125, 2.572265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 6.0, 6.0, 5.0, 8.0, 5.0, 20.0, 12.0, 14.0, 12.0, 24.0, 22.0, 18.0, 29.0, 31.0, 27.0, 31.0, 36.0, 40.0, 43.0, 44.0, 46.0, 39.0, 37.0, 41.0, 45.0, 35.0, 45.0, 28.0, 32.0, 28.0, 31.0, 27.0, 25.0, 21.0, 24.0, 11.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -13.014404296875, -12.54443359375, -12.074462890625, -11.6044921875, -11.134521484375, -10.66455078125, -10.194580078125, -9.724609375, -9.254638671875, -8.78466796875, -8.314697265625, -7.8447265625, -7.374755859375, -6.90478515625, -6.434814453125, -5.96484375, -5.494873046875, -5.02490234375, -4.554931640625, -4.0849609375, -3.614990234375, -3.14501953125, -2.675048828125, -2.205078125, -1.735107421875, -1.26513671875, -0.795166015625, -0.3251953125, 0.144775390625, 0.61474609375, 1.084716796875, 1.5546875, 2.024658203125, 2.49462890625, 2.964599609375, 3.4345703125, 3.904541015625, 4.37451171875, 4.844482421875, 5.314453125, 5.784423828125, 6.25439453125, 6.724365234375, 7.1943359375, 7.664306640625, 8.13427734375, 8.604248046875, 9.07421875, 9.544189453125, 10.01416015625, 10.484130859375, 10.9541015625, 11.424072265625, 11.89404296875, 12.364013671875, 12.833984375, 13.303955078125, 13.77392578125, 14.243896484375, 14.7138671875, 15.183837890625, 15.65380859375, 16.123779296875, 16.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 3.0, 3.0, 6.0, 17.0, 17.0, 20.0, 38.0, 61.0, 86.0, 112.0, 197.0, 245.0, 372.0, 555.0, 843.0, 1205.0, 1813.0, 2739.0, 3976.0, 5924.0, 9085.0, 13667.0, 20706.0, 31518.0, 47260.0, 68321.0, 94857.0, 122216.0, 138711.0, 130963.0, 106799.0, 79761.0, 55177.0, 37626.0, 24909.0, 16019.0, 10884.0, 7143.0, 4760.0, 3208.0, 2131.0, 1529.0, 946.0, 715.0, 446.0, 316.0, 239.0, 145.0, 92.0, 54.0, 43.0, 32.0, 17.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2164306640625, -0.20960426330566406, -0.20277786254882812, -0.1959514617919922, -0.18912506103515625, -0.1822986602783203, -0.17547225952148438, -0.16864585876464844, -0.1618194580078125, -0.15499305725097656, -0.14816665649414062, -0.1413402557373047, -0.13451385498046875, -0.1276874542236328, -0.12086105346679688, -0.11403465270996094, -0.107208251953125, -0.10038185119628906, -0.09355545043945312, -0.08672904968261719, -0.07990264892578125, -0.07307624816894531, -0.06624984741210938, -0.05942344665527344, -0.0525970458984375, -0.04577064514160156, -0.038944244384765625, -0.03211784362792969, -0.02529144287109375, -0.018465042114257812, -0.011638641357421875, -0.0048122406005859375, 0.00201416015625, 0.008840560913085938, 0.015666961669921875, 0.022493362426757812, 0.02931976318359375, 0.03614616394042969, 0.042972564697265625, 0.04979896545410156, 0.0566253662109375, 0.06345176696777344, 0.07027816772460938, 0.07710456848144531, 0.08393096923828125, 0.09075736999511719, 0.09758377075195312, 0.10441017150878906, 0.111236572265625, 0.11806297302246094, 0.12488937377929688, 0.1317157745361328, 0.13854217529296875, 0.1453685760498047, 0.15219497680664062, 0.15902137756347656, 0.1658477783203125, 0.17267417907714844, 0.17950057983398438, 0.1863269805908203, 0.19315338134765625, 0.1999797821044922, 0.20680618286132812, 0.21363258361816406, 0.220458984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 3.0, 2.0, 14.0, 13.0, 21.0, 14.0, 13.0, 27.0, 22.0, 26.0, 36.0, 37.0, 36.0, 50.0, 46.0, 43.0, 50.0, 46.0, 50.0, 49.0, 38.0, 47.0, 43.0, 42.0, 46.0, 28.0, 21.0, 27.0, 22.0, 19.0, 8.0, 9.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.641843795776367e-05, -3.528594970703125e-05, -3.415346145629883e-05, -3.3020973205566406e-05, -3.1888484954833984e-05, -3.075599670410156e-05, -2.962350845336914e-05, -2.849102020263672e-05, -2.7358531951904297e-05, -2.6226043701171875e-05, -2.5093555450439453e-05, -2.396106719970703e-05, -2.282857894897461e-05, -2.1696090698242188e-05, -2.0563602447509766e-05, -1.9431114196777344e-05, -1.8298625946044922e-05, -1.71661376953125e-05, -1.6033649444580078e-05, -1.4901161193847656e-05, -1.3768672943115234e-05, -1.2636184692382812e-05, -1.150369644165039e-05, -1.0371208190917969e-05, -9.238719940185547e-06, -8.106231689453125e-06, -6.973743438720703e-06, -5.841255187988281e-06, -4.708766937255859e-06, -3.5762786865234375e-06, -2.4437904357910156e-06, -1.3113021850585938e-06, -1.7881393432617188e-07, 9.5367431640625e-07, 2.086162567138672e-06, 3.2186508178710938e-06, 4.351139068603516e-06, 5.4836273193359375e-06, 6.616115570068359e-06, 7.748603820800781e-06, 8.881092071533203e-06, 1.0013580322265625e-05, 1.1146068572998047e-05, 1.2278556823730469e-05, 1.341104507446289e-05, 1.4543533325195312e-05, 1.5676021575927734e-05, 1.6808509826660156e-05, 1.7940998077392578e-05, 1.9073486328125e-05, 2.0205974578857422e-05, 2.1338462829589844e-05, 2.2470951080322266e-05, 2.3603439331054688e-05, 2.473592758178711e-05, 2.586841583251953e-05, 2.7000904083251953e-05, 2.8133392333984375e-05, 2.9265880584716797e-05, 3.039836883544922e-05, 3.153085708618164e-05, 3.266334533691406e-05, 3.3795833587646484e-05, 3.4928321838378906e-05, 3.606081008911133e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 9.0, 16.0, 8.0, 15.0, 18.0, 33.0, 57.0, 102.0, 154.0, 199.0, 321.0, 455.0, 687.0, 1007.0, 1578.0, 2255.0, 3391.0, 5148.0, 7816.0, 11783.0, 17991.0, 27338.0, 41200.0, 61750.0, 89427.0, 121036.0, 144989.0, 142284.0, 115147.0, 83076.0, 56963.0, 38240.0, 25168.0, 16467.0, 10883.0, 7261.0, 4707.0, 3096.0, 2090.0, 1483.0, 955.0, 668.0, 410.0, 290.0, 215.0, 129.0, 74.0, 58.0, 38.0, 20.0, 20.0, 11.0, 10.0, 6.0, 4.0, 4.0, 1.0, 2.0], "bins": [-0.440673828125, -0.4272804260253906, -0.41388702392578125, -0.4004936218261719, -0.3871002197265625, -0.3737068176269531, -0.36031341552734375, -0.3469200134277344, -0.333526611328125, -0.3201332092285156, -0.30673980712890625, -0.2933464050292969, -0.2799530029296875, -0.2665596008300781, -0.25316619873046875, -0.23977279663085938, -0.22637939453125, -0.21298599243164062, -0.19959259033203125, -0.18619918823242188, -0.1728057861328125, -0.15941238403320312, -0.14601898193359375, -0.13262557983398438, -0.119232177734375, -0.10583877563476562, -0.09244537353515625, -0.07905197143554688, -0.0656585693359375, -0.052265167236328125, -0.03887176513671875, -0.025478363037109375, -0.0120849609375, 0.001308441162109375, 0.01470184326171875, 0.028095245361328125, 0.0414886474609375, 0.054882049560546875, 0.06827545166015625, 0.08166885375976562, 0.095062255859375, 0.10845565795898438, 0.12184906005859375, 0.13524246215820312, 0.1486358642578125, 0.16202926635742188, 0.17542266845703125, 0.18881607055664062, 0.20220947265625, 0.21560287475585938, 0.22899627685546875, 0.24238967895507812, 0.2557830810546875, 0.2691764831542969, 0.28256988525390625, 0.2959632873535156, 0.309356689453125, 0.3227500915527344, 0.33614349365234375, 0.3495368957519531, 0.3629302978515625, 0.3763236999511719, 0.38971710205078125, 0.4031105041503906, 0.41650390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 9.0, 6.0, 10.0, 9.0, 14.0, 12.0, 10.0, 10.0, 16.0, 27.0, 37.0, 32.0, 51.0, 52.0, 85.0, 77.0, 69.0, 72.0, 58.0, 55.0, 49.0, 50.0, 38.0, 21.0, 32.0, 16.0, 14.0, 12.0, 10.0, 8.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.2126331329345703, -0.20395278930664062, -0.19527244567871094, -0.18659210205078125, -0.17791175842285156, -0.16923141479492188, -0.1605510711669922, -0.1518707275390625, -0.1431903839111328, -0.13451004028320312, -0.12582969665527344, -0.11714935302734375, -0.10846900939941406, -0.09978866577148438, -0.09110832214355469, -0.082427978515625, -0.07374763488769531, -0.06506729125976562, -0.05638694763183594, -0.04770660400390625, -0.03902626037597656, -0.030345916748046875, -0.021665573120117188, -0.0129852294921875, -0.0043048858642578125, 0.004375457763671875, 0.013055801391601562, 0.02173614501953125, 0.030416488647460938, 0.039096832275390625, 0.04777717590332031, 0.05645751953125, 0.06513786315917969, 0.07381820678710938, 0.08249855041503906, 0.09117889404296875, 0.09985923767089844, 0.10853958129882812, 0.11721992492675781, 0.1259002685546875, 0.1345806121826172, 0.14326095581054688, 0.15194129943847656, 0.16062164306640625, 0.16930198669433594, 0.17798233032226562, 0.1866626739501953, 0.195343017578125, 0.2040233612060547, 0.21270370483398438, 0.22138404846191406, 0.23006439208984375, 0.23874473571777344, 0.24742507934570312, 0.2561054229736328, 0.2647857666015625, 0.2734661102294922, 0.2821464538574219, 0.29082679748535156, 0.29950714111328125, 0.30818748474121094, 0.3168678283691406, 0.3255481719970703, 0.334228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 3.0, 5.0, 15.0, 8.0, 13.0, 28.0, 26.0, 26.0, 34.0, 36.0, 36.0, 37.0, 48.0, 58.0, 38.0, 45.0, 53.0, 45.0, 36.0, 29.0, 58.0, 52.0, 44.0, 34.0, 22.0, 25.0, 23.0, 18.0, 17.0, 21.0, 18.0, 4.0, 6.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.251113891601562, -19.63152503967285, -19.01193618774414, -18.39234733581543, -17.77275848388672, -17.153169631958008, -16.533580780029297, -15.91399097442627, -15.294402122497559, -14.674813270568848, -14.055224418640137, -13.435635566711426, -12.816045761108398, -12.196456909179688, -11.576868057250977, -10.957279205322266, -10.337690353393555, -9.718101501464844, -9.098512649536133, -8.478923797607422, -7.859334468841553, -7.239745616912842, -6.620156288146973, -6.000567436218262, -5.380978584289551, -4.76138973236084, -4.141800880432129, -3.5222115516662598, -2.902622699737549, -2.283033847808838, -1.6634447574615479, -1.0438556671142578, -0.4242687225341797, 0.1953202486038208, 0.8149092197418213, 1.4344981908798218, 2.0540871620178223, 2.673676013946533, 3.2932651042938232, 3.9128541946411133, 4.532443046569824, 5.152031898498535, 5.771620750427246, 6.391210079193115, 7.010798931121826, 7.630387783050537, 8.249977111816406, 8.869565963745117, 9.489154815673828, 10.108743667602539, 10.72833251953125, 11.347921371459961, 11.967510223388672, 12.587099075317383, 13.20668888092041, 13.826277732849121, 14.445866584777832, 15.065455436706543, 15.685044288635254, 16.30463409423828, 16.924222946166992, 17.543811798095703, 18.163400650024414, 18.782989501953125, 19.402578353881836]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 11.0, 13.0, 13.0, 14.0, 23.0, 20.0, 22.0, 26.0, 22.0, 33.0, 31.0, 39.0, 47.0, 46.0, 46.0, 49.0, 55.0, 42.0, 55.0, 44.0, 36.0, 31.0, 38.0, 24.0, 29.0, 26.0, 25.0, 19.0, 30.0, 17.0, 7.0, 15.0, 5.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15969467163086, -19.44611167907715, -18.732526779174805, -18.018943786621094, -17.305360794067383, -16.591777801513672, -15.878192901611328, -15.164609909057617, -14.45102596282959, -13.737442016601562, -13.023859024047852, -12.310275077819824, -11.596691131591797, -10.883108139038086, -10.169524192810059, -9.455940246582031, -8.74235725402832, -8.028773307800293, -7.315190315246582, -6.601606369018555, -5.8880228996276855, -5.174439430236816, -4.460855484008789, -3.74727201461792, -3.033688545227051, -2.3201050758361816, -1.6065213680267334, -0.8929376602172852, -0.17935419082641602, 0.5342292785644531, 1.2478132247924805, 1.9613966941833496, 2.6749801635742188, 3.388563632965088, 4.102147102355957, 4.815731048583984, 5.5293145179748535, 6.242897987365723, 6.95648193359375, 7.670065402984619, 8.383648872375488, 9.097232818603516, 9.810815811157227, 10.524399757385254, 11.237983703613281, 11.951566696166992, 12.66515064239502, 13.378734588623047, 14.092317581176758, 14.805901527404785, 15.519484519958496, 16.233068466186523, 16.946651458740234, 17.660236358642578, 18.37381935119629, 19.08740234375, 19.800987243652344, 20.514570236206055, 21.2281551361084, 21.94173812866211, 22.65532112121582, 23.36890411376953, 24.082489013671875, 24.796072006225586, 25.509654998779297]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 14.0, 9.0, 14.0, 39.0, 42.0, 76.0, 112.0, 205.0, 307.0, 479.0, 778.0, 1231.0, 1993.0, 3005.0, 4376.0, 6943.0, 10165.0, 14581.0, 21117.0, 28688.0, 38454.0, 49283.0, 61294.0, 72789.0, 82085.0, 88408.0, 90607.0, 88222.0, 81048.0, 70486.0, 59095.0, 47327.0, 36586.0, 27174.0, 19688.0, 13849.0, 9591.0, 6447.0, 4170.0, 2775.0, 1760.0, 1177.0, 763.0, 506.0, 298.0, 202.0, 107.0, 78.0, 59.0, 23.0, 15.0, 8.0, 3.0, 6.0, 3.0, 3.0], "bins": [-9.515625, -9.2391357421875, -8.962646484375, -8.6861572265625, -8.40966796875, -8.1331787109375, -7.856689453125, -7.5802001953125, -7.3037109375, -7.0272216796875, -6.750732421875, -6.4742431640625, -6.19775390625, -5.9212646484375, -5.644775390625, -5.3682861328125, -5.091796875, -4.8153076171875, -4.538818359375, -4.2623291015625, -3.98583984375, -3.7093505859375, -3.432861328125, -3.1563720703125, -2.8798828125, -2.6033935546875, -2.326904296875, -2.0504150390625, -1.77392578125, -1.4974365234375, -1.220947265625, -0.9444580078125, -0.66796875, -0.3914794921875, -0.114990234375, 0.1614990234375, 0.43798828125, 0.7144775390625, 0.990966796875, 1.2674560546875, 1.5439453125, 1.8204345703125, 2.096923828125, 2.3734130859375, 2.64990234375, 2.9263916015625, 3.202880859375, 3.4793701171875, 3.755859375, 4.0323486328125, 4.308837890625, 4.5853271484375, 4.86181640625, 5.1383056640625, 5.414794921875, 5.6912841796875, 5.9677734375, 6.2442626953125, 6.520751953125, 6.7972412109375, 7.07373046875, 7.3502197265625, 7.626708984375, 7.9031982421875, 8.1796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 15.0, 11.0, 16.0, 23.0, 16.0, 28.0, 23.0, 35.0, 28.0, 29.0, 43.0, 36.0, 40.0, 49.0, 40.0, 42.0, 37.0, 60.0, 48.0, 33.0, 36.0, 37.0, 30.0, 27.0, 30.0, 25.0, 18.0, 22.0, 23.0, 15.0, 18.0, 5.0, 15.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.0078125, -18.296875, -17.5859375, -16.875, -16.1640625, -15.453125, -14.7421875, -14.03125, -13.3203125, -12.609375, -11.8984375, -11.1875, -10.4765625, -9.765625, -9.0546875, -8.34375, -7.6328125, -6.921875, -6.2109375, -5.5, -4.7890625, -4.078125, -3.3671875, -2.65625, -1.9453125, -1.234375, -0.5234375, 0.1875, 0.8984375, 1.609375, 2.3203125, 3.03125, 3.7421875, 4.453125, 5.1640625, 5.875, 6.5859375, 7.296875, 8.0078125, 8.71875, 9.4296875, 10.140625, 10.8515625, 11.5625, 12.2734375, 12.984375, 13.6953125, 14.40625, 15.1171875, 15.828125, 16.5390625, 17.25, 17.9609375, 18.671875, 19.3828125, 20.09375, 20.8046875, 21.515625, 22.2265625, 22.9375, 23.6484375, 24.359375, 25.0703125, 25.78125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 5.0, 27.0, 16.0, 36.0, 64.0, 94.0, 160.0, 230.0, 397.0, 620.0, 978.0, 1653.0, 2582.0, 4005.0, 6127.0, 9355.0, 14039.0, 20227.0, 28816.0, 39158.0, 51758.0, 65399.0, 77946.0, 88041.0, 95172.0, 95737.0, 91479.0, 82339.0, 69803.0, 56335.0, 43599.0, 32278.0, 23143.0, 15979.0, 10893.0, 7213.0, 4641.0, 2980.0, 1880.0, 1299.0, 820.0, 476.0, 320.0, 192.0, 90.0, 61.0, 39.0, 22.0, 9.0, 13.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3616943359375, -9.051513671875, -8.7413330078125, -8.43115234375, -8.1209716796875, -7.810791015625, -7.5006103515625, -7.1904296875, -6.8802490234375, -6.570068359375, -6.2598876953125, -5.94970703125, -5.6395263671875, -5.329345703125, -5.0191650390625, -4.708984375, -4.3988037109375, -4.088623046875, -3.7784423828125, -3.46826171875, -3.1580810546875, -2.847900390625, -2.5377197265625, -2.2275390625, -1.9173583984375, -1.607177734375, -1.2969970703125, -0.98681640625, -0.6766357421875, -0.366455078125, -0.0562744140625, 0.25390625, 0.5640869140625, 0.874267578125, 1.1844482421875, 1.49462890625, 1.8048095703125, 2.114990234375, 2.4251708984375, 2.7353515625, 3.0455322265625, 3.355712890625, 3.6658935546875, 3.97607421875, 4.2862548828125, 4.596435546875, 4.9066162109375, 5.216796875, 5.5269775390625, 5.837158203125, 6.1473388671875, 6.45751953125, 6.7677001953125, 7.077880859375, 7.3880615234375, 7.6982421875, 8.0084228515625, 8.318603515625, 8.6287841796875, 8.93896484375, 9.2491455078125, 9.559326171875, 9.8695068359375, 10.1796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 13.0, 11.0, 6.0, 7.0, 14.0, 18.0, 17.0, 22.0, 28.0, 23.0, 24.0, 32.0, 22.0, 31.0, 38.0, 22.0, 40.0, 36.0, 40.0, 43.0, 44.0, 33.0, 33.0, 34.0, 36.0, 47.0, 43.0, 33.0, 28.0, 23.0, 26.0, 19.0, 28.0, 20.0, 12.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.4283447265625, -10.997314453125, -10.5662841796875, -10.13525390625, -9.7042236328125, -9.273193359375, -8.8421630859375, -8.4111328125, -7.9801025390625, -7.549072265625, -7.1180419921875, -6.68701171875, -6.2559814453125, -5.824951171875, -5.3939208984375, -4.962890625, -4.5318603515625, -4.100830078125, -3.6697998046875, -3.23876953125, -2.8077392578125, -2.376708984375, -1.9456787109375, -1.5146484375, -1.0836181640625, -0.652587890625, -0.2215576171875, 0.20947265625, 0.6405029296875, 1.071533203125, 1.5025634765625, 1.93359375, 2.3646240234375, 2.795654296875, 3.2266845703125, 3.65771484375, 4.0887451171875, 4.519775390625, 4.9508056640625, 5.3818359375, 5.8128662109375, 6.243896484375, 6.6749267578125, 7.10595703125, 7.5369873046875, 7.968017578125, 8.3990478515625, 8.830078125, 9.2611083984375, 9.692138671875, 10.1231689453125, 10.55419921875, 10.9852294921875, 11.416259765625, 11.8472900390625, 12.2783203125, 12.7093505859375, 13.140380859375, 13.5714111328125, 14.00244140625, 14.4334716796875, 14.864501953125, 15.2955322265625, 15.7265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 21.0, 34.0, 66.0, 111.0, 172.0, 269.0, 410.0, 681.0, 1117.0, 1934.0, 3310.0, 5462.0, 9280.0, 15158.0, 24748.0, 37615.0, 54948.0, 75414.0, 95477.0, 112528.0, 119862.0, 117222.0, 103589.0, 84349.0, 63122.0, 44335.0, 29602.0, 19039.0, 11247.0, 6986.0, 4116.0, 2479.0, 1550.0, 889.0, 510.0, 313.0, 213.0, 137.0, 89.0, 50.0, 29.0, 20.0, 15.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.11163330078125, -3.9732666015625, -3.83489990234375, -3.696533203125, -3.55816650390625, -3.4197998046875, -3.28143310546875, -3.14306640625, -3.00469970703125, -2.8663330078125, -2.72796630859375, -2.589599609375, -2.45123291015625, -2.3128662109375, -2.17449951171875, -2.0361328125, -1.89776611328125, -1.7593994140625, -1.62103271484375, -1.482666015625, -1.34429931640625, -1.2059326171875, -1.06756591796875, -0.92919921875, -0.79083251953125, -0.6524658203125, -0.51409912109375, -0.375732421875, -0.23736572265625, -0.0989990234375, 0.03936767578125, 0.177734375, 0.31610107421875, 0.4544677734375, 0.59283447265625, 0.731201171875, 0.86956787109375, 1.0079345703125, 1.14630126953125, 1.28466796875, 1.42303466796875, 1.5614013671875, 1.69976806640625, 1.838134765625, 1.97650146484375, 2.1148681640625, 2.25323486328125, 2.3916015625, 2.52996826171875, 2.6683349609375, 2.80670166015625, 2.945068359375, 3.08343505859375, 3.2218017578125, 3.36016845703125, 3.49853515625, 3.63690185546875, 3.7752685546875, 3.91363525390625, 4.052001953125, 4.19036865234375, 4.3287353515625, 4.46710205078125, 4.60546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 9.0, 6.0, 15.0, 17.0, 12.0, 27.0, 26.0, 34.0, 23.0, 35.0, 36.0, 43.0, 41.0, 34.0, 61.0, 43.0, 45.0, 35.0, 35.0, 39.0, 43.0, 48.0, 41.0, 32.0, 31.0, 19.0, 18.0, 22.0, 21.0, 19.0, 13.0, 16.0, 15.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005240440368652344, -0.0005087852478027344, -0.0004935264587402344, -0.0004782676696777344, -0.0004630088806152344, -0.0004477500915527344, -0.0004324913024902344, -0.0004172325134277344, -0.0004019737243652344, -0.0003867149353027344, -0.0003714561462402344, -0.0003561973571777344, -0.0003409385681152344, -0.0003256797790527344, -0.0003104209899902344, -0.0002951622009277344, -0.0002799034118652344, -0.0002646446228027344, -0.0002493858337402344, -0.00023412704467773438, -0.00021886825561523438, -0.00020360946655273438, -0.00018835067749023438, -0.00017309188842773438, -0.00015783309936523438, -0.00014257431030273438, -0.00012731552124023438, -0.00011205673217773438, -9.679794311523438e-05, -8.153915405273438e-05, -6.628036499023438e-05, -5.1021575927734375e-05, -3.5762786865234375e-05, -2.0503997802734375e-05, -5.245208740234375e-06, 1.0013580322265625e-05, 2.5272369384765625e-05, 4.0531158447265625e-05, 5.5789947509765625e-05, 7.104873657226562e-05, 8.630752563476562e-05, 0.00010156631469726562, 0.00011682510375976562, 0.00013208389282226562, 0.00014734268188476562, 0.00016260147094726562, 0.00017786026000976562, 0.00019311904907226562, 0.00020837783813476562, 0.00022363662719726562, 0.00023889541625976562, 0.0002541542053222656, 0.0002694129943847656, 0.0002846717834472656, 0.0002999305725097656, 0.0003151893615722656, 0.0003304481506347656, 0.0003457069396972656, 0.0003609657287597656, 0.0003762245178222656, 0.0003914833068847656, 0.0004067420959472656, 0.0004220008850097656, 0.0004372596740722656, 0.0004525184631347656]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 9.0, 9.0, 10.0, 28.0, 27.0, 40.0, 59.0, 94.0, 107.0, 188.0, 266.0, 429.0, 614.0, 943.0, 1536.0, 2435.0, 3961.0, 6200.0, 9733.0, 15429.0, 23570.0, 34660.0, 50109.0, 67767.0, 86114.0, 101441.0, 110715.0, 111486.0, 102968.0, 88101.0, 69759.0, 52831.0, 37021.0, 25213.0, 16255.0, 10359.0, 6661.0, 4101.0, 2620.0, 1676.0, 1035.0, 700.0, 442.0, 281.0, 205.0, 122.0, 75.0, 59.0, 42.0, 19.0, 10.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.4296875, -4.29156494140625, -4.1534423828125, -4.01531982421875, -3.877197265625, -3.73907470703125, -3.6009521484375, -3.46282958984375, -3.32470703125, -3.18658447265625, -3.0484619140625, -2.91033935546875, -2.772216796875, -2.63409423828125, -2.4959716796875, -2.35784912109375, -2.2197265625, -2.08160400390625, -1.9434814453125, -1.80535888671875, -1.667236328125, -1.52911376953125, -1.3909912109375, -1.25286865234375, -1.11474609375, -0.97662353515625, -0.8385009765625, -0.70037841796875, -0.562255859375, -0.42413330078125, -0.2860107421875, -0.14788818359375, -0.009765625, 0.12835693359375, 0.2664794921875, 0.40460205078125, 0.542724609375, 0.68084716796875, 0.8189697265625, 0.95709228515625, 1.09521484375, 1.23333740234375, 1.3714599609375, 1.50958251953125, 1.647705078125, 1.78582763671875, 1.9239501953125, 2.06207275390625, 2.2001953125, 2.33831787109375, 2.4764404296875, 2.61456298828125, 2.752685546875, 2.89080810546875, 3.0289306640625, 3.16705322265625, 3.30517578125, 3.44329833984375, 3.5814208984375, 3.71954345703125, 3.857666015625, 3.99578857421875, 4.1339111328125, 4.27203369140625, 4.41015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 10.0, 12.0, 10.0, 13.0, 20.0, 18.0, 30.0, 37.0, 46.0, 49.0, 51.0, 57.0, 50.0, 66.0, 65.0, 63.0, 54.0, 46.0, 46.0, 45.0, 39.0, 26.0, 33.0, 21.0, 17.0, 25.0, 10.0, 10.0, 6.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.278472900390625, -2.20343017578125, -2.128387451171875, -2.0533447265625, -1.978302001953125, -1.90325927734375, -1.828216552734375, -1.753173828125, -1.678131103515625, -1.60308837890625, -1.528045654296875, -1.4530029296875, -1.377960205078125, -1.30291748046875, -1.227874755859375, -1.15283203125, -1.077789306640625, -1.00274658203125, -0.927703857421875, -0.8526611328125, -0.777618408203125, -0.70257568359375, -0.627532958984375, -0.552490234375, -0.477447509765625, -0.40240478515625, -0.327362060546875, -0.2523193359375, -0.177276611328125, -0.10223388671875, -0.027191162109375, 0.0478515625, 0.122894287109375, 0.19793701171875, 0.272979736328125, 0.3480224609375, 0.423065185546875, 0.49810791015625, 0.573150634765625, 0.648193359375, 0.723236083984375, 0.79827880859375, 0.873321533203125, 0.9483642578125, 1.023406982421875, 1.09844970703125, 1.173492431640625, 1.24853515625, 1.323577880859375, 1.39862060546875, 1.473663330078125, 1.5487060546875, 1.623748779296875, 1.69879150390625, 1.773834228515625, 1.848876953125, 1.923919677734375, 1.99896240234375, 2.074005126953125, 2.1490478515625, 2.224090576171875, 2.29913330078125, 2.374176025390625, 2.44921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 8.0, 10.0, 10.0, 15.0, 12.0, 17.0, 32.0, 28.0, 35.0, 25.0, 47.0, 33.0, 42.0, 44.0, 49.0, 44.0, 47.0, 47.0, 43.0, 37.0, 41.0, 35.0, 37.0, 37.0, 31.0, 30.0, 16.0, 24.0, 15.0, 18.0, 10.0, 13.0, 10.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.210351943969727, -18.620548248291016, -18.030744552612305, -17.440940856933594, -16.851137161254883, -16.261333465576172, -15.671530723571777, -15.081727981567383, -14.491924285888672, -13.902120590209961, -13.31231689453125, -12.722513198852539, -12.132710456848145, -11.542906761169434, -10.953103065490723, -10.363300323486328, -9.7734956741333, -9.18369197845459, -8.593888282775879, -8.004085540771484, -7.414281845092773, -6.8244781494140625, -6.234674453735352, -5.644871234893799, -5.055067539215088, -4.465263843536377, -3.875460624694824, -3.2856569290161133, -2.6958534717559814, -2.1060500144958496, -1.5162463188171387, -0.9264430999755859, -0.336639404296875, 0.2531641125679016, 0.8429676294326782, 1.4327712059020996, 2.0225746631622314, 2.6123781204223633, 3.202181816101074, 3.791985034942627, 4.381788730621338, 4.971592426300049, 5.561395645141602, 6.1511993408203125, 6.741003036499023, 7.330806255340576, 7.920609951019287, 8.51041316986084, 9.10021686553955, 9.690020561218262, 10.279824256896973, 10.869626998901367, 11.459430694580078, 12.049234390258789, 12.6390380859375, 13.228841781616211, 13.818645477294922, 14.408449172973633, 14.998252868652344, 15.588056564331055, 16.177860260009766, 16.767662048339844, 17.357467651367188, 17.947269439697266, 18.537073135375977]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 12.0, 13.0, 12.0, 16.0, 16.0, 21.0, 24.0, 34.0, 30.0, 26.0, 40.0, 35.0, 40.0, 44.0, 38.0, 48.0, 57.0, 53.0, 49.0, 41.0, 40.0, 27.0, 41.0, 19.0, 24.0, 34.0, 23.0, 25.0, 23.0, 19.0, 9.0, 7.0, 12.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.008621215820312, -24.212242126464844, -23.415864944458008, -22.61948585510254, -21.82310676574707, -21.026729583740234, -20.230350494384766, -19.433971405029297, -18.637592315673828, -17.84121322631836, -17.044836044311523, -16.248456954956055, -15.452077865600586, -14.655699729919434, -13.859321594238281, -13.062942504882812, -12.266565322875977, -11.470187187194824, -10.673808097839355, -9.877429962158203, -9.081050872802734, -8.284672737121582, -7.48829460144043, -6.691915988922119, -5.895537376403809, -5.099158763885498, -4.3027801513671875, -3.506402015686035, -2.7100234031677246, -1.913644790649414, -1.1172666549682617, -0.32088804244995117, 0.4754924774169922, 1.2718709707260132, 2.068249464035034, 2.8646278381347656, 3.661006450653076, 4.457385063171387, 5.253763198852539, 6.05014181137085, 6.84652042388916, 7.642899036407471, 8.439277648925781, 9.235655784606934, 10.032033920288086, 10.828413009643555, 11.624791145324707, 12.42116928100586, 13.217548370361328, 14.01392650604248, 14.81030559539795, 15.606683731079102, 16.40306282043457, 17.199440002441406, 17.995819091796875, 18.792198181152344, 19.588577270507812, 20.38495635986328, 21.181333541870117, 21.977712631225586, 22.774091720581055, 23.57046890258789, 24.36684799194336, 25.163227081298828, 25.959604263305664]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 9.0, 19.0, 32.0, 33.0, 84.0, 133.0, 216.0, 391.0, 697.0, 1066.0, 1778.0, 2738.0, 4719.0, 7545.0, 11672.0, 18333.0, 28848.0, 42713.0, 63257.0, 91163.0, 127900.0, 171148.0, 222109.0, 275129.0, 323481.0, 360235.0, 380323.0, 378960.0, 355602.0, 315179.0, 265175.0, 211282.0, 162617.0, 118935.0, 84358.0, 57736.0, 39295.0, 25605.0, 16178.0, 10440.0, 6483.0, 4092.0, 2518.0, 1616.0, 953.0, 589.0, 355.0, 199.0, 139.0, 77.0, 53.0, 32.0, 22.0, 18.0, 2.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-13.96875, -13.51708984375, -13.0654296875, -12.61376953125, -12.162109375, -11.71044921875, -11.2587890625, -10.80712890625, -10.35546875, -9.90380859375, -9.4521484375, -9.00048828125, -8.548828125, -8.09716796875, -7.6455078125, -7.19384765625, -6.7421875, -6.29052734375, -5.8388671875, -5.38720703125, -4.935546875, -4.48388671875, -4.0322265625, -3.58056640625, -3.12890625, -2.67724609375, -2.2255859375, -1.77392578125, -1.322265625, -0.87060546875, -0.4189453125, 0.03271484375, 0.484375, 0.93603515625, 1.3876953125, 1.83935546875, 2.291015625, 2.74267578125, 3.1943359375, 3.64599609375, 4.09765625, 4.54931640625, 5.0009765625, 5.45263671875, 5.904296875, 6.35595703125, 6.8076171875, 7.25927734375, 7.7109375, 8.16259765625, 8.6142578125, 9.06591796875, 9.517578125, 9.96923828125, 10.4208984375, 10.87255859375, 11.32421875, 11.77587890625, 12.2275390625, 12.67919921875, 13.130859375, 13.58251953125, 14.0341796875, 14.48583984375, 14.9375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 11.0, 9.0, 18.0, 15.0, 22.0, 20.0, 27.0, 31.0, 30.0, 30.0, 41.0, 42.0, 43.0, 60.0, 54.0, 49.0, 43.0, 61.0, 44.0, 55.0, 36.0, 26.0, 31.0, 39.0, 27.0, 22.0, 27.0, 18.0, 10.0, 9.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.460693359375, -22.64013671875, -21.819580078125, -20.9990234375, -20.178466796875, -19.35791015625, -18.537353515625, -17.716796875, -16.896240234375, -16.07568359375, -15.255126953125, -14.4345703125, -13.614013671875, -12.79345703125, -11.972900390625, -11.15234375, -10.331787109375, -9.51123046875, -8.690673828125, -7.8701171875, -7.049560546875, -6.22900390625, -5.408447265625, -4.587890625, -3.767333984375, -2.94677734375, -2.126220703125, -1.3056640625, -0.485107421875, 0.33544921875, 1.156005859375, 1.9765625, 2.797119140625, 3.61767578125, 4.438232421875, 5.2587890625, 6.079345703125, 6.89990234375, 7.720458984375, 8.541015625, 9.361572265625, 10.18212890625, 11.002685546875, 11.8232421875, 12.643798828125, 13.46435546875, 14.284912109375, 15.10546875, 15.926025390625, 16.74658203125, 17.567138671875, 18.3876953125, 19.208251953125, 20.02880859375, 20.849365234375, 21.669921875, 22.490478515625, 23.31103515625, 24.131591796875, 24.9521484375, 25.772705078125, 26.59326171875, 27.413818359375, 28.234375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 14.0, 16.0, 44.0, 71.0, 125.0, 236.0, 403.0, 758.0, 1286.0, 2119.0, 3817.0, 6609.0, 11372.0, 19164.0, 31287.0, 49612.0, 76882.0, 114512.0, 163466.0, 221435.0, 284619.0, 344011.0, 389662.0, 414948.0, 411032.0, 382601.0, 332920.0, 272654.0, 210752.0, 153137.0, 106948.0, 71584.0, 45803.0, 28879.0, 17209.0, 10151.0, 5919.0, 3493.0, 2106.0, 1184.0, 635.0, 348.0, 215.0, 121.0, 55.0, 31.0, 22.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.846923828125, -17.28759765625, -16.728271484375, -16.1689453125, -15.609619140625, -15.05029296875, -14.490966796875, -13.931640625, -13.372314453125, -12.81298828125, -12.253662109375, -11.6943359375, -11.135009765625, -10.57568359375, -10.016357421875, -9.45703125, -8.897705078125, -8.33837890625, -7.779052734375, -7.2197265625, -6.660400390625, -6.10107421875, -5.541748046875, -4.982421875, -4.423095703125, -3.86376953125, -3.304443359375, -2.7451171875, -2.185791015625, -1.62646484375, -1.067138671875, -0.5078125, 0.051513671875, 0.61083984375, 1.170166015625, 1.7294921875, 2.288818359375, 2.84814453125, 3.407470703125, 3.966796875, 4.526123046875, 5.08544921875, 5.644775390625, 6.2041015625, 6.763427734375, 7.32275390625, 7.882080078125, 8.44140625, 9.000732421875, 9.56005859375, 10.119384765625, 10.6787109375, 11.238037109375, 11.79736328125, 12.356689453125, 12.916015625, 13.475341796875, 14.03466796875, 14.593994140625, 15.1533203125, 15.712646484375, 16.27197265625, 16.831298828125, 17.390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 5.0, 10.0, 14.0, 19.0, 31.0, 21.0, 40.0, 39.0, 55.0, 74.0, 74.0, 93.0, 120.0, 115.0, 163.0, 161.0, 170.0, 183.0, 206.0, 191.0, 210.0, 208.0, 216.0, 199.0, 200.0, 180.0, 180.0, 141.0, 132.0, 120.0, 99.0, 87.0, 78.0, 45.0, 43.0, 41.0, 30.0, 24.0, 18.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.96484375, -9.6171875, -9.26953125, -8.921875, -8.57421875, -8.2265625, -7.87890625, -7.53125, -7.18359375, -6.8359375, -6.48828125, -6.140625, -5.79296875, -5.4453125, -5.09765625, -4.75, -4.40234375, -4.0546875, -3.70703125, -3.359375, -3.01171875, -2.6640625, -2.31640625, -1.96875, -1.62109375, -1.2734375, -0.92578125, -0.578125, -0.23046875, 0.1171875, 0.46484375, 0.8125, 1.16015625, 1.5078125, 1.85546875, 2.203125, 2.55078125, 2.8984375, 3.24609375, 3.59375, 3.94140625, 4.2890625, 4.63671875, 4.984375, 5.33203125, 5.6796875, 6.02734375, 6.375, 6.72265625, 7.0703125, 7.41796875, 7.765625, 8.11328125, 8.4609375, 8.80859375, 9.15625, 9.50390625, 9.8515625, 10.19921875, 10.546875, 10.89453125, 11.2421875, 11.58984375, 11.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 13.0, 9.0, 15.0, 12.0, 16.0, 25.0, 27.0, 36.0, 49.0, 39.0, 38.0, 62.0, 62.0, 50.0, 58.0, 44.0, 47.0, 41.0, 48.0, 44.0, 33.0, 47.0, 31.0, 32.0, 16.0, 22.0, 22.0, 8.0, 17.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.577030181884766, -30.613937377929688, -29.65084457397461, -28.68775177001953, -27.724658966064453, -26.761566162109375, -25.798473358154297, -24.83538055419922, -23.87228775024414, -22.909194946289062, -21.946102142333984, -20.983009338378906, -20.019916534423828, -19.05682373046875, -18.093730926513672, -17.130638122558594, -16.16754722595215, -15.20445442199707, -14.241361618041992, -13.278268814086914, -12.315176010131836, -11.352083206176758, -10.388991355895996, -9.425898551940918, -8.46280574798584, -7.499712944030762, -6.536620140075684, -5.573527812957764, -4.6104350090026855, -3.6473422050476074, -2.6842498779296875, -1.7211570739746094, -0.7580642700195312, 0.20502841472625732, 1.168121099472046, 2.131213665008545, 3.094306468963623, 4.057399272918701, 5.020491600036621, 5.983584403991699, 6.946677207946777, 7.9097700119018555, 8.872862815856934, 9.835954666137695, 10.799047470092773, 11.762140274047852, 12.72523307800293, 13.688325881958008, 14.651418685913086, 15.614511489868164, 16.577604293823242, 17.54069709777832, 18.5037899017334, 19.466882705688477, 20.429973602294922, 21.39306640625, 22.356159210205078, 23.319252014160156, 24.282344818115234, 25.245437622070312, 26.20853042602539, 27.17162322998047, 28.134716033935547, 29.097808837890625, 30.060901641845703]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 1.0, 3.0, 8.0, 9.0, 16.0, 17.0, 19.0, 12.0, 30.0, 22.0, 32.0, 38.0, 35.0, 33.0, 40.0, 58.0, 52.0, 44.0, 41.0, 41.0, 51.0, 33.0, 35.0, 47.0, 44.0, 33.0, 21.0, 30.0, 36.0, 26.0, 19.0, 13.0, 15.0, 10.0, 12.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.46427917480469, -34.44151306152344, -33.41874313354492, -32.39597702026367, -31.37320899963379, -30.350440979003906, -29.327674865722656, -28.304906845092773, -27.28213882446289, -26.259370803833008, -25.236602783203125, -24.213836669921875, -23.191068649291992, -22.16830062866211, -21.14553451538086, -20.122766494750977, -19.099998474121094, -18.07723045349121, -17.054462432861328, -16.031696319580078, -15.008928298950195, -13.986160278320312, -12.963393211364746, -11.94062614440918, -10.917858123779297, -9.895090103149414, -8.872323036193848, -7.849555492401123, -6.826787948608398, -5.804020404815674, -4.781252861022949, -3.7584853172302246, -2.7357139587402344, -1.7129464149475098, -0.6901788711547852, 0.33258867263793945, 1.355356216430664, 2.3781237602233887, 3.4008913040161133, 4.423658847808838, 5.4464263916015625, 6.469193935394287, 7.491961479187012, 8.514728546142578, 9.537496566772461, 10.560264587402344, 11.58303165435791, 12.605798721313477, 13.62856674194336, 14.651334762573242, 15.674101829528809, 16.696868896484375, 17.719636917114258, 18.74240493774414, 19.76517105102539, 20.787939071655273, 21.810707092285156, 22.83347511291504, 23.856243133544922, 24.879009246826172, 25.901777267456055, 26.924545288085938, 27.947311401367188, 28.97007942199707, 29.992847442626953]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 12.0, 16.0, 17.0, 26.0, 51.0, 85.0, 115.0, 190.0, 300.0, 450.0, 725.0, 1180.0, 1926.0, 3108.0, 5443.0, 9340.0, 16154.0, 28211.0, 48811.0, 80772.0, 123981.0, 163005.0, 173114.0, 142854.0, 99699.0, 62447.0, 36342.0, 21026.0, 11894.0, 6870.0, 4064.0, 2442.0, 1403.0, 894.0, 552.0, 368.0, 242.0, 149.0, 90.0, 59.0, 39.0, 34.0, 15.0, 10.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.88671875, -4.74395751953125, -4.6011962890625, -4.45843505859375, -4.315673828125, -4.17291259765625, -4.0301513671875, -3.88739013671875, -3.74462890625, -3.60186767578125, -3.4591064453125, -3.31634521484375, -3.173583984375, -3.03082275390625, -2.8880615234375, -2.74530029296875, -2.6025390625, -2.45977783203125, -2.3170166015625, -2.17425537109375, -2.031494140625, -1.88873291015625, -1.7459716796875, -1.60321044921875, -1.46044921875, -1.31768798828125, -1.1749267578125, -1.03216552734375, -0.889404296875, -0.74664306640625, -0.6038818359375, -0.46112060546875, -0.318359375, -0.17559814453125, -0.0328369140625, 0.10992431640625, 0.252685546875, 0.39544677734375, 0.5382080078125, 0.68096923828125, 0.82373046875, 0.96649169921875, 1.1092529296875, 1.25201416015625, 1.394775390625, 1.53753662109375, 1.6802978515625, 1.82305908203125, 1.9658203125, 2.10858154296875, 2.2513427734375, 2.39410400390625, 2.536865234375, 2.67962646484375, 2.8223876953125, 2.96514892578125, 3.10791015625, 3.25067138671875, 3.3934326171875, 3.53619384765625, 3.678955078125, 3.82171630859375, 3.9644775390625, 4.10723876953125, 4.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 3.0, 15.0, 13.0, 17.0, 16.0, 12.0, 32.0, 23.0, 25.0, 41.0, 43.0, 38.0, 49.0, 37.0, 40.0, 37.0, 47.0, 50.0, 47.0, 45.0, 41.0, 36.0, 40.0, 33.0, 31.0, 29.0, 32.0, 21.0, 19.0, 16.0, 15.0, 13.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.0625, -35.9921875, -34.921875, -33.8515625, -32.78125, -31.7109375, -30.640625, -29.5703125, -28.5, -27.4296875, -26.359375, -25.2890625, -24.21875, -23.1484375, -22.078125, -21.0078125, -19.9375, -18.8671875, -17.796875, -16.7265625, -15.65625, -14.5859375, -13.515625, -12.4453125, -11.375, -10.3046875, -9.234375, -8.1640625, -7.09375, -6.0234375, -4.953125, -3.8828125, -2.8125, -1.7421875, -0.671875, 0.3984375, 1.46875, 2.5390625, 3.609375, 4.6796875, 5.75, 6.8203125, 7.890625, 8.9609375, 10.03125, 11.1015625, 12.171875, 13.2421875, 14.3125, 15.3828125, 16.453125, 17.5234375, 18.59375, 19.6640625, 20.734375, 21.8046875, 22.875, 23.9453125, 25.015625, 26.0859375, 27.15625, 28.2265625, 29.296875, 30.3671875, 31.4375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 36.0, 42.0, 82.0, 106.0, 151.0, 229.0, 401.0, 578.0, 839.0, 1390.0, 1930.0, 2946.0, 4433.0, 6630.0, 9734.0, 14906.0, 22036.0, 33016.0, 48295.0, 68988.0, 93823.0, 117820.0, 131299.0, 124732.0, 105989.0, 80424.0, 57229.0, 39530.0, 27209.0, 17725.0, 12151.0, 7941.0, 5386.0, 3440.0, 2407.0, 1593.0, 1046.0, 673.0, 469.0, 293.0, 220.0, 123.0, 83.0, 49.0, 37.0, 23.0, 11.0, 13.0, 11.0, 6.0, 1.0, 1.0, 1.0], "bins": [-3.7890625, -3.676727294921875, -3.56439208984375, -3.452056884765625, -3.3397216796875, -3.227386474609375, -3.11505126953125, -3.002716064453125, -2.890380859375, -2.778045654296875, -2.66571044921875, -2.553375244140625, -2.4410400390625, -2.328704833984375, -2.21636962890625, -2.104034423828125, -1.99169921875, -1.879364013671875, -1.76702880859375, -1.654693603515625, -1.5423583984375, -1.430023193359375, -1.31768798828125, -1.205352783203125, -1.093017578125, -0.980682373046875, -0.86834716796875, -0.756011962890625, -0.6436767578125, -0.531341552734375, -0.41900634765625, -0.306671142578125, -0.1943359375, -0.082000732421875, 0.03033447265625, 0.142669677734375, 0.2550048828125, 0.367340087890625, 0.47967529296875, 0.592010498046875, 0.704345703125, 0.816680908203125, 0.92901611328125, 1.041351318359375, 1.1536865234375, 1.266021728515625, 1.37835693359375, 1.490692138671875, 1.60302734375, 1.715362548828125, 1.82769775390625, 1.940032958984375, 2.0523681640625, 2.164703369140625, 2.27703857421875, 2.389373779296875, 2.501708984375, 2.614044189453125, 2.72637939453125, 2.838714599609375, 2.9510498046875, 3.063385009765625, 3.17572021484375, 3.288055419921875, 3.400390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 6.0, 8.0, 8.0, 19.0, 12.0, 19.0, 17.0, 17.0, 21.0, 21.0, 28.0, 39.0, 26.0, 34.0, 39.0, 34.0, 43.0, 37.0, 38.0, 38.0, 32.0, 28.0, 36.0, 29.0, 33.0, 33.0, 26.0, 32.0, 21.0, 16.0, 16.0, 26.0, 20.0, 13.0, 14.0, 15.0, 6.0, 8.0, 12.0, 7.0, 9.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-17.140625, -16.609130859375, -16.07763671875, -15.546142578125, -15.0146484375, -14.483154296875, -13.95166015625, -13.420166015625, -12.888671875, -12.357177734375, -11.82568359375, -11.294189453125, -10.7626953125, -10.231201171875, -9.69970703125, -9.168212890625, -8.63671875, -8.105224609375, -7.57373046875, -7.042236328125, -6.5107421875, -5.979248046875, -5.44775390625, -4.916259765625, -4.384765625, -3.853271484375, -3.32177734375, -2.790283203125, -2.2587890625, -1.727294921875, -1.19580078125, -0.664306640625, -0.1328125, 0.398681640625, 0.93017578125, 1.461669921875, 1.9931640625, 2.524658203125, 3.05615234375, 3.587646484375, 4.119140625, 4.650634765625, 5.18212890625, 5.713623046875, 6.2451171875, 6.776611328125, 7.30810546875, 7.839599609375, 8.37109375, 8.902587890625, 9.43408203125, 9.965576171875, 10.4970703125, 11.028564453125, 11.56005859375, 12.091552734375, 12.623046875, 13.154541015625, 13.68603515625, 14.217529296875, 14.7490234375, 15.280517578125, 15.81201171875, 16.343505859375, 16.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 16.0, 12.0, 23.0, 28.0, 36.0, 56.0, 78.0, 127.0, 187.0, 329.0, 477.0, 631.0, 1174.0, 1646.0, 2581.0, 4131.0, 6437.0, 10351.0, 16286.0, 26193.0, 41569.0, 65272.0, 98306.0, 136082.0, 161153.0, 148991.0, 113790.0, 77336.0, 50330.0, 31283.0, 19721.0, 12340.0, 7823.0, 4991.0, 3067.0, 1994.0, 1261.0, 839.0, 533.0, 345.0, 228.0, 176.0, 97.0, 76.0, 42.0, 36.0, 18.0, 19.0, 15.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.38916015625, -0.3776130676269531, -0.36606597900390625, -0.3545188903808594, -0.3429718017578125, -0.3314247131347656, -0.31987762451171875, -0.3083305358886719, -0.296783447265625, -0.2852363586425781, -0.27368927001953125, -0.2621421813964844, -0.2505950927734375, -0.23904800415039062, -0.22750091552734375, -0.21595382690429688, -0.20440673828125, -0.19285964965820312, -0.18131256103515625, -0.16976547241210938, -0.1582183837890625, -0.14667129516601562, -0.13512420654296875, -0.12357711791992188, -0.112030029296875, -0.10048294067382812, -0.08893585205078125, -0.07738876342773438, -0.0658416748046875, -0.054294586181640625, -0.04274749755859375, -0.031200408935546875, -0.0196533203125, -0.008106231689453125, 0.00344085693359375, 0.014987945556640625, 0.0265350341796875, 0.038082122802734375, 0.04962921142578125, 0.061176300048828125, 0.072723388671875, 0.08427047729492188, 0.09581756591796875, 0.10736465454101562, 0.1189117431640625, 0.13045883178710938, 0.14200592041015625, 0.15355300903320312, 0.16510009765625, 0.17664718627929688, 0.18819427490234375, 0.19974136352539062, 0.2112884521484375, 0.22283554077148438, 0.23438262939453125, 0.24592971801757812, 0.257476806640625, 0.2690238952636719, 0.28057098388671875, 0.2921180725097656, 0.3036651611328125, 0.3152122497558594, 0.32675933837890625, 0.3383064270019531, 0.349853515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 11.0, 24.0, 26.0, 31.0, 31.0, 34.0, 44.0, 43.0, 51.0, 53.0, 57.0, 48.0, 36.0, 66.0, 52.0, 52.0, 43.0, 30.0, 35.0, 41.0, 27.0, 39.0, 30.0, 22.0, 13.0, 11.0, 10.0, 1.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65648078918457e-05, -5.482882261276245e-05, -5.30928373336792e-05, -5.135685205459595e-05, -4.9620866775512695e-05, -4.788488149642944e-05, -4.614889621734619e-05, -4.441291093826294e-05, -4.267692565917969e-05, -4.0940940380096436e-05, -3.9204955101013184e-05, -3.746896982192993e-05, -3.573298454284668e-05, -3.399699926376343e-05, -3.2261013984680176e-05, -3.0525028705596924e-05, -2.8789043426513672e-05, -2.705305814743042e-05, -2.5317072868347168e-05, -2.3581087589263916e-05, -2.1845102310180664e-05, -2.0109117031097412e-05, -1.837313175201416e-05, -1.6637146472930908e-05, -1.4901161193847656e-05, -1.3165175914764404e-05, -1.1429190635681152e-05, -9.6932053565979e-06, -7.957220077514648e-06, -6.2212347984313965e-06, -4.4852495193481445e-06, -2.7492642402648926e-06, -1.0132789611816406e-06, 7.227063179016113e-07, 2.4586915969848633e-06, 4.194676876068115e-06, 5.930662155151367e-06, 7.666647434234619e-06, 9.402632713317871e-06, 1.1138617992401123e-05, 1.2874603271484375e-05, 1.4610588550567627e-05, 1.634657382965088e-05, 1.808255910873413e-05, 1.9818544387817383e-05, 2.1554529666900635e-05, 2.3290514945983887e-05, 2.502650022506714e-05, 2.676248550415039e-05, 2.8498470783233643e-05, 3.0234456062316895e-05, 3.1970441341400146e-05, 3.37064266204834e-05, 3.544241189956665e-05, 3.71783971786499e-05, 3.8914382457733154e-05, 4.0650367736816406e-05, 4.238635301589966e-05, 4.412233829498291e-05, 4.585832357406616e-05, 4.7594308853149414e-05, 4.9330294132232666e-05, 5.106627941131592e-05, 5.280226469039917e-05, 5.453824996948242e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 13.0, 16.0, 31.0, 45.0, 62.0, 107.0, 174.0, 290.0, 421.0, 723.0, 1156.0, 1891.0, 3150.0, 5182.0, 9005.0, 15396.0, 27503.0, 49094.0, 86679.0, 146943.0, 208455.0, 194382.0, 127292.0, 73847.0, 41207.0, 23283.0, 13127.0, 7601.0, 4481.0, 2670.0, 1669.0, 1023.0, 625.0, 371.0, 233.0, 158.0, 91.0, 63.0, 29.0, 20.0, 17.0, 12.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.8234100341796875, -0.796722412109375, -0.7700347900390625, -0.74334716796875, -0.7166595458984375, -0.689971923828125, -0.6632843017578125, -0.6365966796875, -0.6099090576171875, -0.583221435546875, -0.5565338134765625, -0.52984619140625, -0.5031585693359375, -0.476470947265625, -0.4497833251953125, -0.423095703125, -0.3964080810546875, -0.369720458984375, -0.3430328369140625, -0.31634521484375, -0.2896575927734375, -0.262969970703125, -0.2362823486328125, -0.2095947265625, -0.1829071044921875, -0.156219482421875, -0.1295318603515625, -0.10284423828125, -0.0761566162109375, -0.049468994140625, -0.0227813720703125, 0.00390625, 0.0305938720703125, 0.057281494140625, 0.0839691162109375, 0.11065673828125, 0.1373443603515625, 0.164031982421875, 0.1907196044921875, 0.2174072265625, 0.2440948486328125, 0.270782470703125, 0.2974700927734375, 0.32415771484375, 0.3508453369140625, 0.377532958984375, 0.4042205810546875, 0.430908203125, 0.4575958251953125, 0.484283447265625, 0.5109710693359375, 0.53765869140625, 0.5643463134765625, 0.591033935546875, 0.6177215576171875, 0.6444091796875, 0.6710968017578125, 0.697784423828125, 0.7244720458984375, 0.75115966796875, 0.7778472900390625, 0.804534912109375, 0.8312225341796875, 0.85791015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 12.0, 10.0, 20.0, 17.0, 15.0, 24.0, 28.0, 47.0, 40.0, 51.0, 56.0, 74.0, 85.0, 73.0, 65.0, 54.0, 50.0, 41.0, 40.0, 28.0, 29.0, 24.0, 19.0, 11.0, 11.0, 13.0, 4.0, 6.0, 7.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.39270782470703125, -0.3786773681640625, -0.36464691162109375, -0.350616455078125, -0.33658599853515625, -0.3225555419921875, -0.30852508544921875, -0.29449462890625, -0.28046417236328125, -0.2664337158203125, -0.25240325927734375, -0.238372802734375, -0.22434234619140625, -0.2103118896484375, -0.19628143310546875, -0.1822509765625, -0.16822052001953125, -0.1541900634765625, -0.14015960693359375, -0.126129150390625, -0.11209869384765625, -0.0980682373046875, -0.08403778076171875, -0.07000732421875, -0.05597686767578125, -0.0419464111328125, -0.02791595458984375, -0.013885498046875, 0.00014495849609375, 0.0141754150390625, 0.02820587158203125, 0.042236328125, 0.05626678466796875, 0.0702972412109375, 0.08432769775390625, 0.098358154296875, 0.11238861083984375, 0.1264190673828125, 0.14044952392578125, 0.15447998046875, 0.16851043701171875, 0.1825408935546875, 0.19657135009765625, 0.210601806640625, 0.22463226318359375, 0.2386627197265625, 0.25269317626953125, 0.2667236328125, 0.28075408935546875, 0.2947845458984375, 0.30881500244140625, 0.322845458984375, 0.33687591552734375, 0.3509063720703125, 0.36493682861328125, 0.37896728515625, 0.39299774169921875, 0.4070281982421875, 0.42105865478515625, 0.435089111328125, 0.44911956787109375, 0.4631500244140625, 0.47718048095703125, 0.4912109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 8.0, 13.0, 11.0, 15.0, 14.0, 14.0, 25.0, 29.0, 45.0, 44.0, 39.0, 50.0, 54.0, 60.0, 54.0, 53.0, 45.0, 50.0, 44.0, 42.0, 41.0, 41.0, 43.0, 28.0, 27.0, 20.0, 22.0, 15.0, 16.0, 13.0, 2.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.737403869628906, -30.766916275024414, -29.796428680419922, -28.825939178466797, -27.855451583862305, -26.884963989257812, -25.91447639465332, -24.943988800048828, -23.973499298095703, -23.00301170349121, -22.03252410888672, -21.062034606933594, -20.0915470123291, -19.12105941772461, -18.150571823120117, -17.180084228515625, -16.209596633911133, -15.23910903930664, -14.268620491027832, -13.29813289642334, -12.327644348144531, -11.357156753540039, -10.386669158935547, -9.416181564331055, -8.445693016052246, -7.475204944610596, -6.504716873168945, -5.534229278564453, -4.563741207122803, -3.5932531356811523, -2.62276554107666, -1.6522774696350098, -0.6817913055419922, 0.28869664669036865, 1.2591845989227295, 2.229672431945801, 3.200160503387451, 4.170648574829102, 5.141136169433594, 6.111624240875244, 7.0821123123168945, 8.052599906921387, 9.023088455200195, 9.993576049804688, 10.96406364440918, 11.934552192687988, 12.90503978729248, 13.875528335571289, 14.846015930175781, 15.816503524780273, 16.786991119384766, 17.75748062133789, 18.727968215942383, 19.698455810546875, 20.668943405151367, 21.63943099975586, 22.609920501708984, 23.580408096313477, 24.55089569091797, 25.521385192871094, 26.491872787475586, 27.462360382080078, 28.43284797668457, 29.403335571289062, 30.373823165893555]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 7.0, 10.0, 15.0, 18.0, 17.0, 15.0, 29.0, 20.0, 32.0, 40.0, 32.0, 33.0, 42.0, 55.0, 49.0, 48.0, 45.0, 40.0, 49.0, 34.0, 35.0, 44.0, 44.0, 35.0, 24.0, 29.0, 37.0, 24.0, 18.0, 15.0, 15.0, 8.0, 11.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.5777587890625, -34.55222702026367, -33.526695251464844, -32.50116729736328, -31.47563362121582, -30.450103759765625, -29.424571990966797, -28.39904022216797, -27.37350845336914, -26.347976684570312, -25.322446823120117, -24.29691505432129, -23.27138328552246, -22.245853424072266, -21.220321655273438, -20.19478988647461, -19.169260025024414, -18.143728256225586, -17.11819839477539, -16.092666625976562, -15.067134857177734, -14.041604042053223, -13.016073226928711, -11.990541458129883, -10.965010643005371, -9.93947982788086, -8.913948059082031, -7.8884172439575195, -6.86288595199585, -5.83735466003418, -4.811823844909668, -3.786292552947998, -2.760761260986328, -1.7352300882339478, -0.7096989154815674, 0.31583213806152344, 1.3413634300231934, 2.3668947219848633, 3.392425537109375, 4.417956829071045, 5.443488121032715, 6.469019412994385, 7.494550704956055, 8.520081520080566, 9.545612335205078, 10.571144104003906, 11.596674919128418, 12.62220573425293, 13.647737503051758, 14.67326831817627, 15.698800086975098, 16.72433090209961, 17.749862670898438, 18.775394439697266, 19.80092430114746, 20.82645606994629, 21.851985931396484, 22.877517700195312, 23.903047561645508, 24.928579330444336, 25.954111099243164, 26.97964096069336, 28.005172729492188, 29.030704498291016, 30.056236267089844]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 9.0, 16.0, 17.0, 37.0, 72.0, 86.0, 144.0, 235.0, 348.0, 611.0, 890.0, 1406.0, 2316.0, 3967.0, 6404.0, 10282.0, 16212.0, 25260.0, 37840.0, 54439.0, 73606.0, 93268.0, 108211.0, 115877.0, 113518.0, 101953.0, 84127.0, 64442.0, 46056.0, 31502.0, 20789.0, 13009.0, 8288.0, 5046.0, 3092.0, 1949.0, 1177.0, 752.0, 455.0, 340.0, 211.0, 106.0, 53.0, 47.0, 35.0, 25.0, 9.0, 9.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.194091796875, -13.70068359375, -13.207275390625, -12.7138671875, -12.220458984375, -11.72705078125, -11.233642578125, -10.740234375, -10.246826171875, -9.75341796875, -9.260009765625, -8.7666015625, -8.273193359375, -7.77978515625, -7.286376953125, -6.79296875, -6.299560546875, -5.80615234375, -5.312744140625, -4.8193359375, -4.325927734375, -3.83251953125, -3.339111328125, -2.845703125, -2.352294921875, -1.85888671875, -1.365478515625, -0.8720703125, -0.378662109375, 0.11474609375, 0.608154296875, 1.1015625, 1.594970703125, 2.08837890625, 2.581787109375, 3.0751953125, 3.568603515625, 4.06201171875, 4.555419921875, 5.048828125, 5.542236328125, 6.03564453125, 6.529052734375, 7.0224609375, 7.515869140625, 8.00927734375, 8.502685546875, 8.99609375, 9.489501953125, 9.98291015625, 10.476318359375, 10.9697265625, 11.463134765625, 11.95654296875, 12.449951171875, 12.943359375, 13.436767578125, 13.93017578125, 14.423583984375, 14.9169921875, 15.410400390625, 15.90380859375, 16.397216796875, 16.890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 13.0, 10.0, 15.0, 13.0, 27.0, 21.0, 29.0, 22.0, 27.0, 34.0, 37.0, 50.0, 31.0, 49.0, 45.0, 46.0, 40.0, 48.0, 34.0, 39.0, 36.0, 23.0, 45.0, 28.0, 25.0, 25.0, 35.0, 25.0, 26.0, 16.0, 13.0, 13.0, 6.0, 9.0, 7.0, 9.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-33.6875, -32.759521484375, -31.83154296875, -30.903564453125, -29.9755859375, -29.047607421875, -28.11962890625, -27.191650390625, -26.263671875, -25.335693359375, -24.40771484375, -23.479736328125, -22.5517578125, -21.623779296875, -20.69580078125, -19.767822265625, -18.83984375, -17.911865234375, -16.98388671875, -16.055908203125, -15.1279296875, -14.199951171875, -13.27197265625, -12.343994140625, -11.416015625, -10.488037109375, -9.56005859375, -8.632080078125, -7.7041015625, -6.776123046875, -5.84814453125, -4.920166015625, -3.9921875, -3.064208984375, -2.13623046875, -1.208251953125, -0.2802734375, 0.647705078125, 1.57568359375, 2.503662109375, 3.431640625, 4.359619140625, 5.28759765625, 6.215576171875, 7.1435546875, 8.071533203125, 8.99951171875, 9.927490234375, 10.85546875, 11.783447265625, 12.71142578125, 13.639404296875, 14.5673828125, 15.495361328125, 16.42333984375, 17.351318359375, 18.279296875, 19.207275390625, 20.13525390625, 21.063232421875, 21.9912109375, 22.919189453125, 23.84716796875, 24.775146484375, 25.703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 19.0, 26.0, 38.0, 54.0, 79.0, 132.0, 180.0, 272.0, 429.0, 658.0, 986.0, 1484.0, 2427.0, 3548.0, 5500.0, 8165.0, 12807.0, 18966.0, 28582.0, 41661.0, 58031.0, 77487.0, 96325.0, 110454.0, 115579.0, 110348.0, 95247.0, 77111.0, 57439.0, 41106.0, 28159.0, 19113.0, 12538.0, 8278.0, 5275.0, 3478.0, 2293.0, 1397.0, 982.0, 635.0, 424.0, 308.0, 185.0, 110.0, 80.0, 61.0, 30.0, 27.0, 17.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -16.986328125, -16.41015625, -15.833984375, -15.2578125, -14.681640625, -14.10546875, -13.529296875, -12.953125, -12.376953125, -11.80078125, -11.224609375, -10.6484375, -10.072265625, -9.49609375, -8.919921875, -8.34375, -7.767578125, -7.19140625, -6.615234375, -6.0390625, -5.462890625, -4.88671875, -4.310546875, -3.734375, -3.158203125, -2.58203125, -2.005859375, -1.4296875, -0.853515625, -0.27734375, 0.298828125, 0.875, 1.451171875, 2.02734375, 2.603515625, 3.1796875, 3.755859375, 4.33203125, 4.908203125, 5.484375, 6.060546875, 6.63671875, 7.212890625, 7.7890625, 8.365234375, 8.94140625, 9.517578125, 10.09375, 10.669921875, 11.24609375, 11.822265625, 12.3984375, 12.974609375, 13.55078125, 14.126953125, 14.703125, 15.279296875, 15.85546875, 16.431640625, 17.0078125, 17.583984375, 18.16015625, 18.736328125, 19.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 10.0, 7.0, 10.0, 7.0, 21.0, 14.0, 19.0, 21.0, 25.0, 33.0, 34.0, 35.0, 31.0, 53.0, 45.0, 38.0, 51.0, 39.0, 47.0, 39.0, 47.0, 37.0, 44.0, 39.0, 29.0, 34.0, 32.0, 13.0, 16.0, 29.0, 17.0, 20.0, 13.0, 11.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.07568359375, -19.4482421875, -18.82080078125, -18.193359375, -17.56591796875, -16.9384765625, -16.31103515625, -15.68359375, -15.05615234375, -14.4287109375, -13.80126953125, -13.173828125, -12.54638671875, -11.9189453125, -11.29150390625, -10.6640625, -10.03662109375, -9.4091796875, -8.78173828125, -8.154296875, -7.52685546875, -6.8994140625, -6.27197265625, -5.64453125, -5.01708984375, -4.3896484375, -3.76220703125, -3.134765625, -2.50732421875, -1.8798828125, -1.25244140625, -0.625, 0.00244140625, 0.6298828125, 1.25732421875, 1.884765625, 2.51220703125, 3.1396484375, 3.76708984375, 4.39453125, 5.02197265625, 5.6494140625, 6.27685546875, 6.904296875, 7.53173828125, 8.1591796875, 8.78662109375, 9.4140625, 10.04150390625, 10.6689453125, 11.29638671875, 11.923828125, 12.55126953125, 13.1787109375, 13.80615234375, 14.43359375, 15.06103515625, 15.6884765625, 16.31591796875, 16.943359375, 17.57080078125, 18.1982421875, 18.82568359375, 19.453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 30.0, 50.0, 59.0, 100.0, 149.0, 241.0, 311.0, 514.0, 774.0, 1191.0, 1834.0, 2941.0, 4753.0, 7683.0, 12567.0, 20824.0, 33868.0, 52217.0, 75365.0, 100100.0, 120330.0, 130321.0, 125776.0, 108507.0, 83722.0, 59955.0, 39848.0, 24845.0, 15133.0, 9283.0, 5559.0, 3429.0, 2158.0, 1324.0, 914.0, 633.0, 403.0, 285.0, 189.0, 129.0, 65.0, 58.0, 44.0, 22.0, 7.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.59381103515625, -6.3555908203125, -6.11737060546875, -5.879150390625, -5.64093017578125, -5.4027099609375, -5.16448974609375, -4.92626953125, -4.68804931640625, -4.4498291015625, -4.21160888671875, -3.973388671875, -3.73516845703125, -3.4969482421875, -3.25872802734375, -3.0205078125, -2.78228759765625, -2.5440673828125, -2.30584716796875, -2.067626953125, -1.82940673828125, -1.5911865234375, -1.35296630859375, -1.11474609375, -0.87652587890625, -0.6383056640625, -0.40008544921875, -0.161865234375, 0.07635498046875, 0.3145751953125, 0.55279541015625, 0.791015625, 1.02923583984375, 1.2674560546875, 1.50567626953125, 1.743896484375, 1.98211669921875, 2.2203369140625, 2.45855712890625, 2.69677734375, 2.93499755859375, 3.1732177734375, 3.41143798828125, 3.649658203125, 3.88787841796875, 4.1260986328125, 4.36431884765625, 4.6025390625, 4.84075927734375, 5.0789794921875, 5.31719970703125, 5.555419921875, 5.79364013671875, 6.0318603515625, 6.27008056640625, 6.50830078125, 6.74652099609375, 6.9847412109375, 7.22296142578125, 7.461181640625, 7.69940185546875, 7.9376220703125, 8.17584228515625, 8.4140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 7.0, 13.0, 20.0, 22.0, 34.0, 33.0, 21.0, 49.0, 60.0, 60.0, 56.0, 60.0, 43.0, 50.0, 76.0, 61.0, 60.0, 52.0, 43.0, 36.0, 33.0, 9.0, 18.0, 11.0, 11.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0012407302856445312, -0.0012067779898643494, -0.0011728256940841675, -0.0011388733983039856, -0.0011049211025238037, -0.0010709688067436218, -0.00103701651096344, -0.001003064215183258, -0.0009691119194030762, -0.0009351596236228943, -0.0009012073278427124, -0.0008672550320625305, -0.0008333027362823486, -0.0007993504405021667, -0.0007653981447219849, -0.000731445848941803, -0.0006974935531616211, -0.0006635412573814392, -0.0006295889616012573, -0.0005956366658210754, -0.0005616843700408936, -0.0005277320742607117, -0.0004937797784805298, -0.0004598274827003479, -0.000425875186920166, -0.00039192289113998413, -0.00035797059535980225, -0.00032401829957962036, -0.0002900660037994385, -0.0002561137080192566, -0.0002221614122390747, -0.00018820911645889282, -0.00015425682067871094, -0.00012030452489852905, -8.635222911834717e-05, -5.239993333816528e-05, -1.84476375579834e-05, 1.5504658222198486e-05, 4.945695400238037e-05, 8.340924978256226e-05, 0.00011736154556274414, 0.00015131384134292603, 0.0001852661371231079, 0.0002192184329032898, 0.0002531707286834717, 0.00028712302446365356, 0.00032107532024383545, 0.00035502761602401733, 0.0003889799118041992, 0.0004229322075843811, 0.000456884503364563, 0.0004908367991447449, 0.0005247890949249268, 0.0005587413907051086, 0.0005926936864852905, 0.0006266459822654724, 0.0006605982780456543, 0.0006945505738258362, 0.0007285028696060181, 0.0007624551653862, 0.0007964074611663818, 0.0008303597569465637, 0.0008643120527267456, 0.0008982643485069275, 0.0009322166442871094]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 13.0, 21.0, 26.0, 45.0, 70.0, 121.0, 170.0, 267.0, 389.0, 572.0, 924.0, 1455.0, 2220.0, 3321.0, 5400.0, 8698.0, 13982.0, 23333.0, 36404.0, 56039.0, 80368.0, 105203.0, 124706.0, 131365.0, 123217.0, 103041.0, 78399.0, 54456.0, 35536.0, 22143.0, 13700.0, 8415.0, 5304.0, 3269.0, 2091.0, 1350.0, 881.0, 574.0, 319.0, 265.0, 159.0, 117.0, 70.0, 43.0, 26.0, 22.0, 16.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.91015625, -7.65875244140625, -7.4073486328125, -7.15594482421875, -6.904541015625, -6.65313720703125, -6.4017333984375, -6.15032958984375, -5.89892578125, -5.64752197265625, -5.3961181640625, -5.14471435546875, -4.893310546875, -4.64190673828125, -4.3905029296875, -4.13909912109375, -3.8876953125, -3.63629150390625, -3.3848876953125, -3.13348388671875, -2.882080078125, -2.63067626953125, -2.3792724609375, -2.12786865234375, -1.87646484375, -1.62506103515625, -1.3736572265625, -1.12225341796875, -0.870849609375, -0.61944580078125, -0.3680419921875, -0.11663818359375, 0.134765625, 0.38616943359375, 0.6375732421875, 0.88897705078125, 1.140380859375, 1.39178466796875, 1.6431884765625, 1.89459228515625, 2.14599609375, 2.39739990234375, 2.6488037109375, 2.90020751953125, 3.151611328125, 3.40301513671875, 3.6544189453125, 3.90582275390625, 4.1572265625, 4.40863037109375, 4.6600341796875, 4.91143798828125, 5.162841796875, 5.41424560546875, 5.6656494140625, 5.91705322265625, 6.16845703125, 6.41986083984375, 6.6712646484375, 6.92266845703125, 7.174072265625, 7.42547607421875, 7.6768798828125, 7.92828369140625, 8.1796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 15.0, 13.0, 17.0, 16.0, 20.0, 22.0, 38.0, 35.0, 37.0, 46.0, 42.0, 54.0, 58.0, 68.0, 65.0, 60.0, 47.0, 50.0, 40.0, 59.0, 37.0, 25.0, 20.0, 25.0, 12.0, 13.0, 11.0, 10.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 8.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.68817138671875, -2.5716552734375, -2.45513916015625, -2.338623046875, -2.22210693359375, -2.1055908203125, -1.98907470703125, -1.87255859375, -1.75604248046875, -1.6395263671875, -1.52301025390625, -1.406494140625, -1.28997802734375, -1.1734619140625, -1.05694580078125, -0.9404296875, -0.82391357421875, -0.7073974609375, -0.59088134765625, -0.474365234375, -0.35784912109375, -0.2413330078125, -0.12481689453125, -0.00830078125, 0.10821533203125, 0.2247314453125, 0.34124755859375, 0.457763671875, 0.57427978515625, 0.6907958984375, 0.80731201171875, 0.923828125, 1.04034423828125, 1.1568603515625, 1.27337646484375, 1.389892578125, 1.50640869140625, 1.6229248046875, 1.73944091796875, 1.85595703125, 1.97247314453125, 2.0889892578125, 2.20550537109375, 2.322021484375, 2.43853759765625, 2.5550537109375, 2.67156982421875, 2.7880859375, 2.90460205078125, 3.0211181640625, 3.13763427734375, 3.254150390625, 3.37066650390625, 3.4871826171875, 3.60369873046875, 3.72021484375, 3.83673095703125, 3.9532470703125, 4.06976318359375, 4.186279296875, 4.30279541015625, 4.4193115234375, 4.53582763671875, 4.65234375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 3.0, 8.0, 14.0, 7.0, 16.0, 22.0, 14.0, 16.0, 22.0, 31.0, 36.0, 41.0, 32.0, 58.0, 45.0, 57.0, 36.0, 56.0, 42.0, 45.0, 36.0, 50.0, 33.0, 42.0, 37.0, 36.0, 32.0, 23.0, 21.0, 18.0, 12.0, 13.0, 6.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.74311637878418, -26.811674118041992, -25.880233764648438, -24.94879150390625, -24.017349243164062, -23.085908889770508, -22.15446662902832, -21.223026275634766, -20.291584014892578, -19.36014175415039, -18.428701400756836, -17.49725914001465, -16.56581687927246, -15.634376525878906, -14.702934265136719, -13.771492958068848, -12.84005069732666, -11.908609390258789, -10.977167129516602, -10.04572582244873, -9.11428451538086, -8.182842254638672, -7.251400947570801, -6.31995964050293, -5.3885178565979, -4.457076072692871, -3.525634765625, -2.5941929817199707, -1.6627514362335205, -0.7313098907470703, 0.20013189315795898, 1.13157320022583, 2.0630149841308594, 2.9944565296173096, 3.9258980751037598, 4.857339859008789, 5.78878116607666, 6.7202229499816895, 7.651664733886719, 8.58310604095459, 9.514547348022461, 10.445988655090332, 11.37743091583252, 12.30887222290039, 13.240313529968262, 14.171754837036133, 15.10319709777832, 16.034637451171875, 16.966079711914062, 17.89752197265625, 18.828962326049805, 19.760404586791992, 20.69184684753418, 21.623287200927734, 22.554729461669922, 23.48617172241211, 24.417613983154297, 25.349056243896484, 26.28049659729004, 27.211938858032227, 28.143381118774414, 29.07482147216797, 30.006263732910156, 30.937705993652344, 31.8691463470459]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 9.0, 16.0, 18.0, 12.0, 15.0, 17.0, 35.0, 24.0, 33.0, 35.0, 31.0, 49.0, 43.0, 48.0, 50.0, 41.0, 44.0, 48.0, 41.0, 41.0, 34.0, 34.0, 25.0, 16.0, 34.0, 31.0, 19.0, 27.0, 17.0, 17.0, 13.0, 13.0, 14.0, 6.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.94686508178711, -38.799678802490234, -37.652488708496094, -36.50530242919922, -35.358116149902344, -34.2109260559082, -33.06373977661133, -31.91655158996582, -30.769363403320312, -29.622175216674805, -28.474987030029297, -27.327800750732422, -26.180612564086914, -25.033424377441406, -23.88623809814453, -22.739049911499023, -21.591861724853516, -20.444673538208008, -19.2974853515625, -18.150299072265625, -17.003110885620117, -15.85592269897461, -14.708735466003418, -13.561548233032227, -12.414360046386719, -11.267171859741211, -10.11998462677002, -8.972797393798828, -7.82560920715332, -6.678421497344971, -5.531233787536621, -4.38404655456543, -3.2368621826171875, -2.089674472808838, -0.9424867630004883, 0.20470094680786133, 1.351888656616211, 2.4990763664245605, 3.64626407623291, 4.793451309204102, 5.940639495849609, 7.087827205657959, 8.235014915466309, 9.3822021484375, 10.529390335083008, 11.676578521728516, 12.823765754699707, 13.970952987670898, 15.118141174316406, 16.265329360961914, 17.412517547607422, 18.559703826904297, 19.706892013549805, 20.854080200195312, 22.001266479492188, 23.148454666137695, 24.295642852783203, 25.44283103942871, 26.59001922607422, 27.737205505371094, 28.8843936920166, 30.03158187866211, 31.178768157958984, 32.325958251953125, 33.47314453125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 3.0, 5.0, 10.0, 13.0, 12.0, 16.0, 24.0, 37.0, 53.0, 63.0, 106.0, 113.0, 173.0, 251.0, 337.0, 452.0, 654.0, 893.0, 1190.0, 1547.0, 1935.0, 2541.0, 3237.0, 4229.0, 5893.0, 997599.0, 7931.0, 5160.0, 3775.0, 2955.0, 2317.0, 1868.0, 1373.0, 1060.0, 762.0, 574.0, 407.0, 295.0, 228.0, 152.0, 96.0, 74.0, 47.0, 35.0, 34.0, 26.0, 15.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-257.81195068359375, -250.18467712402344, -242.55738830566406, -234.93011474609375, -227.30282592773438, -219.67555236816406, -212.04827880859375, -204.42098999023438, -196.79371643066406, -189.16644287109375, -181.53915405273438, -173.91188049316406, -166.2845916748047, -158.65731811523438, -151.030029296875, -143.4027557373047, -135.77548217773438, -128.14820861816406, -120.52091979980469, -112.89364624023438, -105.26636505126953, -97.63908386230469, -90.01180267333984, -82.384521484375, -74.75723266601562, -67.12995147705078, -59.5026741027832, -51.87539291381836, -44.24811553955078, -36.62083435058594, -28.993553161621094, -21.366275787353516, -13.738998413085938, -6.111718654632568, 1.5155611038208008, 9.142841339111328, 16.77012062072754, 24.39739990234375, 32.024681091308594, 39.65195846557617, 47.279239654541016, 54.90652084350586, 62.53379821777344, 70.16107940673828, 77.78836059570312, 85.41563415527344, 93.04292297363281, 100.67019653320312, 108.29747772216797, 115.92475891113281, 123.55204010009766, 131.1793212890625, 138.8065948486328, 146.43386840820312, 154.0611572265625, 161.6884307861328, 169.3157196044922, 176.9429931640625, 184.57028198242188, 192.1975555419922, 199.82484436035156, 207.45211791992188, 215.07940673828125, 222.70668029785156, 230.33395385742188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 10.0, 17.0, 19.0, 28.0, 37.0, 35.0, 44.0, 65.0, 85.0, 132.0, 170.0, 218.0, 295.0, 412.0, 574.0, 896.0, 1311.0, 2061.0, 3273.0, 5378.0, 8518.0, 13349.0, 19840.0, 28639.0, 64402.0, 51195416.0, 47716.0, 26262.0, 18170.0, 12240.0, 7995.0, 4768.0, 3061.0, 1844.0, 1212.0, 805.0, 539.0, 393.0, 294.0, 207.0, 152.0, 131.0, 94.0, 70.0, 46.0, 34.0, 27.0, 15.0, 16.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-271.0247802734375, -262.1094970703125, -253.19424438476562, -244.2789764404297, -235.36370849609375, -226.44842529296875, -217.5331573486328, -208.61788940429688, -199.70262145996094, -190.787353515625, -181.87208557128906, -172.95681762695312, -164.04153442382812, -155.12628173828125, -146.21099853515625, -137.2957305908203, -128.38046264648438, -119.46519470214844, -110.5499267578125, -101.63465118408203, -92.7193832397461, -83.80411529541016, -74.88883972167969, -65.97357177734375, -57.05830383300781, -48.143035888671875, -39.22776412963867, -30.3124942779541, -21.39722442626953, -12.481956481933594, -3.5666847229003906, 5.3485870361328125, 14.26385498046875, 23.17912483215332, 32.09439468383789, 41.009666442871094, 49.92493438720703, 58.84020233154297, 67.75547790527344, 76.67074584960938, 85.58601379394531, 94.50128173828125, 103.41654968261719, 112.33182525634766, 121.2470932006836, 130.162353515625, 139.07763671875, 147.99290466308594, 156.90817260742188, 165.8234405517578, 174.73870849609375, 183.6539764404297, 192.56924438476562, 201.48452758789062, 210.39979553222656, 219.3150634765625, 228.23033142089844, 237.14559936523438, 246.0608673095703, 254.97613525390625, 263.89141845703125, 272.8066711425781, 281.7219543457031, 290.63720703125, 299.552490234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 9.0, 31.0, 38.0, 51.0, 78.0, 133.0, 193.0, 284.0, 468.0, 716.0, 1103.0, 1790.0, 3057.0, 5101.0, 8824.0, 15114.0, 27621.0, 49058.0, 87531.0, 153575.0, 263976.0, 465697.0, 1303595.0, 2411586.0, 685559.0, 340396.0, 200253.0, 114439.0, 65571.0, 36856.0, 20479.0, 11645.0, 6715.0, 3800.0, 2232.0, 1455.0, 934.0, 563.0, 350.0, 182.0, 117.0, 94.0, 45.0, 24.0, 25.0, 22.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.1484375, -5.95166015625, -5.7548828125, -5.55810546875, -5.361328125, -5.16455078125, -4.9677734375, -4.77099609375, -4.57421875, -4.37744140625, -4.1806640625, -3.98388671875, -3.787109375, -3.59033203125, -3.3935546875, -3.19677734375, -3.0, -2.80322265625, -2.6064453125, -2.40966796875, -2.212890625, -2.01611328125, -1.8193359375, -1.62255859375, -1.42578125, -1.22900390625, -1.0322265625, -0.83544921875, -0.638671875, -0.44189453125, -0.2451171875, -0.04833984375, 0.1484375, 0.34521484375, 0.5419921875, 0.73876953125, 0.935546875, 1.13232421875, 1.3291015625, 1.52587890625, 1.72265625, 1.91943359375, 2.1162109375, 2.31298828125, 2.509765625, 2.70654296875, 2.9033203125, 3.10009765625, 3.296875, 3.49365234375, 3.6904296875, 3.88720703125, 4.083984375, 4.28076171875, 4.4775390625, 4.67431640625, 4.87109375, 5.06787109375, 5.2646484375, 5.46142578125, 5.658203125, 5.85498046875, 6.0517578125, 6.24853515625, 6.4453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 14.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 14.0, 14.0, 23.0, 23.0, 26.0, 27.0, 31.0, 27.0, 35.0, 47.0, 33.0, 48.0, 105.0, 414.0, 485.0, 169.0, 55.0, 39.0, 40.0, 27.0, 34.0, 23.0, 26.0, 28.0, 21.0, 17.0, 19.0, 19.0, 12.0, 11.0, 12.0, 11.0, 8.0, 8.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-32.8125, -31.8203125, -30.828125, -29.8359375, -28.84375, -27.8515625, -26.859375, -25.8671875, -24.875, -23.8828125, -22.890625, -21.8984375, -20.90625, -19.9140625, -18.921875, -17.9296875, -16.9375, -15.9453125, -14.953125, -13.9609375, -12.96875, -11.9765625, -10.984375, -9.9921875, -9.0, -8.0078125, -7.015625, -6.0234375, -5.03125, -4.0390625, -3.046875, -2.0546875, -1.0625, -0.0703125, 0.921875, 1.9140625, 2.90625, 3.8984375, 4.890625, 5.8828125, 6.875, 7.8671875, 8.859375, 9.8515625, 10.84375, 11.8359375, 12.828125, 13.8203125, 14.8125, 15.8046875, 16.796875, 17.7890625, 18.78125, 19.7734375, 20.765625, 21.7578125, 22.75, 23.7421875, 24.734375, 25.7265625, 26.71875, 27.7109375, 28.703125, 29.6953125, 30.6875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 11.0, 23.0, 25.0, 36.0, 46.0, 73.0, 92.0, 155.0, 225.0, 359.0, 625.0, 930.0, 1516.0, 2459.0, 4011.0, 6471.0, 10569.0, 17234.0, 28243.0, 46962.0, 76492.0, 124549.0, 197085.0, 302826.0, 509852.0, 2249613.0, 1527200.0, 441482.0, 275343.0, 178626.0, 112001.0, 69054.0, 41978.0, 25362.0, 15274.0, 9420.0, 5723.0, 3561.0, 2152.0, 1316.0, 894.0, 544.0, 354.0, 232.0, 162.0, 93.0, 64.0, 43.0, 28.0, 12.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.43359375, -5.26318359375, -5.0927734375, -4.92236328125, -4.751953125, -4.58154296875, -4.4111328125, -4.24072265625, -4.0703125, -3.89990234375, -3.7294921875, -3.55908203125, -3.388671875, -3.21826171875, -3.0478515625, -2.87744140625, -2.70703125, -2.53662109375, -2.3662109375, -2.19580078125, -2.025390625, -1.85498046875, -1.6845703125, -1.51416015625, -1.34375, -1.17333984375, -1.0029296875, -0.83251953125, -0.662109375, -0.49169921875, -0.3212890625, -0.15087890625, 0.01953125, 0.18994140625, 0.3603515625, 0.53076171875, 0.701171875, 0.87158203125, 1.0419921875, 1.21240234375, 1.3828125, 1.55322265625, 1.7236328125, 1.89404296875, 2.064453125, 2.23486328125, 2.4052734375, 2.57568359375, 2.74609375, 2.91650390625, 3.0869140625, 3.25732421875, 3.427734375, 3.59814453125, 3.7685546875, 3.93896484375, 4.109375, 4.27978515625, 4.4501953125, 4.62060546875, 4.791015625, 4.96142578125, 5.1318359375, 5.30224609375, 5.47265625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 8.0, 4.0, 18.0, 6.0, 12.0, 14.0, 23.0, 14.0, 21.0, 20.0, 18.0, 26.0, 36.0, 23.0, 24.0, 29.0, 32.0, 33.0, 39.0, 43.0, 401.0, 584.0, 119.0, 40.0, 50.0, 34.0, 32.0, 33.0, 34.0, 24.0, 30.0, 17.0, 18.0, 16.0, 28.0, 12.0, 15.0, 5.0, 9.0, 9.0, 11.0, 9.0, 6.0, 7.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0], "bins": [-44.0, -42.7470703125, -41.494140625, -40.2412109375, -38.98828125, -37.7353515625, -36.482421875, -35.2294921875, -33.9765625, -32.7236328125, -31.470703125, -30.2177734375, -28.96484375, -27.7119140625, -26.458984375, -25.2060546875, -23.953125, -22.7001953125, -21.447265625, -20.1943359375, -18.94140625, -17.6884765625, -16.435546875, -15.1826171875, -13.9296875, -12.6767578125, -11.423828125, -10.1708984375, -8.91796875, -7.6650390625, -6.412109375, -5.1591796875, -3.90625, -2.6533203125, -1.400390625, -0.1474609375, 1.10546875, 2.3583984375, 3.611328125, 4.8642578125, 6.1171875, 7.3701171875, 8.623046875, 9.8759765625, 11.12890625, 12.3818359375, 13.634765625, 14.8876953125, 16.140625, 17.3935546875, 18.646484375, 19.8994140625, 21.15234375, 22.4052734375, 23.658203125, 24.9111328125, 26.1640625, 27.4169921875, 28.669921875, 29.9228515625, 31.17578125, 32.4287109375, 33.681640625, 34.9345703125, 36.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 2.0, 5.0, 7.0, 9.0, 11.0, 13.0, 22.0, 29.0, 26.0, 49.0, 69.0, 97.0, 122.0, 172.0, 260.0, 345.0, 516.0, 759.0, 1212.0, 1890.0, 2868.0, 4297.0, 7188.0, 11303.0, 18631.0, 29892.0, 48980.0, 83750.0, 235822.0, 5541692.0, 130052.0, 66079.0, 40049.0, 24682.0, 14914.0, 9066.0, 5768.0, 3586.0, 2439.0, 1469.0, 1001.0, 697.0, 503.0, 295.0, 230.0, 160.0, 137.0, 97.0, 51.0, 46.0, 30.0, 13.0, 6.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0], "bins": [-19.890625, -19.29296875, -18.6953125, -18.09765625, -17.5, -16.90234375, -16.3046875, -15.70703125, -15.109375, -14.51171875, -13.9140625, -13.31640625, -12.71875, -12.12109375, -11.5234375, -10.92578125, -10.328125, -9.73046875, -9.1328125, -8.53515625, -7.9375, -7.33984375, -6.7421875, -6.14453125, -5.546875, -4.94921875, -4.3515625, -3.75390625, -3.15625, -2.55859375, -1.9609375, -1.36328125, -0.765625, -0.16796875, 0.4296875, 1.02734375, 1.625, 2.22265625, 2.8203125, 3.41796875, 4.015625, 4.61328125, 5.2109375, 5.80859375, 6.40625, 7.00390625, 7.6015625, 8.19921875, 8.796875, 9.39453125, 9.9921875, 10.58984375, 11.1875, 11.78515625, 12.3828125, 12.98046875, 13.578125, 14.17578125, 14.7734375, 15.37109375, 15.96875, 16.56640625, 17.1640625, 17.76171875, 18.359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 8.0, 11.0, 8.0, 20.0, 17.0, 13.0, 19.0, 22.0, 22.0, 20.0, 22.0, 29.0, 41.0, 35.0, 36.0, 32.0, 28.0, 52.0, 181.0, 837.0, 108.0, 52.0, 48.0, 44.0, 32.0, 29.0, 35.0, 17.0, 38.0, 12.0, 20.0, 25.0, 13.0, 16.0, 14.0, 14.0, 12.0, 10.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.1875, -62.20361328125, -60.2197265625, -58.23583984375, -56.251953125, -54.26806640625, -52.2841796875, -50.30029296875, -48.31640625, -46.33251953125, -44.3486328125, -42.36474609375, -40.380859375, -38.39697265625, -36.4130859375, -34.42919921875, -32.4453125, -30.46142578125, -28.4775390625, -26.49365234375, -24.509765625, -22.52587890625, -20.5419921875, -18.55810546875, -16.57421875, -14.59033203125, -12.6064453125, -10.62255859375, -8.638671875, -6.65478515625, -4.6708984375, -2.68701171875, -0.703125, 1.28076171875, 3.2646484375, 5.24853515625, 7.232421875, 9.21630859375, 11.2001953125, 13.18408203125, 15.16796875, 17.15185546875, 19.1357421875, 21.11962890625, 23.103515625, 25.08740234375, 27.0712890625, 29.05517578125, 31.0390625, 33.02294921875, 35.0068359375, 36.99072265625, 38.974609375, 40.95849609375, 42.9423828125, 44.92626953125, 46.91015625, 48.89404296875, 50.8779296875, 52.86181640625, 54.845703125, 56.82958984375, 58.8134765625, 60.79736328125, 62.78125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 11.0, 17.0, 40.0, 71.0, 146.0, 460.0, 94.0, 55.0, 21.0, 15.0, 12.0, 13.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-618.604736328125, -600.5810546875, -582.557373046875, -564.53369140625, -546.5100708007812, -528.4863891601562, -510.46270751953125, -492.43902587890625, -474.41534423828125, -456.39166259765625, -438.3680114746094, -420.3443298339844, -402.3206481933594, -384.2969970703125, -366.2733154296875, -348.2496337890625, -330.2259826660156, -312.2023010253906, -294.17864990234375, -276.15496826171875, -258.13128662109375, -240.1076202392578, -222.08395385742188, -204.06027221679688, -186.03660583496094, -168.012939453125, -149.9892578125, -131.96559143066406, -113.9419174194336, -95.91824340820312, -77.89457702636719, -59.87090301513672, -41.84722900390625, -23.823556900024414, -5.799884796142578, 12.223785400390625, 30.247459411621094, 48.27113342285156, 66.2947998046875, 84.31847381591797, 102.34214782714844, 120.3658218383789, 138.38949584960938, 156.4131622314453, 174.43682861328125, 192.46051025390625, 210.4841766357422, 228.50784301757812, 246.53152465820312, 264.5552062988281, 282.578857421875, 300.6025390625, 318.626220703125, 336.64990234375, 354.6735534667969, 372.6972351074219, 390.72088623046875, 408.74456787109375, 426.7682189941406, 444.7919006347656, 462.8155822753906, 480.8392333984375, 498.8629150390625, 516.8865966796875, 534.9102783203125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 14.0, 8.0, 15.0, 25.0, 25.0, 51.0, 86.0, 192.0, 239.0, 74.0, 58.0, 49.0, 33.0, 11.0, 11.0, 13.0, 17.0, 11.0, 1.0, 7.0, 7.0, 2.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1072.4566650390625, -1041.036865234375, -1009.6170654296875, -978.197265625, -946.7774658203125, -915.357666015625, -883.9378662109375, -852.51806640625, -821.0982666015625, -789.678466796875, -758.2586669921875, -726.8388671875, -695.4190673828125, -663.999267578125, -632.5794677734375, -601.15966796875, -569.7398681640625, -538.320068359375, -506.9002685546875, -475.48046875, -444.0606689453125, -412.640869140625, -381.2210693359375, -349.80126953125, -318.3814697265625, -286.961669921875, -255.5418701171875, -224.1220703125, -192.7022705078125, -161.282470703125, -129.8626708984375, -98.44287109375, -67.0230712890625, -35.603271484375, -4.1834716796875, 27.236328125, 58.6561279296875, 90.075927734375, 121.4957275390625, 152.91552734375, 184.3353271484375, 215.755126953125, 247.1749267578125, 278.5947265625, 310.0145263671875, 341.434326171875, 372.8541259765625, 404.27392578125, 435.6937255859375, 467.113525390625, 498.5333251953125, 529.953125, 561.3729248046875, 592.792724609375, 624.2125244140625, 655.63232421875, 687.0521240234375, 718.471923828125, 749.8917236328125, 781.3115234375, 812.7313232421875, 844.151123046875, 875.5709228515625, 906.99072265625, 938.4105224609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 12.0, 16.0, 11.0, 30.0, 34.0, 59.0, 77.0, 124.0, 198.0, 286.0, 444.0, 730.0, 1287.0, 2336.0, 4454.0, 9058.0, 19794.0, 51909.0, 225951.0, 3693177.0, 119359.0, 36696.0, 14487.0, 6460.0, 3077.0, 1724.0, 887.0, 571.0, 340.0, 194.0, 148.0, 96.0, 58.0, 47.0, 32.0, 28.0, 23.0, 17.0, 11.0, 7.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.61053466796875, -4.4476318359375, -4.28472900390625, -4.121826171875, -3.95892333984375, -3.7960205078125, -3.63311767578125, -3.47021484375, -3.30731201171875, -3.1444091796875, -2.98150634765625, -2.818603515625, -2.65570068359375, -2.4927978515625, -2.32989501953125, -2.1669921875, -2.00408935546875, -1.8411865234375, -1.67828369140625, -1.515380859375, -1.35247802734375, -1.1895751953125, -1.02667236328125, -0.86376953125, -0.70086669921875, -0.5379638671875, -0.37506103515625, -0.212158203125, -0.04925537109375, 0.1136474609375, 0.27655029296875, 0.439453125, 0.60235595703125, 0.7652587890625, 0.92816162109375, 1.091064453125, 1.25396728515625, 1.4168701171875, 1.57977294921875, 1.74267578125, 1.90557861328125, 2.0684814453125, 2.23138427734375, 2.394287109375, 2.55718994140625, 2.7200927734375, 2.88299560546875, 3.0458984375, 3.20880126953125, 3.3717041015625, 3.53460693359375, 3.697509765625, 3.86041259765625, 4.0233154296875, 4.18621826171875, 4.34912109375, 4.51202392578125, 4.6749267578125, 4.83782958984375, 5.000732421875, 5.16363525390625, 5.3265380859375, 5.48944091796875, 5.65234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 8.0, 11.0, 10.0, 19.0, 26.0, 34.0, 677.0, 78.0, 31.0, 16.0, 16.0, 4.0, 12.0, 7.0, 5.0, 8.0, 3.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.99053955078125, -1.9185791015625, -1.84661865234375, -1.774658203125, -1.70269775390625, -1.6307373046875, -1.55877685546875, -1.48681640625, -1.41485595703125, -1.3428955078125, -1.27093505859375, -1.198974609375, -1.12701416015625, -1.0550537109375, -0.98309326171875, -0.9111328125, -0.83917236328125, -0.7672119140625, -0.69525146484375, -0.623291015625, -0.55133056640625, -0.4793701171875, -0.40740966796875, -0.33544921875, -0.26348876953125, -0.1915283203125, -0.11956787109375, -0.047607421875, 0.02435302734375, 0.0963134765625, 0.16827392578125, 0.240234375, 0.31219482421875, 0.3841552734375, 0.45611572265625, 0.528076171875, 0.60003662109375, 0.6719970703125, 0.74395751953125, 0.81591796875, 0.88787841796875, 0.9598388671875, 1.03179931640625, 1.103759765625, 1.17572021484375, 1.2476806640625, 1.31964111328125, 1.3916015625, 1.46356201171875, 1.5355224609375, 1.60748291015625, 1.679443359375, 1.75140380859375, 1.8233642578125, 1.89532470703125, 1.96728515625, 2.03924560546875, 2.1112060546875, 2.18316650390625, 2.255126953125, 2.32708740234375, 2.3990478515625, 2.47100830078125, 2.54296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 11.0, 9.0, 13.0, 26.0, 25.0, 46.0, 57.0, 102.0, 127.0, 170.0, 332.0, 529.0, 866.0, 1517.0, 2548.0, 4769.0, 9537.0, 19880.0, 45706.0, 119165.0, 381624.0, 1808265.0, 1342266.0, 294556.0, 93436.0, 36281.0, 15868.0, 7489.0, 3974.0, 2065.0, 1071.0, 691.0, 446.0, 239.0, 163.0, 109.0, 82.0, 65.0, 34.0, 22.0, 23.0, 13.0, 15.0, 10.0, 7.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.443359375, -2.371307373046875, -2.29925537109375, -2.227203369140625, -2.1551513671875, -2.083099365234375, -2.01104736328125, -1.938995361328125, -1.866943359375, -1.794891357421875, -1.72283935546875, -1.650787353515625, -1.5787353515625, -1.506683349609375, -1.43463134765625, -1.362579345703125, -1.29052734375, -1.218475341796875, -1.14642333984375, -1.074371337890625, -1.0023193359375, -0.930267333984375, -0.85821533203125, -0.786163330078125, -0.714111328125, -0.642059326171875, -0.57000732421875, -0.497955322265625, -0.4259033203125, -0.353851318359375, -0.28179931640625, -0.209747314453125, -0.1376953125, -0.065643310546875, 0.00640869140625, 0.078460693359375, 0.1505126953125, 0.222564697265625, 0.29461669921875, 0.366668701171875, 0.438720703125, 0.510772705078125, 0.58282470703125, 0.654876708984375, 0.7269287109375, 0.798980712890625, 0.87103271484375, 0.943084716796875, 1.01513671875, 1.087188720703125, 1.15924072265625, 1.231292724609375, 1.3033447265625, 1.375396728515625, 1.44744873046875, 1.519500732421875, 1.591552734375, 1.663604736328125, 1.73565673828125, 1.807708740234375, 1.8797607421875, 1.951812744140625, 2.02386474609375, 2.095916748046875, 2.16796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 18.0, 13.0, 17.0, 23.0, 35.0, 36.0, 48.0, 65.0, 77.0, 102.0, 128.0, 157.0, 237.0, 308.0, 420.0, 644.0, 500.0, 294.0, 248.0, 187.0, 116.0, 84.0, 64.0, 57.0, 34.0, 35.0, 19.0, 24.0, 17.0, 10.0, 7.0, 6.0, 9.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7177734375, -1.6681060791015625, -1.618438720703125, -1.5687713623046875, -1.51910400390625, -1.4694366455078125, -1.419769287109375, -1.3701019287109375, -1.3204345703125, -1.2707672119140625, -1.221099853515625, -1.1714324951171875, -1.12176513671875, -1.0720977783203125, -1.022430419921875, -0.9727630615234375, -0.923095703125, -0.8734283447265625, -0.823760986328125, -0.7740936279296875, -0.72442626953125, -0.6747589111328125, -0.625091552734375, -0.5754241943359375, -0.5257568359375, -0.4760894775390625, -0.426422119140625, -0.3767547607421875, -0.32708740234375, -0.2774200439453125, -0.227752685546875, -0.1780853271484375, -0.12841796875, -0.0787506103515625, -0.029083251953125, 0.0205841064453125, 0.07025146484375, 0.1199188232421875, 0.169586181640625, 0.2192535400390625, 0.2689208984375, 0.3185882568359375, 0.368255615234375, 0.4179229736328125, 0.46759033203125, 0.5172576904296875, 0.566925048828125, 0.6165924072265625, 0.666259765625, 0.7159271240234375, 0.765594482421875, 0.8152618408203125, 0.86492919921875, 0.9145965576171875, 0.964263916015625, 1.0139312744140625, 1.0635986328125, 1.1132659912109375, 1.162933349609375, 1.2126007080078125, 1.26226806640625, 1.3119354248046875, 1.361602783203125, 1.4112701416015625, 1.4609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 13.0, 26.0, 81.0, 222.0, 356.0, 197.0, 76.0, 22.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.911849975585938, -31.19810676574707, -30.484363555908203, -29.770618438720703, -29.056875228881836, -28.34313201904297, -27.62938690185547, -26.9156436920166, -26.201900482177734, -25.488157272338867, -24.7744140625, -24.0606689453125, -23.346925735473633, -22.633182525634766, -21.919437408447266, -21.2056941986084, -20.49195098876953, -19.778207778930664, -19.064464569091797, -18.350719451904297, -17.63697624206543, -16.923233032226562, -16.209487915039062, -15.495744705200195, -14.782001495361328, -14.068258285522461, -13.354514122009277, -12.640769958496094, -11.927026748657227, -11.21328353881836, -10.499539375305176, -9.785795211791992, -9.072052955627441, -8.358308792114258, -7.644565582275391, -6.930821895599365, -6.21707820892334, -5.5033345222473145, -4.789590835571289, -4.075847148895264, -3.3621034622192383, -2.648359775543213, -1.9346160888671875, -1.220872402191162, -0.5071287155151367, 0.20661497116088867, 0.9203586578369141, 1.6341023445129395, 2.347846031188965, 3.0615897178649902, 3.7753334045410156, 4.489077091217041, 5.202820777893066, 5.916564464569092, 6.630308151245117, 7.344051837921143, 8.057795524597168, 8.771539688110352, 9.485282897949219, 10.199026107788086, 10.91277027130127, 11.626514434814453, 12.34025764465332, 13.054000854492188, 13.767745018005371]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 12.0, 11.0, 10.0, 22.0, 19.0, 19.0, 33.0, 24.0, 36.0, 37.0, 49.0, 40.0, 52.0, 48.0, 43.0, 67.0, 48.0, 60.0, 48.0, 49.0, 38.0, 39.0, 41.0, 24.0, 34.0, 21.0, 17.0, 11.0, 9.0, 12.0, 7.0, 8.0, 5.0, 4.0, 1.0, 2.0], "bins": [-12.806951522827148, -12.502330780029297, -12.197710037231445, -11.893089294433594, -11.588468551635742, -11.283846855163574, -10.979226112365723, -10.674605369567871, -10.36998462677002, -10.065363883972168, -9.760743141174316, -9.456122398376465, -9.151500701904297, -8.846879959106445, -8.542259216308594, -8.237638473510742, -7.933017730712891, -7.628396987915039, -7.3237762451171875, -7.019155025482178, -6.714534282684326, -6.409913539886475, -6.105292320251465, -5.800671577453613, -5.496050834655762, -5.19143009185791, -4.886809349060059, -4.582188129425049, -4.277567386627197, -3.9729466438293457, -3.668325662612915, -3.3637046813964844, -3.0590829849243164, -2.754462242126465, -2.449841260910034, -2.1452202796936035, -1.840599536895752, -1.5359786748886108, -1.2313578128814697, -0.9267368316650391, -0.6221160888671875, -0.3174952268600464, -0.012874364852905273, 0.29174649715423584, 0.596367359161377, 0.9009882211685181, 1.2056090831756592, 1.5102300643920898, 1.8148508071899414, 2.119471549987793, 2.4240925312042236, 2.7287135124206543, 3.033334255218506, 3.3379549980163574, 3.642575979232788, 3.9471969604492188, 4.25181770324707, 4.556438446044922, 4.861059188842773, 5.165680408477783, 5.470301151275635, 5.774921894073486, 6.079543113708496, 6.384163856506348, 6.688784599304199]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 13.0, 8.0, 12.0, 13.0, 31.0, 27.0, 41.0, 59.0, 81.0, 118.0, 163.0, 273.0, 378.0, 646.0, 1144.0, 1949.0, 3530.0, 6987.0, 14735.0, 36794.0, 593255.0, 328210.0, 32142.0, 13408.0, 6503.0, 3371.0, 1882.0, 1039.0, 601.0, 377.0, 232.0, 129.0, 109.0, 74.0, 53.0, 36.0, 32.0, 28.0, 16.0, 7.0, 8.0, 11.0, 9.0, 1.0, 1.0, 9.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.93048095703125, -4.7711181640625, -4.61175537109375, -4.452392578125, -4.29302978515625, -4.1336669921875, -3.97430419921875, -3.81494140625, -3.65557861328125, -3.4962158203125, -3.33685302734375, -3.177490234375, -3.01812744140625, -2.8587646484375, -2.69940185546875, -2.5400390625, -2.38067626953125, -2.2213134765625, -2.06195068359375, -1.902587890625, -1.74322509765625, -1.5838623046875, -1.42449951171875, -1.26513671875, -1.10577392578125, -0.9464111328125, -0.78704833984375, -0.627685546875, -0.46832275390625, -0.3089599609375, -0.14959716796875, 0.009765625, 0.16912841796875, 0.3284912109375, 0.48785400390625, 0.647216796875, 0.80657958984375, 0.9659423828125, 1.12530517578125, 1.28466796875, 1.44403076171875, 1.6033935546875, 1.76275634765625, 1.922119140625, 2.08148193359375, 2.2408447265625, 2.40020751953125, 2.5595703125, 2.71893310546875, 2.8782958984375, 3.03765869140625, 3.197021484375, 3.35638427734375, 3.5157470703125, 3.67510986328125, 3.83447265625, 3.99383544921875, 4.1531982421875, 4.31256103515625, 4.471923828125, 4.63128662109375, 4.7906494140625, 4.95001220703125, 5.109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0, 3.0, 5.0, 11.0, 6.0, 10.0, 14.0, 23.0, 43.0, 167.0, 406.0, 161.0, 53.0, 15.0, 17.0, 7.0, 11.0, 8.0, 10.0, 4.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.9398193359375, -1.871826171875, -1.8038330078125, -1.73583984375, -1.6678466796875, -1.599853515625, -1.5318603515625, -1.4638671875, -1.3958740234375, -1.327880859375, -1.2598876953125, -1.19189453125, -1.1239013671875, -1.055908203125, -0.9879150390625, -0.919921875, -0.8519287109375, -0.783935546875, -0.7159423828125, -0.64794921875, -0.5799560546875, -0.511962890625, -0.4439697265625, -0.3759765625, -0.3079833984375, -0.239990234375, -0.1719970703125, -0.10400390625, -0.0360107421875, 0.031982421875, 0.0999755859375, 0.16796875, 0.2359619140625, 0.303955078125, 0.3719482421875, 0.43994140625, 0.5079345703125, 0.575927734375, 0.6439208984375, 0.7119140625, 0.7799072265625, 0.847900390625, 0.9158935546875, 0.98388671875, 1.0518798828125, 1.119873046875, 1.1878662109375, 1.255859375, 1.3238525390625, 1.391845703125, 1.4598388671875, 1.52783203125, 1.5958251953125, 1.663818359375, 1.7318115234375, 1.7998046875, 1.8677978515625, 1.935791015625, 2.0037841796875, 2.07177734375, 2.1397705078125, 2.207763671875, 2.2757568359375, 2.34375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 13.0, 12.0, 11.0, 9.0, 14.0, 26.0, 32.0, 49.0, 53.0, 96.0, 208.0, 384.0, 884.0, 2006.0, 4941.0, 13338.0, 41490.0, 151012.0, 502439.0, 238986.0, 61738.0, 19015.0, 6870.0, 2653.0, 1113.0, 470.0, 256.0, 150.0, 73.0, 45.0, 34.0, 32.0, 22.0, 12.0, 14.0, 12.0, 6.0, 3.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6796875, -5.50579833984375, -5.3319091796875, -5.15802001953125, -4.984130859375, -4.81024169921875, -4.6363525390625, -4.46246337890625, -4.28857421875, -4.11468505859375, -3.9407958984375, -3.76690673828125, -3.593017578125, -3.41912841796875, -3.2452392578125, -3.07135009765625, -2.8974609375, -2.72357177734375, -2.5496826171875, -2.37579345703125, -2.201904296875, -2.02801513671875, -1.8541259765625, -1.68023681640625, -1.50634765625, -1.33245849609375, -1.1585693359375, -0.98468017578125, -0.810791015625, -0.63690185546875, -0.4630126953125, -0.28912353515625, -0.115234375, 0.05865478515625, 0.2325439453125, 0.40643310546875, 0.580322265625, 0.75421142578125, 0.9281005859375, 1.10198974609375, 1.27587890625, 1.44976806640625, 1.6236572265625, 1.79754638671875, 1.971435546875, 2.14532470703125, 2.3192138671875, 2.49310302734375, 2.6669921875, 2.84088134765625, 3.0147705078125, 3.18865966796875, 3.362548828125, 3.53643798828125, 3.7103271484375, 3.88421630859375, 4.05810546875, 4.23199462890625, 4.4058837890625, 4.57977294921875, 4.753662109375, 4.92755126953125, 5.1014404296875, 5.27532958984375, 5.44921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 12.0, 11.0, 18.0, 24.0, 28.0, 20.0, 28.0, 26.0, 32.0, 38.0, 32.0, 31.0, 38.0, 31.0, 39.0, 37.0, 45.0, 39.0, 37.0, 42.0, 27.0, 24.0, 46.0, 31.0, 22.0, 23.0, 25.0, 24.0, 19.0, 22.0, 18.0, 16.0, 14.0, 10.0, 17.0, 7.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.78515625, -6.58624267578125, -6.3873291015625, -6.18841552734375, -5.989501953125, -5.79058837890625, -5.5916748046875, -5.39276123046875, -5.19384765625, -4.99493408203125, -4.7960205078125, -4.59710693359375, -4.398193359375, -4.19927978515625, -4.0003662109375, -3.80145263671875, -3.6025390625, -3.40362548828125, -3.2047119140625, -3.00579833984375, -2.806884765625, -2.60797119140625, -2.4090576171875, -2.21014404296875, -2.01123046875, -1.81231689453125, -1.6134033203125, -1.41448974609375, -1.215576171875, -1.01666259765625, -0.8177490234375, -0.61883544921875, -0.419921875, -0.22100830078125, -0.0220947265625, 0.17681884765625, 0.375732421875, 0.57464599609375, 0.7735595703125, 0.97247314453125, 1.17138671875, 1.37030029296875, 1.5692138671875, 1.76812744140625, 1.967041015625, 2.16595458984375, 2.3648681640625, 2.56378173828125, 2.7626953125, 2.96160888671875, 3.1605224609375, 3.35943603515625, 3.558349609375, 3.75726318359375, 3.9561767578125, 4.15509033203125, 4.35400390625, 4.55291748046875, 4.7518310546875, 4.95074462890625, 5.149658203125, 5.34857177734375, 5.5474853515625, 5.74639892578125, 5.9453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 9.0, 13.0, 17.0, 29.0, 35.0, 66.0, 94.0, 166.0, 275.0, 515.0, 1059.0, 2488.0, 7380.0, 35587.0, 784125.0, 192465.0, 16351.0, 4386.0, 1730.0, 771.0, 400.0, 212.0, 117.0, 93.0, 48.0, 29.0, 27.0, 13.0, 13.0, 8.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.89581298828125, -5.6978759765625, -5.49993896484375, -5.302001953125, -5.10406494140625, -4.9061279296875, -4.70819091796875, -4.51025390625, -4.31231689453125, -4.1143798828125, -3.91644287109375, -3.718505859375, -3.52056884765625, -3.3226318359375, -3.12469482421875, -2.9267578125, -2.72882080078125, -2.5308837890625, -2.33294677734375, -2.135009765625, -1.93707275390625, -1.7391357421875, -1.54119873046875, -1.34326171875, -1.14532470703125, -0.9473876953125, -0.74945068359375, -0.551513671875, -0.35357666015625, -0.1556396484375, 0.04229736328125, 0.240234375, 0.43817138671875, 0.6361083984375, 0.83404541015625, 1.031982421875, 1.22991943359375, 1.4278564453125, 1.62579345703125, 1.82373046875, 2.02166748046875, 2.2196044921875, 2.41754150390625, 2.615478515625, 2.81341552734375, 3.0113525390625, 3.20928955078125, 3.4072265625, 3.60516357421875, 3.8031005859375, 4.00103759765625, 4.198974609375, 4.39691162109375, 4.5948486328125, 4.79278564453125, 4.99072265625, 5.18865966796875, 5.3865966796875, 5.58453369140625, 5.782470703125, 5.98040771484375, 6.1783447265625, 6.37628173828125, 6.57421875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 22.0, 27.0, 39.0, 58.0, 91.0, 113.0, 121.0, 144.0, 106.0, 85.0, 56.0, 34.0, 26.0, 17.0, 18.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00021696090698242188, -0.00021111220121383667, -0.00020526349544525146, -0.00019941478967666626, -0.00019356608390808105, -0.00018771737813949585, -0.00018186867237091064, -0.00017601996660232544, -0.00017017126083374023, -0.00016432255506515503, -0.00015847384929656982, -0.00015262514352798462, -0.00014677643775939941, -0.0001409277319908142, -0.000135079026222229, -0.0001292303204536438, -0.0001233816146850586, -0.00011753290891647339, -0.00011168420314788818, -0.00010583549737930298, -9.998679161071777e-05, -9.413808584213257e-05, -8.828938007354736e-05, -8.244067430496216e-05, -7.659196853637695e-05, -7.074326276779175e-05, -6.489455699920654e-05, -5.904585123062134e-05, -5.319714546203613e-05, -4.734843969345093e-05, -4.149973392486572e-05, -3.565102815628052e-05, -2.9802322387695312e-05, -2.3953616619110107e-05, -1.8104910850524902e-05, -1.2256205081939697e-05, -6.407499313354492e-06, -5.587935447692871e-07, 5.289912223815918e-06, 1.1138617992401123e-05, 1.6987323760986328e-05, 2.2836029529571533e-05, 2.8684735298156738e-05, 3.453344106674194e-05, 4.038214683532715e-05, 4.6230852603912354e-05, 5.207955837249756e-05, 5.7928264141082764e-05, 6.377696990966797e-05, 6.962567567825317e-05, 7.547438144683838e-05, 8.132308721542358e-05, 8.717179298400879e-05, 9.3020498752594e-05, 9.88692045211792e-05, 0.0001047179102897644, 0.00011056661605834961, 0.00011641532182693481, 0.00012226402759552002, 0.00012811273336410522, 0.00013396143913269043, 0.00013981014490127563, 0.00014565885066986084, 0.00015150755643844604, 0.00015735626220703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 14.0, 17.0, 13.0, 37.0, 44.0, 84.0, 174.0, 267.0, 536.0, 1254.0, 3067.0, 9157.0, 37885.0, 320299.0, 596044.0, 59769.0, 12912.0, 3973.0, 1511.0, 683.0, 341.0, 193.0, 100.0, 50.0, 45.0, 26.0, 15.0, 12.0, 6.0, 10.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.101776123046875, -2.94769287109375, -2.793609619140625, -2.6395263671875, -2.485443115234375, -2.33135986328125, -2.177276611328125, -2.023193359375, -1.869110107421875, -1.71502685546875, -1.560943603515625, -1.4068603515625, -1.252777099609375, -1.09869384765625, -0.944610595703125, -0.79052734375, -0.636444091796875, -0.48236083984375, -0.328277587890625, -0.1741943359375, -0.020111083984375, 0.13397216796875, 0.288055419921875, 0.442138671875, 0.596221923828125, 0.75030517578125, 0.904388427734375, 1.0584716796875, 1.212554931640625, 1.36663818359375, 1.520721435546875, 1.6748046875, 1.828887939453125, 1.98297119140625, 2.137054443359375, 2.2911376953125, 2.445220947265625, 2.59930419921875, 2.753387451171875, 2.907470703125, 3.061553955078125, 3.21563720703125, 3.369720458984375, 3.5238037109375, 3.677886962890625, 3.83197021484375, 3.986053466796875, 4.14013671875, 4.294219970703125, 4.44830322265625, 4.602386474609375, 4.7564697265625, 4.910552978515625, 5.06463623046875, 5.218719482421875, 5.372802734375, 5.526885986328125, 5.68096923828125, 5.835052490234375, 5.9891357421875, 6.143218994140625, 6.29730224609375, 6.451385498046875, 6.60546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 3.0, 11.0, 5.0, 10.0, 13.0, 20.0, 18.0, 24.0, 23.0, 27.0, 58.0, 61.0, 70.0, 77.0, 100.0, 87.0, 63.0, 66.0, 43.0, 45.0, 40.0, 22.0, 23.0, 16.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.133209228515625, -4.98907470703125, -4.844940185546875, -4.7008056640625, -4.556671142578125, -4.41253662109375, -4.268402099609375, -4.124267578125, -3.980133056640625, -3.83599853515625, -3.691864013671875, -3.5477294921875, -3.403594970703125, -3.25946044921875, -3.115325927734375, -2.97119140625, -2.827056884765625, -2.68292236328125, -2.538787841796875, -2.3946533203125, -2.250518798828125, -2.10638427734375, -1.962249755859375, -1.818115234375, -1.673980712890625, -1.52984619140625, -1.385711669921875, -1.2415771484375, -1.097442626953125, -0.95330810546875, -0.809173583984375, -0.6650390625, -0.520904541015625, -0.37677001953125, -0.232635498046875, -0.0885009765625, 0.055633544921875, 0.19976806640625, 0.343902587890625, 0.488037109375, 0.632171630859375, 0.77630615234375, 0.920440673828125, 1.0645751953125, 1.208709716796875, 1.35284423828125, 1.496978759765625, 1.64111328125, 1.785247802734375, 1.92938232421875, 2.073516845703125, 2.2176513671875, 2.361785888671875, 2.50592041015625, 2.650054931640625, 2.794189453125, 2.938323974609375, 3.08245849609375, 3.226593017578125, 3.3707275390625, 3.514862060546875, 3.65899658203125, 3.803131103515625, 3.947265625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 10.0, 12.0, 48.0, 180.0, 511.0, 166.0, 48.0, 13.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.89703369140625, -99.28172302246094, -94.6664047241211, -90.05109405517578, -85.43577575683594, -80.82046508789062, -76.20515441894531, -71.58984375, -66.97452545166016, -62.35921096801758, -57.743896484375, -53.12858581542969, -48.51327133178711, -43.89795684814453, -39.28264617919922, -34.66733169555664, -30.052017211914062, -25.436702728271484, -20.82139015197754, -16.206077575683594, -11.590763092041016, -6.9754486083984375, -2.360136032104492, 2.255176544189453, 6.870491027832031, 11.485804557800293, 16.101118087768555, 20.7164306640625, 25.331745147705078, 29.947059631347656, 34.56237030029297, 39.17768478393555, 43.79301452636719, 48.408329010009766, 53.023643493652344, 57.638954162597656, 62.254268646240234, 66.86958312988281, 71.48489379882812, 76.10020446777344, 80.71552276611328, 85.3308334350586, 89.94615173339844, 94.56146240234375, 99.17677307128906, 103.7920913696289, 108.40740203857422, 113.02272033691406, 117.63803100585938, 122.25334167480469, 126.86865997314453, 131.48397827148438, 136.0992889404297, 140.714599609375, 145.3299102783203, 149.94522094726562, 154.560546875, 159.1758575439453, 163.79116821289062, 168.406494140625, 173.0218048095703, 177.63711547851562, 182.25242614746094, 186.86773681640625, 191.48304748535156]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 6.0, 4.0, 8.0, 8.0, 7.0, 15.0, 28.0, 31.0, 49.0, 71.0, 92.0, 107.0, 116.0, 124.0, 101.0, 51.0, 44.0, 36.0, 23.0, 16.0, 11.0, 4.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.92841339111328, -107.02137756347656, -103.11434936523438, -99.20731353759766, -95.30028533935547, -91.39324951171875, -87.48622131347656, -83.57918548583984, -79.67214965820312, -75.7651138305664, -71.85808563232422, -67.9510498046875, -64.04402160644531, -60.136985778808594, -56.22995376586914, -52.32292175292969, -48.4158935546875, -44.50886154174805, -40.601829528808594, -36.694793701171875, -32.78776550292969, -28.8807315826416, -24.973697662353516, -21.066665649414062, -17.15963363647461, -13.252601623535156, -9.345568656921387, -5.438535690307617, -1.531503677368164, 2.375528335571289, 6.282562255859375, 10.189594268798828, 14.096633911132812, 18.003665924072266, 21.91069793701172, 25.817731857299805, 29.724763870239258, 33.631797790527344, 37.5388298034668, 41.44586181640625, 45.3528938293457, 49.259925842285156, 53.16695785522461, 57.07398986816406, 60.98102569580078, 64.88805389404297, 68.79508972167969, 72.70211791992188, 76.6091537475586, 80.51618957519531, 84.4232177734375, 88.33025360107422, 92.2372817993164, 96.14431762695312, 100.05134582519531, 103.95838165283203, 107.86541748046875, 111.77245330810547, 115.67948150634766, 119.58651733398438, 123.49354553222656, 127.40058135986328, 131.3076171875, 135.2146453857422, 139.12167358398438]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 9.0, 8.0, 15.0, 21.0, 35.0, 32.0, 57.0, 85.0, 87.0, 125.0, 183.0, 296.0, 453.0, 757.0, 1263.0, 2186.0, 4207.0, 9122.0, 26010.0, 143518.0, 3820257.0, 140125.0, 25593.0, 9219.0, 4205.0, 2312.0, 1357.0, 886.0, 551.0, 385.0, 260.0, 159.0, 132.0, 75.0, 76.0, 47.0, 38.0, 29.0, 24.0, 16.0, 15.0, 14.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-15.078125, -14.5994873046875, -14.120849609375, -13.6422119140625, -13.16357421875, -12.6849365234375, -12.206298828125, -11.7276611328125, -11.2490234375, -10.7703857421875, -10.291748046875, -9.8131103515625, -9.33447265625, -8.8558349609375, -8.377197265625, -7.8985595703125, -7.419921875, -6.9412841796875, -6.462646484375, -5.9840087890625, -5.50537109375, -5.0267333984375, -4.548095703125, -4.0694580078125, -3.5908203125, -3.1121826171875, -2.633544921875, -2.1549072265625, -1.67626953125, -1.1976318359375, -0.718994140625, -0.2403564453125, 0.23828125, 0.7169189453125, 1.195556640625, 1.6741943359375, 2.15283203125, 2.6314697265625, 3.110107421875, 3.5887451171875, 4.0673828125, 4.5460205078125, 5.024658203125, 5.5032958984375, 5.98193359375, 6.4605712890625, 6.939208984375, 7.4178466796875, 7.896484375, 8.3751220703125, 8.853759765625, 9.3323974609375, 9.81103515625, 10.2896728515625, 10.768310546875, 11.2469482421875, 11.7255859375, 12.2042236328125, 12.682861328125, 13.1614990234375, 13.64013671875, 14.1187744140625, 14.597412109375, 15.0760498046875, 15.5546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 0.0, 4.0, 5.0, 6.0, 3.0, 5.0, 9.0, 8.0, 12.0, 18.0, 23.0, 37.0, 79.0, 94.0, 145.0, 165.0, 116.0, 84.0, 59.0, 27.0, 25.0, 12.0, 10.0, 5.0, 8.0, 2.0, 10.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.466796875, -1.4183349609375, -1.369873046875, -1.3214111328125, -1.27294921875, -1.2244873046875, -1.176025390625, -1.1275634765625, -1.0791015625, -1.0306396484375, -0.982177734375, -0.9337158203125, -0.88525390625, -0.8367919921875, -0.788330078125, -0.7398681640625, -0.69140625, -0.6429443359375, -0.594482421875, -0.5460205078125, -0.49755859375, -0.4490966796875, -0.400634765625, -0.3521728515625, -0.3037109375, -0.2552490234375, -0.206787109375, -0.1583251953125, -0.10986328125, -0.0614013671875, -0.012939453125, 0.0355224609375, 0.083984375, 0.1324462890625, 0.180908203125, 0.2293701171875, 0.27783203125, 0.3262939453125, 0.374755859375, 0.4232177734375, 0.4716796875, 0.5201416015625, 0.568603515625, 0.6170654296875, 0.66552734375, 0.7139892578125, 0.762451171875, 0.8109130859375, 0.859375, 0.9078369140625, 0.956298828125, 1.0047607421875, 1.05322265625, 1.1016845703125, 1.150146484375, 1.1986083984375, 1.2470703125, 1.2955322265625, 1.343994140625, 1.3924560546875, 1.44091796875, 1.4893798828125, 1.537841796875, 1.5863037109375, 1.634765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 22.0, 31.0, 37.0, 62.0, 69.0, 136.0, 185.0, 282.0, 514.0, 945.0, 1892.0, 4201.0, 12144.0, 57383.0, 2582382.0, 1466972.0, 49118.0, 10589.0, 3673.0, 1564.0, 856.0, 461.0, 268.0, 166.0, 106.0, 57.0, 44.0, 27.0, 19.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.59375, -12.1734619140625, -11.753173828125, -11.3328857421875, -10.91259765625, -10.4923095703125, -10.072021484375, -9.6517333984375, -9.2314453125, -8.8111572265625, -8.390869140625, -7.9705810546875, -7.55029296875, -7.1300048828125, -6.709716796875, -6.2894287109375, -5.869140625, -5.4488525390625, -5.028564453125, -4.6082763671875, -4.18798828125, -3.7677001953125, -3.347412109375, -2.9271240234375, -2.5068359375, -2.0865478515625, -1.666259765625, -1.2459716796875, -0.82568359375, -0.4053955078125, 0.014892578125, 0.4351806640625, 0.85546875, 1.2757568359375, 1.696044921875, 2.1163330078125, 2.53662109375, 2.9569091796875, 3.377197265625, 3.7974853515625, 4.2177734375, 4.6380615234375, 5.058349609375, 5.4786376953125, 5.89892578125, 6.3192138671875, 6.739501953125, 7.1597900390625, 7.580078125, 8.0003662109375, 8.420654296875, 8.8409423828125, 9.26123046875, 9.6815185546875, 10.101806640625, 10.5220947265625, 10.9423828125, 11.3626708984375, 11.782958984375, 12.2032470703125, 12.62353515625, 13.0438232421875, 13.464111328125, 13.8843994140625, 14.3046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 9.0, 10.0, 10.0, 19.0, 31.0, 49.0, 92.0, 230.0, 906.0, 1977.0, 410.0, 167.0, 57.0, 43.0, 22.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.242340087890625, -3.12725830078125, -3.012176513671875, -2.8970947265625, -2.782012939453125, -2.66693115234375, -2.551849365234375, -2.436767578125, -2.321685791015625, -2.20660400390625, -2.091522216796875, -1.9764404296875, -1.861358642578125, -1.74627685546875, -1.631195068359375, -1.51611328125, -1.401031494140625, -1.28594970703125, -1.170867919921875, -1.0557861328125, -0.940704345703125, -0.82562255859375, -0.710540771484375, -0.595458984375, -0.480377197265625, -0.36529541015625, -0.250213623046875, -0.1351318359375, -0.020050048828125, 0.09503173828125, 0.210113525390625, 0.3251953125, 0.440277099609375, 0.55535888671875, 0.670440673828125, 0.7855224609375, 0.900604248046875, 1.01568603515625, 1.130767822265625, 1.245849609375, 1.360931396484375, 1.47601318359375, 1.591094970703125, 1.7061767578125, 1.821258544921875, 1.93634033203125, 2.051422119140625, 2.16650390625, 2.281585693359375, 2.39666748046875, 2.511749267578125, 2.6268310546875, 2.741912841796875, 2.85699462890625, 2.972076416015625, 3.087158203125, 3.202239990234375, 3.31732177734375, 3.432403564453125, 3.5474853515625, 3.662567138671875, 3.77764892578125, 3.892730712890625, 4.0078125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 16.0, 46.0, 75.0, 183.0, 255.0, 200.0, 98.0, 46.0, 20.0, 15.0, 10.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.447733879089355, -14.952469825744629, -14.457205772399902, -13.96194076538086, -13.466676712036133, -12.971412658691406, -12.47614860534668, -11.980884552001953, -11.485620498657227, -10.9903564453125, -10.495092391967773, -9.999828338623047, -9.504563331604004, -9.009299278259277, -8.51403522491455, -8.018771171569824, -7.523506164550781, -7.028242111206055, -6.53297758102417, -6.037713527679443, -5.542448997497559, -5.047184944152832, -4.5519208908081055, -4.056656837463379, -3.561392307281494, -3.0661280155181885, -2.570863723754883, -2.0755996704101562, -1.5803353786468506, -1.085071086883545, -0.5898070335388184, -0.0945427417755127, 0.40072059631347656, 0.8959848284721375, 1.3912490606307983, 1.8865132331848145, 2.38177752494812, 2.877041816711426, 3.3723058700561523, 3.867570161819458, 4.362834453582764, 4.85809850692749, 5.353363037109375, 5.848627090454102, 6.343891143798828, 6.839155673980713, 7.3344197273254395, 7.829684257507324, 8.32494831085205, 8.820212364196777, 9.315476417541504, 9.810741424560547, 10.306005477905273, 10.80126953125, 11.296533584594727, 11.791797637939453, 12.28706169128418, 12.782325744628906, 13.277589797973633, 13.77285385131836, 14.268118858337402, 14.763382911682129, 15.258646965026855, 15.753911018371582, 16.249176025390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 13.0, 18.0, 41.0, 55.0, 80.0, 102.0, 101.0, 92.0, 92.0, 100.0, 80.0, 74.0, 46.0, 28.0, 15.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.30668067932129, -16.71780014038086, -16.128921508789062, -15.540040969848633, -14.951160430908203, -14.36228084564209, -13.773401260375977, -13.184520721435547, -12.595641136169434, -12.00676155090332, -11.41788101196289, -10.829001426696777, -10.240121841430664, -9.651241302490234, -9.062361717224121, -8.473482131958008, -7.884601593017578, -7.295721530914307, -6.706841468811035, -6.117961883544922, -5.52908182144165, -4.940201759338379, -4.351322174072266, -3.762442111968994, -3.1735620498657227, -2.584681987762451, -1.9958021640777588, -1.4069222211837769, -0.8180422782897949, -0.22916221618652344, 0.35971760749816895, 0.9485974311828613, 1.5374755859375, 2.1263556480407715, 2.715235471725464, 3.3041152954101562, 3.8929953575134277, 4.481875419616699, 5.0707550048828125, 5.659635066986084, 6.2485151290893555, 6.837395191192627, 7.426275253295898, 8.015154838562012, 8.604034423828125, 9.192914962768555, 9.781794548034668, 10.370674133300781, 10.959554672241211, 11.548434257507324, 12.137314796447754, 12.726194381713867, 13.315074920654297, 13.90395450592041, 14.492834091186523, 15.081714630126953, 15.670594215393066, 16.25947380065918, 16.84835433959961, 17.43723487854004, 18.026113510131836, 18.614994049072266, 19.203874588012695, 19.792753219604492, 20.381633758544922]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 14.0, 18.0, 21.0, 31.0, 27.0, 31.0, 47.0, 61.0, 116.0, 306.0, 1387.0, 11948.0, 682133.0, 341657.0, 9058.0, 1065.0, 253.0, 103.0, 67.0, 46.0, 28.0, 17.0, 24.0, 19.0, 11.0, 13.0, 17.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.590576171875, -28.63427734375, -27.677978515625, -26.7216796875, -25.765380859375, -24.80908203125, -23.852783203125, -22.896484375, -21.940185546875, -20.98388671875, -20.027587890625, -19.0712890625, -18.114990234375, -17.15869140625, -16.202392578125, -15.24609375, -14.289794921875, -13.33349609375, -12.377197265625, -11.4208984375, -10.464599609375, -9.50830078125, -8.552001953125, -7.595703125, -6.639404296875, -5.68310546875, -4.726806640625, -3.7705078125, -2.814208984375, -1.85791015625, -0.901611328125, 0.0546875, 1.010986328125, 1.96728515625, 2.923583984375, 3.8798828125, 4.836181640625, 5.79248046875, 6.748779296875, 7.705078125, 8.661376953125, 9.61767578125, 10.573974609375, 11.5302734375, 12.486572265625, 13.44287109375, 14.399169921875, 15.35546875, 16.311767578125, 17.26806640625, 18.224365234375, 19.1806640625, 20.136962890625, 21.09326171875, 22.049560546875, 23.005859375, 23.962158203125, 24.91845703125, 25.874755859375, 26.8310546875, 27.787353515625, 28.74365234375, 29.699951171875, 30.65625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 8.0, 5.0, 3.0, 8.0, 20.0, 36.0, 80.0, 194.0, 256.0, 211.0, 108.0, 34.0, 21.0, 10.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.8649368286132812, -0.7655181884765625, -0.6660995483398438, -0.566680908203125, -0.46726226806640625, -0.3678436279296875, -0.26842498779296875, -0.16900634765625, -0.06958770751953125, 0.0298309326171875, 0.12924957275390625, 0.228668212890625, 0.32808685302734375, 0.4275054931640625, 0.5269241333007812, 0.6263427734375, 0.7257614135742188, 0.8251800537109375, 0.9245986938476562, 1.024017333984375, 1.1234359741210938, 1.2228546142578125, 1.3222732543945312, 1.42169189453125, 1.5211105346679688, 1.6205291748046875, 1.7199478149414062, 1.819366455078125, 1.9187850952148438, 2.0182037353515625, 2.1176223754882812, 2.217041015625, 2.3164596557617188, 2.4158782958984375, 2.5152969360351562, 2.614715576171875, 2.7141342163085938, 2.8135528564453125, 2.9129714965820312, 3.01239013671875, 3.1118087768554688, 3.2112274169921875, 3.3106460571289062, 3.410064697265625, 3.5094833374023438, 3.6089019775390625, 3.7083206176757812, 3.8077392578125, 3.9071578979492188, 4.0065765380859375, 4.105995178222656, 4.205413818359375, 4.304832458496094, 4.4042510986328125, 4.503669738769531, 4.60308837890625, 4.702507019042969, 4.8019256591796875, 4.901344299316406, 5.000762939453125, 5.100181579589844, 5.1996002197265625, 5.299018859863281, 5.3984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 10.0, 11.0, 17.0, 40.0, 92.0, 238.0, 641.0, 1852.0, 5803.0, 22220.0, 109586.0, 581594.0, 264681.0, 45640.0, 11100.0, 3209.0, 1062.0, 420.0, 161.0, 93.0, 36.0, 24.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.27288818359375, -7.0106201171875, -6.74835205078125, -6.486083984375, -6.22381591796875, -5.9615478515625, -5.69927978515625, -5.43701171875, -5.17474365234375, -4.9124755859375, -4.65020751953125, -4.387939453125, -4.12567138671875, -3.8634033203125, -3.60113525390625, -3.3388671875, -3.07659912109375, -2.8143310546875, -2.55206298828125, -2.289794921875, -2.02752685546875, -1.7652587890625, -1.50299072265625, -1.24072265625, -0.97845458984375, -0.7161865234375, -0.45391845703125, -0.191650390625, 0.07061767578125, 0.3328857421875, 0.59515380859375, 0.857421875, 1.11968994140625, 1.3819580078125, 1.64422607421875, 1.906494140625, 2.16876220703125, 2.4310302734375, 2.69329833984375, 2.95556640625, 3.21783447265625, 3.4801025390625, 3.74237060546875, 4.004638671875, 4.26690673828125, 4.5291748046875, 4.79144287109375, 5.0537109375, 5.31597900390625, 5.5782470703125, 5.84051513671875, 6.102783203125, 6.36505126953125, 6.6273193359375, 6.88958740234375, 7.15185546875, 7.41412353515625, 7.6763916015625, 7.93865966796875, 8.200927734375, 8.46319580078125, 8.7254638671875, 8.98773193359375, 9.25]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 7.0, 4.0, 5.0, 11.0, 12.0, 12.0, 11.0, 15.0, 11.0, 20.0, 24.0, 18.0, 25.0, 24.0, 37.0, 40.0, 42.0, 27.0, 35.0, 39.0, 50.0, 35.0, 34.0, 37.0, 33.0, 34.0, 38.0, 35.0, 41.0, 27.0, 23.0, 25.0, 28.0, 24.0, 17.0, 22.0, 12.0, 9.0, 10.0, 11.0, 12.0, 10.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.0078125, -3.87786865234375, -3.7479248046875, -3.61798095703125, -3.488037109375, -3.35809326171875, -3.2281494140625, -3.09820556640625, -2.96826171875, -2.83831787109375, -2.7083740234375, -2.57843017578125, -2.448486328125, -2.31854248046875, -2.1885986328125, -2.05865478515625, -1.9287109375, -1.79876708984375, -1.6688232421875, -1.53887939453125, -1.408935546875, -1.27899169921875, -1.1490478515625, -1.01910400390625, -0.88916015625, -0.75921630859375, -0.6292724609375, -0.49932861328125, -0.369384765625, -0.23944091796875, -0.1094970703125, 0.02044677734375, 0.150390625, 0.28033447265625, 0.4102783203125, 0.54022216796875, 0.670166015625, 0.80010986328125, 0.9300537109375, 1.05999755859375, 1.18994140625, 1.31988525390625, 1.4498291015625, 1.57977294921875, 1.709716796875, 1.83966064453125, 1.9696044921875, 2.09954833984375, 2.2294921875, 2.35943603515625, 2.4893798828125, 2.61932373046875, 2.749267578125, 2.87921142578125, 3.0091552734375, 3.13909912109375, 3.26904296875, 3.39898681640625, 3.5289306640625, 3.65887451171875, 3.788818359375, 3.91876220703125, 4.0487060546875, 4.17864990234375, 4.30859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 11.0, 12.0, 20.0, 29.0, 48.0, 71.0, 151.0, 347.0, 881.0, 2933.0, 13729.0, 297899.0, 708249.0, 18893.0, 3512.0, 1021.0, 371.0, 155.0, 73.0, 51.0, 27.0, 24.0, 16.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.425537109375, -16.75732421875, -16.089111328125, -15.4208984375, -14.752685546875, -14.08447265625, -13.416259765625, -12.748046875, -12.079833984375, -11.41162109375, -10.743408203125, -10.0751953125, -9.406982421875, -8.73876953125, -8.070556640625, -7.40234375, -6.734130859375, -6.06591796875, -5.397705078125, -4.7294921875, -4.061279296875, -3.39306640625, -2.724853515625, -2.056640625, -1.388427734375, -0.72021484375, -0.052001953125, 0.6162109375, 1.284423828125, 1.95263671875, 2.620849609375, 3.2890625, 3.957275390625, 4.62548828125, 5.293701171875, 5.9619140625, 6.630126953125, 7.29833984375, 7.966552734375, 8.634765625, 9.302978515625, 9.97119140625, 10.639404296875, 11.3076171875, 11.975830078125, 12.64404296875, 13.312255859375, 13.98046875, 14.648681640625, 15.31689453125, 15.985107421875, 16.6533203125, 17.321533203125, 17.98974609375, 18.657958984375, 19.326171875, 19.994384765625, 20.66259765625, 21.330810546875, 21.9990234375, 22.667236328125, 23.33544921875, 24.003662109375, 24.671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 9.0, 7.0, 9.0, 8.0, 16.0, 13.0, 41.0, 67.0, 155.0, 274.0, 187.0, 88.0, 38.0, 28.0, 15.0, 8.0, 4.0, 9.0, 2.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007023811340332031, -0.0006793811917304993, -0.0006563812494277954, -0.0006333813071250916, -0.0006103813648223877, -0.0005873814225196838, -0.00056438148021698, -0.0005413815379142761, -0.0005183815956115723, -0.0004953816533088684, -0.00047238171100616455, -0.0004493817687034607, -0.00042638182640075684, -0.000403381884098053, -0.0003803819417953491, -0.00035738199949264526, -0.0003343820571899414, -0.00031138211488723755, -0.0002883821725845337, -0.00026538223028182983, -0.00024238228797912598, -0.00021938234567642212, -0.00019638240337371826, -0.0001733824610710144, -0.00015038251876831055, -0.0001273825764656067, -0.00010438263416290283, -8.138269186019897e-05, -5.838274955749512e-05, -3.538280725479126e-05, -1.2382864952087402e-05, 1.0617077350616455e-05, 3.361701965332031e-05, 5.661696195602417e-05, 7.961690425872803e-05, 0.00010261684656143188, 0.00012561678886413574, 0.0001486167311668396, 0.00017161667346954346, 0.00019461661577224731, 0.00021761655807495117, 0.00024061650037765503, 0.0002636164426803589, 0.00028661638498306274, 0.0003096163272857666, 0.00033261626958847046, 0.0003556162118911743, 0.0003786161541938782, 0.00040161609649658203, 0.0004246160387992859, 0.00044761598110198975, 0.0004706159234046936, 0.0004936158657073975, 0.0005166158080101013, 0.0005396157503128052, 0.000562615692615509, 0.0005856156349182129, 0.0006086155772209167, 0.0006316155195236206, 0.0006546154618263245, 0.0006776154041290283, 0.0007006153464317322, 0.000723615288734436, 0.0007466152310371399, 0.0007696151733398438]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 8.0, 12.0, 9.0, 27.0, 25.0, 48.0, 67.0, 74.0, 140.0, 177.0, 265.0, 460.0, 758.0, 1190.0, 2088.0, 3501.0, 6686.0, 13485.0, 30253.0, 87500.0, 411030.0, 357607.0, 77099.0, 27788.0, 12601.0, 6508.0, 3477.0, 2096.0, 1271.0, 755.0, 539.0, 335.0, 227.0, 147.0, 83.0, 72.0, 34.0, 36.0, 23.0, 8.0, 8.0, 12.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0], "bins": [-6.20703125, -6.0390625, -5.87109375, -5.703125, -5.53515625, -5.3671875, -5.19921875, -5.03125, -4.86328125, -4.6953125, -4.52734375, -4.359375, -4.19140625, -4.0234375, -3.85546875, -3.6875, -3.51953125, -3.3515625, -3.18359375, -3.015625, -2.84765625, -2.6796875, -2.51171875, -2.34375, -2.17578125, -2.0078125, -1.83984375, -1.671875, -1.50390625, -1.3359375, -1.16796875, -1.0, -0.83203125, -0.6640625, -0.49609375, -0.328125, -0.16015625, 0.0078125, 0.17578125, 0.34375, 0.51171875, 0.6796875, 0.84765625, 1.015625, 1.18359375, 1.3515625, 1.51953125, 1.6875, 1.85546875, 2.0234375, 2.19140625, 2.359375, 2.52734375, 2.6953125, 2.86328125, 3.03125, 3.19921875, 3.3671875, 3.53515625, 3.703125, 3.87109375, 4.0390625, 4.20703125, 4.375, 4.54296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 7.0, 14.0, 17.0, 21.0, 22.0, 31.0, 43.0, 52.0, 81.0, 108.0, 120.0, 99.0, 95.0, 78.0, 52.0, 31.0, 20.0, 11.0, 14.0, 16.0, 6.0, 3.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.879638671875, -6.66162109375, -6.443603515625, -6.2255859375, -6.007568359375, -5.78955078125, -5.571533203125, -5.353515625, -5.135498046875, -4.91748046875, -4.699462890625, -4.4814453125, -4.263427734375, -4.04541015625, -3.827392578125, -3.609375, -3.391357421875, -3.17333984375, -2.955322265625, -2.7373046875, -2.519287109375, -2.30126953125, -2.083251953125, -1.865234375, -1.647216796875, -1.42919921875, -1.211181640625, -0.9931640625, -0.775146484375, -0.55712890625, -0.339111328125, -0.12109375, 0.096923828125, 0.31494140625, 0.532958984375, 0.7509765625, 0.968994140625, 1.18701171875, 1.405029296875, 1.623046875, 1.841064453125, 2.05908203125, 2.277099609375, 2.4951171875, 2.713134765625, 2.93115234375, 3.149169921875, 3.3671875, 3.585205078125, 3.80322265625, 4.021240234375, 4.2392578125, 4.457275390625, 4.67529296875, 4.893310546875, 5.111328125, 5.329345703125, 5.54736328125, 5.765380859375, 5.9833984375, 6.201416015625, 6.41943359375, 6.637451171875, 6.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 55.0, 224.0, 373.0, 197.0, 82.0, 35.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.09200286865234, -82.81078338623047, -79.52957153320312, -76.24835205078125, -72.9671401977539, -69.68592071533203, -66.40470886230469, -63.12348937988281, -59.8422737121582, -56.561058044433594, -53.279842376708984, -49.998626708984375, -46.7174072265625, -43.436195373535156, -40.15497589111328, -36.87376022338867, -33.59254455566406, -30.311328887939453, -27.030113220214844, -23.7488956451416, -20.467679977416992, -17.186464309692383, -13.90524673461914, -10.624031066894531, -7.342815399169922, -4.061599254608154, -0.7803831100463867, 2.500833511352539, 5.782049179077148, 9.063264846801758, 12.344482421875, 15.62569808959961, 18.906906127929688, 22.188121795654297, 25.469337463378906, 28.75055503845215, 32.031768798828125, 35.31298828125, 38.59420394897461, 41.87541961669922, 45.15663528442383, 48.43785095214844, 51.71906661987305, 55.000282287597656, 58.28150177001953, 61.562713623046875, 64.84393310546875, 68.12515258789062, 71.40636444091797, 74.68758392333984, 77.96879577636719, 81.25001525878906, 84.5312271118164, 87.81244659423828, 91.09365844726562, 94.3748779296875, 97.65609741210938, 100.93731689453125, 104.2185287475586, 107.49974822998047, 110.78096008300781, 114.06217956542969, 117.34339904785156, 120.6246109008789, 123.90582275390625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 4.0, 1.0, 11.0, 6.0, 11.0, 9.0, 33.0, 31.0, 69.0, 93.0, 125.0, 157.0, 138.0, 127.0, 70.0, 59.0, 27.0, 11.0, 13.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-146.91952514648438, -143.66024780273438, -140.40098571777344, -137.14170837402344, -133.8824462890625, -130.6231689453125, -127.36390686035156, -124.10462951660156, -120.8453598022461, -117.58609008789062, -114.32682037353516, -111.06755065917969, -107.80828094482422, -104.54901123046875, -101.28973388671875, -98.03046417236328, -94.77119445800781, -91.51192474365234, -88.25265502929688, -84.9933853149414, -81.73411560058594, -78.47483825683594, -75.215576171875, -71.956298828125, -68.69703674316406, -65.4377670288086, -62.178497314453125, -58.919227600097656, -55.65995407104492, -52.40068435668945, -49.141414642333984, -45.88214111328125, -42.622867584228516, -39.36359786987305, -36.10432815551758, -32.845054626464844, -29.585784912109375, -26.326515197753906, -23.067245483398438, -19.807973861694336, -16.548704147338867, -13.289433479309082, -10.030162811279297, -6.770893096923828, -3.511622428894043, -0.2523517608642578, 3.006917953491211, 6.2661895751953125, 9.525459289550781, 12.784729957580566, 16.04400062561035, 19.30327033996582, 22.562541961669922, 25.82181167602539, 29.08108139038086, 32.340354919433594, 35.59962463378906, 38.85889434814453, 42.1181640625, 45.37743377685547, 48.6367073059082, 51.89597702026367, 55.15524673461914, 58.414520263671875, 61.67378616333008]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 17.0, 11.0, 26.0, 27.0, 35.0, 60.0, 83.0, 101.0, 122.0, 202.0, 370.0, 476.0, 876.0, 1513.0, 3140.0, 7553.0, 26726.0, 330810.0, 3736626.0, 64427.0, 12515.0, 4300.0, 1824.0, 948.0, 506.0, 329.0, 202.0, 149.0, 83.0, 68.0, 38.0, 29.0, 19.0, 17.0, 11.0, 9.0, 7.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-27.703125, -26.9970703125, -26.291015625, -25.5849609375, -24.87890625, -24.1728515625, -23.466796875, -22.7607421875, -22.0546875, -21.3486328125, -20.642578125, -19.9365234375, -19.23046875, -18.5244140625, -17.818359375, -17.1123046875, -16.40625, -15.7001953125, -14.994140625, -14.2880859375, -13.58203125, -12.8759765625, -12.169921875, -11.4638671875, -10.7578125, -10.0517578125, -9.345703125, -8.6396484375, -7.93359375, -7.2275390625, -6.521484375, -5.8154296875, -5.109375, -4.4033203125, -3.697265625, -2.9912109375, -2.28515625, -1.5791015625, -0.873046875, -0.1669921875, 0.5390625, 1.2451171875, 1.951171875, 2.6572265625, 3.36328125, 4.0693359375, 4.775390625, 5.4814453125, 6.1875, 6.8935546875, 7.599609375, 8.3056640625, 9.01171875, 9.7177734375, 10.423828125, 11.1298828125, 11.8359375, 12.5419921875, 13.248046875, 13.9541015625, 14.66015625, 15.3662109375, 16.072265625, 16.7783203125, 17.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 22.0, 24.0, 23.0, 30.0, 53.0, 66.0, 78.0, 109.0, 103.0, 89.0, 87.0, 72.0, 52.0, 44.0, 27.0, 28.0, 19.0, 4.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.32855224609375, -1.2899169921875, -1.25128173828125, -1.212646484375, -1.17401123046875, -1.1353759765625, -1.09674072265625, -1.05810546875, -1.01947021484375, -0.9808349609375, -0.94219970703125, -0.903564453125, -0.86492919921875, -0.8262939453125, -0.78765869140625, -0.7490234375, -0.71038818359375, -0.6717529296875, -0.63311767578125, -0.594482421875, -0.55584716796875, -0.5172119140625, -0.47857666015625, -0.43994140625, -0.40130615234375, -0.3626708984375, -0.32403564453125, -0.285400390625, -0.24676513671875, -0.2081298828125, -0.16949462890625, -0.130859375, -0.09222412109375, -0.0535888671875, -0.01495361328125, 0.023681640625, 0.06231689453125, 0.1009521484375, 0.13958740234375, 0.17822265625, 0.21685791015625, 0.2554931640625, 0.29412841796875, 0.332763671875, 0.37139892578125, 0.4100341796875, 0.44866943359375, 0.4873046875, 0.52593994140625, 0.5645751953125, 0.60321044921875, 0.641845703125, 0.68048095703125, 0.7191162109375, 0.75775146484375, 0.79638671875, 0.83502197265625, 0.8736572265625, 0.91229248046875, 0.950927734375, 0.98956298828125, 1.0281982421875, 1.06683349609375, 1.10546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 11.0, 7.0, 13.0, 11.0, 19.0, 21.0, 26.0, 55.0, 74.0, 115.0, 322.0, 1849.0, 42058.0, 4120392.0, 27128.0, 1508.0, 295.0, 124.0, 67.0, 42.0, 38.0, 19.0, 17.0, 9.0, 9.0, 6.0, 8.0, 4.0, 6.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.78125, -41.462890625, -40.14453125, -38.826171875, -37.5078125, -36.189453125, -34.87109375, -33.552734375, -32.234375, -30.916015625, -29.59765625, -28.279296875, -26.9609375, -25.642578125, -24.32421875, -23.005859375, -21.6875, -20.369140625, -19.05078125, -17.732421875, -16.4140625, -15.095703125, -13.77734375, -12.458984375, -11.140625, -9.822265625, -8.50390625, -7.185546875, -5.8671875, -4.548828125, -3.23046875, -1.912109375, -0.59375, 0.724609375, 2.04296875, 3.361328125, 4.6796875, 5.998046875, 7.31640625, 8.634765625, 9.953125, 11.271484375, 12.58984375, 13.908203125, 15.2265625, 16.544921875, 17.86328125, 19.181640625, 20.5, 21.818359375, 23.13671875, 24.455078125, 25.7734375, 27.091796875, 28.41015625, 29.728515625, 31.046875, 32.365234375, 33.68359375, 35.001953125, 36.3203125, 37.638671875, 38.95703125, 40.275390625, 41.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 7.0, 4.0, 10.0, 9.0, 13.0, 35.0, 35.0, 49.0, 76.0, 140.0, 215.0, 421.0, 1052.0, 950.0, 379.0, 218.0, 134.0, 92.0, 61.0, 43.0, 30.0, 19.0, 14.0, 11.0, 12.0, 1.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.8910675048828125, -1.828033447265625, -1.7649993896484375, -1.70196533203125, -1.6389312744140625, -1.575897216796875, -1.5128631591796875, -1.4498291015625, -1.3867950439453125, -1.323760986328125, -1.2607269287109375, -1.19769287109375, -1.1346588134765625, -1.071624755859375, -1.0085906982421875, -0.945556640625, -0.8825225830078125, -0.819488525390625, -0.7564544677734375, -0.69342041015625, -0.6303863525390625, -0.567352294921875, -0.5043182373046875, -0.4412841796875, -0.3782501220703125, -0.315216064453125, -0.2521820068359375, -0.18914794921875, -0.1261138916015625, -0.063079833984375, -4.57763671875e-05, 0.06298828125, 0.1260223388671875, 0.189056396484375, 0.2520904541015625, 0.31512451171875, 0.3781585693359375, 0.441192626953125, 0.5042266845703125, 0.5672607421875, 0.6302947998046875, 0.693328857421875, 0.7563629150390625, 0.81939697265625, 0.8824310302734375, 0.945465087890625, 1.0084991455078125, 1.071533203125, 1.1345672607421875, 1.197601318359375, 1.2606353759765625, 1.32366943359375, 1.3867034912109375, 1.449737548828125, 1.5127716064453125, 1.5758056640625, 1.6388397216796875, 1.701873779296875, 1.7649078369140625, 1.82794189453125, 1.8909759521484375, 1.954010009765625, 2.0170440673828125, 2.080078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 7.0, 8.0, 25.0, 33.0, 61.0, 122.0, 201.0, 234.0, 143.0, 82.0, 37.0, 25.0, 5.0, 13.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.572629928588867, -22.10427474975586, -21.635921478271484, -21.167566299438477, -20.6992130279541, -20.230857849121094, -19.76250457763672, -19.29414939880371, -18.825794219970703, -18.357439041137695, -17.88908576965332, -17.420730590820312, -16.952377319335938, -16.48402214050293, -16.015668869018555, -15.547313690185547, -15.078960418701172, -14.61060619354248, -14.142251968383789, -13.673897743225098, -13.205543518066406, -12.737188339233398, -12.268834114074707, -11.800479888916016, -11.332125663757324, -10.863771438598633, -10.395417213439941, -9.92706298828125, -9.458707809448242, -8.990354537963867, -8.52199935913086, -8.053645133972168, -7.585291862487793, -7.116937637329102, -6.64858341217041, -6.1802287101745605, -5.711874485015869, -5.243520259857178, -4.775165557861328, -4.306811332702637, -3.8384571075439453, -3.370102882385254, -2.9017484188079834, -2.433393955230713, -1.9650397300720215, -1.49668550491333, -1.0283310413360596, -0.5599765777587891, -0.09162235260009766, 0.3767319917678833, 0.8450863361358643, 1.3134406805038452, 1.7817950248718262, 2.2501492500305176, 2.718503713607788, 3.1868581771850586, 3.65521240234375, 4.123566627502441, 4.591920852661133, 5.060275554656982, 5.528629779815674, 5.996984004974365, 6.465338706970215, 6.933692932128906, 7.402047157287598]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 4.0, 8.0, 6.0, 17.0, 14.0, 19.0, 18.0, 21.0, 34.0, 29.0, 33.0, 49.0, 50.0, 40.0, 49.0, 47.0, 46.0, 59.0, 67.0, 37.0, 37.0, 54.0, 26.0, 39.0, 29.0, 30.0, 24.0, 16.0, 20.0, 14.0, 11.0, 9.0, 4.0, 5.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.331695556640625, -7.072372913360596, -6.813050270080566, -6.553727626800537, -6.294404983520508, -6.035082817077637, -5.775760173797607, -5.516437530517578, -5.257114887237549, -4.9977922439575195, -4.73846960067749, -4.479146957397461, -4.21982479095459, -3.9605019092559814, -3.7011795043945312, -3.441856861114502, -3.1825342178344727, -2.9232115745544434, -2.663888931274414, -2.404566526412964, -2.1452438831329346, -1.8859212398529053, -1.6265987157821655, -1.3672761917114258, -1.1079535484313965, -0.848630964756012, -0.5893083810806274, -0.3299857974052429, -0.0706632137298584, 0.1886594295501709, 0.44798195362091064, 0.7073044776916504, 0.9666271209716797, 1.225949764251709, 1.4852722883224487, 1.7445948123931885, 2.0039174556732178, 2.263240098953247, 2.5225625038146973, 2.7818851470947266, 3.041207790374756, 3.300530433654785, 3.5598530769348145, 3.8191754817962646, 4.078497886657715, 4.337821006774902, 4.597143173217773, 4.856465816497803, 5.115788459777832, 5.375111103057861, 5.634433746337891, 5.89375638961792, 6.153079032897949, 6.41240119934082, 6.67172384262085, 6.931046485900879, 7.190369129180908, 7.4496917724609375, 7.709014415740967, 7.968337059020996, 8.227659225463867, 8.486982345581055, 8.746304512023926, 9.005626678466797, 9.264949798583984]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 6.0, 17.0, 17.0, 26.0, 27.0, 29.0, 49.0, 70.0, 112.0, 137.0, 220.0, 391.0, 671.0, 1205.0, 2312.0, 5060.0, 12634.0, 38962.0, 155308.0, 485195.0, 253752.0, 61041.0, 17917.0, 6690.0, 3040.0, 1518.0, 795.0, 463.0, 304.0, 182.0, 112.0, 93.0, 50.0, 37.0, 25.0, 16.0, 14.0, 10.0, 12.0, 8.0, 5.0, 13.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.5330810546875, -6.320068359375, -6.1070556640625, -5.89404296875, -5.6810302734375, -5.468017578125, -5.2550048828125, -5.0419921875, -4.8289794921875, -4.615966796875, -4.4029541015625, -4.18994140625, -3.9769287109375, -3.763916015625, -3.5509033203125, -3.337890625, -3.1248779296875, -2.911865234375, -2.6988525390625, -2.48583984375, -2.2728271484375, -2.059814453125, -1.8468017578125, -1.6337890625, -1.4207763671875, -1.207763671875, -0.9947509765625, -0.78173828125, -0.5687255859375, -0.355712890625, -0.1427001953125, 0.0703125, 0.2833251953125, 0.496337890625, 0.7093505859375, 0.92236328125, 1.1353759765625, 1.348388671875, 1.5614013671875, 1.7744140625, 1.9874267578125, 2.200439453125, 2.4134521484375, 2.62646484375, 2.8394775390625, 3.052490234375, 3.2655029296875, 3.478515625, 3.6915283203125, 3.904541015625, 4.1175537109375, 4.33056640625, 4.5435791015625, 4.756591796875, 4.9696044921875, 5.1826171875, 5.3956298828125, 5.608642578125, 5.8216552734375, 6.03466796875, 6.2476806640625, 6.460693359375, 6.6737060546875, 6.88671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 11.0, 11.0, 18.0, 22.0, 41.0, 65.0, 53.0, 75.0, 81.0, 85.0, 101.0, 90.0, 74.0, 54.0, 56.0, 41.0, 36.0, 19.0, 15.0, 8.0, 18.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.177734375, -1.1412353515625, -1.104736328125, -1.0682373046875, -1.03173828125, -0.9952392578125, -0.958740234375, -0.9222412109375, -0.8857421875, -0.8492431640625, -0.812744140625, -0.7762451171875, -0.73974609375, -0.7032470703125, -0.666748046875, -0.6302490234375, -0.59375, -0.5572509765625, -0.520751953125, -0.4842529296875, -0.44775390625, -0.4112548828125, -0.374755859375, -0.3382568359375, -0.3017578125, -0.2652587890625, -0.228759765625, -0.1922607421875, -0.15576171875, -0.1192626953125, -0.082763671875, -0.0462646484375, -0.009765625, 0.0267333984375, 0.063232421875, 0.0997314453125, 0.13623046875, 0.1727294921875, 0.209228515625, 0.2457275390625, 0.2822265625, 0.3187255859375, 0.355224609375, 0.3917236328125, 0.42822265625, 0.4647216796875, 0.501220703125, 0.5377197265625, 0.57421875, 0.6107177734375, 0.647216796875, 0.6837158203125, 0.72021484375, 0.7567138671875, 0.793212890625, 0.8297119140625, 0.8662109375, 0.9027099609375, 0.939208984375, 0.9757080078125, 1.01220703125, 1.0487060546875, 1.085205078125, 1.1217041015625, 1.158203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 17.0, 27.0, 34.0, 49.0, 68.0, 97.0, 132.0, 226.0, 314.0, 457.0, 729.0, 1193.0, 2172.0, 4060.0, 8327.0, 18467.0, 45531.0, 121040.0, 300873.0, 320023.0, 134604.0, 49943.0, 20462.0, 9251.0, 4485.0, 2295.0, 1288.0, 802.0, 525.0, 315.0, 224.0, 161.0, 102.0, 76.0, 52.0, 37.0, 24.0, 17.0, 14.0, 13.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9334716796875, -4.769287109375, -4.6051025390625, -4.44091796875, -4.2767333984375, -4.112548828125, -3.9483642578125, -3.7841796875, -3.6199951171875, -3.455810546875, -3.2916259765625, -3.12744140625, -2.9632568359375, -2.799072265625, -2.6348876953125, -2.470703125, -2.3065185546875, -2.142333984375, -1.9781494140625, -1.81396484375, -1.6497802734375, -1.485595703125, -1.3214111328125, -1.1572265625, -0.9930419921875, -0.828857421875, -0.6646728515625, -0.50048828125, -0.3363037109375, -0.172119140625, -0.0079345703125, 0.15625, 0.3204345703125, 0.484619140625, 0.6488037109375, 0.81298828125, 0.9771728515625, 1.141357421875, 1.3055419921875, 1.4697265625, 1.6339111328125, 1.798095703125, 1.9622802734375, 2.12646484375, 2.2906494140625, 2.454833984375, 2.6190185546875, 2.783203125, 2.9473876953125, 3.111572265625, 3.2757568359375, 3.43994140625, 3.6041259765625, 3.768310546875, 3.9324951171875, 4.0966796875, 4.2608642578125, 4.425048828125, 4.5892333984375, 4.75341796875, 4.9176025390625, 5.081787109375, 5.2459716796875, 5.41015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 3.0, 9.0, 8.0, 13.0, 18.0, 17.0, 29.0, 17.0, 29.0, 28.0, 29.0, 25.0, 29.0, 33.0, 35.0, 41.0, 46.0, 32.0, 44.0, 51.0, 46.0, 42.0, 46.0, 38.0, 31.0, 28.0, 27.0, 30.0, 34.0, 19.0, 20.0, 12.0, 16.0, 11.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.25836181640625, -4.1143798828125, -3.97039794921875, -3.826416015625, -3.68243408203125, -3.5384521484375, -3.39447021484375, -3.25048828125, -3.10650634765625, -2.9625244140625, -2.81854248046875, -2.674560546875, -2.53057861328125, -2.3865966796875, -2.24261474609375, -2.0986328125, -1.95465087890625, -1.8106689453125, -1.66668701171875, -1.522705078125, -1.37872314453125, -1.2347412109375, -1.09075927734375, -0.94677734375, -0.80279541015625, -0.6588134765625, -0.51483154296875, -0.370849609375, -0.22686767578125, -0.0828857421875, 0.06109619140625, 0.205078125, 0.34906005859375, 0.4930419921875, 0.63702392578125, 0.781005859375, 0.92498779296875, 1.0689697265625, 1.21295166015625, 1.35693359375, 1.50091552734375, 1.6448974609375, 1.78887939453125, 1.932861328125, 2.07684326171875, 2.2208251953125, 2.36480712890625, 2.5087890625, 2.65277099609375, 2.7967529296875, 2.94073486328125, 3.084716796875, 3.22869873046875, 3.3726806640625, 3.51666259765625, 3.66064453125, 3.80462646484375, 3.9486083984375, 4.09259033203125, 4.236572265625, 4.38055419921875, 4.5245361328125, 4.66851806640625, 4.8125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 7.0, 13.0, 13.0, 20.0, 47.0, 61.0, 128.0, 196.0, 414.0, 831.0, 1995.0, 5977.0, 25434.0, 194822.0, 685341.0, 108895.0, 16926.0, 4436.0, 1558.0, 674.0, 328.0, 162.0, 102.0, 58.0, 37.0, 20.0, 19.0, 10.0, 8.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.8658447265625, -8.583251953125, -8.3006591796875, -8.01806640625, -7.7354736328125, -7.452880859375, -7.1702880859375, -6.8876953125, -6.6051025390625, -6.322509765625, -6.0399169921875, -5.75732421875, -5.4747314453125, -5.192138671875, -4.9095458984375, -4.626953125, -4.3443603515625, -4.061767578125, -3.7791748046875, -3.49658203125, -3.2139892578125, -2.931396484375, -2.6488037109375, -2.3662109375, -2.0836181640625, -1.801025390625, -1.5184326171875, -1.23583984375, -0.9532470703125, -0.670654296875, -0.3880615234375, -0.10546875, 0.1771240234375, 0.459716796875, 0.7423095703125, 1.02490234375, 1.3074951171875, 1.590087890625, 1.8726806640625, 2.1552734375, 2.4378662109375, 2.720458984375, 3.0030517578125, 3.28564453125, 3.5682373046875, 3.850830078125, 4.1334228515625, 4.416015625, 4.6986083984375, 4.981201171875, 5.2637939453125, 5.54638671875, 5.8289794921875, 6.111572265625, 6.3941650390625, 6.6767578125, 6.9593505859375, 7.241943359375, 7.5245361328125, 7.80712890625, 8.0897216796875, 8.372314453125, 8.6549072265625, 8.9375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 14.0, 10.0, 8.0, 18.0, 23.0, 22.0, 29.0, 31.0, 46.0, 55.0, 59.0, 77.0, 78.0, 78.0, 78.0, 68.0, 50.0, 34.0, 47.0, 30.0, 22.0, 15.0, 17.0, 14.0, 14.0, 11.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0005249977111816406, -0.0005104541778564453, -0.00049591064453125, -0.0004813671112060547, -0.0004668235778808594, -0.00045228004455566406, -0.00043773651123046875, -0.00042319297790527344, -0.0004086494445800781, -0.0003941059112548828, -0.0003795623779296875, -0.0003650188446044922, -0.0003504753112792969, -0.00033593177795410156, -0.00032138824462890625, -0.00030684471130371094, -0.0002923011779785156, -0.0002777576446533203, -0.000263214111328125, -0.0002486705780029297, -0.00023412704467773438, -0.00021958351135253906, -0.00020503997802734375, -0.00019049644470214844, -0.00017595291137695312, -0.0001614093780517578, -0.0001468658447265625, -0.0001323223114013672, -0.00011777877807617188, -0.00010323524475097656, -8.869171142578125e-05, -7.414817810058594e-05, -5.9604644775390625e-05, -4.506111145019531e-05, -3.0517578125e-05, -1.5974044799804688e-05, -1.430511474609375e-06, 1.3113021850585938e-05, 2.765655517578125e-05, 4.220008850097656e-05, 5.6743621826171875e-05, 7.128715515136719e-05, 8.58306884765625e-05, 0.00010037422180175781, 0.00011491775512695312, 0.00012946128845214844, 0.00014400482177734375, 0.00015854835510253906, 0.00017309188842773438, 0.0001876354217529297, 0.000202178955078125, 0.0002167224884033203, 0.00023126602172851562, 0.00024580955505371094, 0.00026035308837890625, 0.00027489662170410156, 0.0002894401550292969, 0.0003039836883544922, 0.0003185272216796875, 0.0003330707550048828, 0.0003476142883300781, 0.00036215782165527344, 0.00037670135498046875, 0.00039124488830566406, 0.0004057884216308594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 9.0, 21.0, 17.0, 32.0, 46.0, 65.0, 79.0, 142.0, 217.0, 262.0, 484.0, 922.0, 1747.0, 3388.0, 7869.0, 19226.0, 55955.0, 192765.0, 468078.0, 203753.0, 58059.0, 19659.0, 7865.0, 3669.0, 1766.0, 939.0, 563.0, 346.0, 186.0, 112.0, 81.0, 64.0, 41.0, 36.0, 21.0, 18.0, 12.0, 11.0, 8.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.88671875, -4.7364501953125, -4.586181640625, -4.4359130859375, -4.28564453125, -4.1353759765625, -3.985107421875, -3.8348388671875, -3.6845703125, -3.5343017578125, -3.384033203125, -3.2337646484375, -3.08349609375, -2.9332275390625, -2.782958984375, -2.6326904296875, -2.482421875, -2.3321533203125, -2.181884765625, -2.0316162109375, -1.88134765625, -1.7310791015625, -1.580810546875, -1.4305419921875, -1.2802734375, -1.1300048828125, -0.979736328125, -0.8294677734375, -0.67919921875, -0.5289306640625, -0.378662109375, -0.2283935546875, -0.078125, 0.0721435546875, 0.222412109375, 0.3726806640625, 0.52294921875, 0.6732177734375, 0.823486328125, 0.9737548828125, 1.1240234375, 1.2742919921875, 1.424560546875, 1.5748291015625, 1.72509765625, 1.8753662109375, 2.025634765625, 2.1759033203125, 2.326171875, 2.4764404296875, 2.626708984375, 2.7769775390625, 2.92724609375, 3.0775146484375, 3.227783203125, 3.3780517578125, 3.5283203125, 3.6785888671875, 3.828857421875, 3.9791259765625, 4.12939453125, 4.2796630859375, 4.429931640625, 4.5802001953125, 4.73046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 6.0, 9.0, 10.0, 9.0, 14.0, 19.0, 15.0, 15.0, 24.0, 34.0, 48.0, 57.0, 64.0, 62.0, 85.0, 73.0, 75.0, 68.0, 53.0, 43.0, 46.0, 24.0, 28.0, 12.0, 22.0, 18.0, 11.0, 6.0, 5.0, 7.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.51953125, -3.4129638671875, -3.306396484375, -3.1998291015625, -3.09326171875, -2.9866943359375, -2.880126953125, -2.7735595703125, -2.6669921875, -2.5604248046875, -2.453857421875, -2.3472900390625, -2.24072265625, -2.1341552734375, -2.027587890625, -1.9210205078125, -1.814453125, -1.7078857421875, -1.601318359375, -1.4947509765625, -1.38818359375, -1.2816162109375, -1.175048828125, -1.0684814453125, -0.9619140625, -0.8553466796875, -0.748779296875, -0.6422119140625, -0.53564453125, -0.4290771484375, -0.322509765625, -0.2159423828125, -0.109375, -0.0028076171875, 0.103759765625, 0.2103271484375, 0.31689453125, 0.4234619140625, 0.530029296875, 0.6365966796875, 0.7431640625, 0.8497314453125, 0.956298828125, 1.0628662109375, 1.16943359375, 1.2760009765625, 1.382568359375, 1.4891357421875, 1.595703125, 1.7022705078125, 1.808837890625, 1.9154052734375, 2.02197265625, 2.1285400390625, 2.235107421875, 2.3416748046875, 2.4482421875, 2.5548095703125, 2.661376953125, 2.7679443359375, 2.87451171875, 2.9810791015625, 3.087646484375, 3.1942138671875, 3.30078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 21.0, 44.0, 104.0, 221.0, 285.0, 154.0, 84.0, 31.0, 24.0, 8.0, 5.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.89102172851562, -80.39715576171875, -77.9032974243164, -75.40943145751953, -72.91557312011719, -70.42170715332031, -67.92784118652344, -65.43397521972656, -62.94011688232422, -60.44625473022461, -57.952392578125, -55.458526611328125, -52.964664459228516, -50.470802307128906, -47.97693634033203, -45.48307418823242, -42.98921203613281, -40.4953498840332, -38.001487731933594, -35.50762176513672, -33.01375961303711, -30.5198974609375, -28.026033401489258, -25.532169342041016, -23.038307189941406, -20.544445037841797, -18.050580978393555, -15.556717872619629, -13.062854766845703, -10.568991661071777, -8.075128555297852, -5.581264495849609, -3.08740234375, -0.5935392379760742, 1.9003238677978516, 4.394186973571777, 6.888050079345703, 9.381913185119629, 11.875776290893555, 14.369640350341797, 16.863502502441406, 19.357364654541016, 21.851228713989258, 24.3450927734375, 26.83895492553711, 29.33281707763672, 31.82668113708496, 34.3205451965332, 36.81440734863281, 39.30826950073242, 41.80213165283203, 44.295997619628906, 46.789859771728516, 49.283721923828125, 51.777587890625, 54.27145004272461, 56.76531219482422, 59.25917434692383, 61.75303649902344, 64.24690246582031, 66.74076843261719, 69.23462677001953, 71.7284927368164, 74.22235107421875, 76.71621704101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 5.0, 4.0, 10.0, 17.0, 19.0, 34.0, 48.0, 45.0, 42.0, 71.0, 71.0, 92.0, 84.0, 81.0, 80.0, 73.0, 55.0, 51.0, 27.0, 32.0, 26.0, 17.0, 12.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.71028137207031, -71.56988525390625, -69.42948913574219, -67.28909301757812, -65.14869689941406, -63.008296966552734, -60.86790084838867, -58.72750473022461, -56.58710479736328, -54.44670867919922, -52.306312561035156, -50.165916442871094, -48.025516510009766, -45.8851203918457, -43.74472427368164, -41.60432815551758, -39.463932037353516, -37.32353591918945, -35.18313980102539, -33.04273986816406, -30.90234375, -28.761947631835938, -26.621551513671875, -24.481155395507812, -22.340757369995117, -20.200361251831055, -18.05996322631836, -15.919567108154297, -13.779170036315918, -11.638772964477539, -9.498376846313477, -7.357979774475098, -5.217578887939453, -3.0771820545196533, -0.9367852210998535, 1.2036113739013672, 3.344008445739746, 5.484405517578125, 7.6248016357421875, 9.765198707580566, 11.905595779418945, 14.045992851257324, 16.186389923095703, 18.326786041259766, 20.467182159423828, 22.607580184936523, 24.747976303100586, 26.88837432861328, 29.028770446777344, 31.169166564941406, 33.30956268310547, 35.44995880126953, 37.59035873413086, 39.73075485229492, 41.871150970458984, 44.01154708862305, 46.151947021484375, 48.29234313964844, 50.4327392578125, 52.57313537597656, 54.71353530883789, 56.85393142700195, 58.994327545166016, 61.13472366333008, 63.27511978149414]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 22.0, 28.0, 52.0, 74.0, 188.0, 423.0, 1182.0, 5581.0, 83519.0, 4070554.0, 28111.0, 3096.0, 798.0, 320.0, 128.0, 70.0, 44.0, 17.0, 15.0, 9.0, 7.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.56005859375, -45.0263671875, -43.49267578125, -41.958984375, -40.42529296875, -38.8916015625, -37.35791015625, -35.82421875, -34.29052734375, -32.7568359375, -31.22314453125, -29.689453125, -28.15576171875, -26.6220703125, -25.08837890625, -23.5546875, -22.02099609375, -20.4873046875, -18.95361328125, -17.419921875, -15.88623046875, -14.3525390625, -12.81884765625, -11.28515625, -9.75146484375, -8.2177734375, -6.68408203125, -5.150390625, -3.61669921875, -2.0830078125, -0.54931640625, 0.984375, 2.51806640625, 4.0517578125, 5.58544921875, 7.119140625, 8.65283203125, 10.1865234375, 11.72021484375, 13.25390625, 14.78759765625, 16.3212890625, 17.85498046875, 19.388671875, 20.92236328125, 22.4560546875, 23.98974609375, 25.5234375, 27.05712890625, 28.5908203125, 30.12451171875, 31.658203125, 33.19189453125, 34.7255859375, 36.25927734375, 37.79296875, 39.32666015625, 40.8603515625, 42.39404296875, 43.927734375, 45.46142578125, 46.9951171875, 48.52880859375, 50.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 18.0, 25.0, 55.0, 81.0, 88.0, 107.0, 128.0, 135.0, 101.0, 75.0, 57.0, 40.0, 25.0, 15.0, 10.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.14447021484375, -2.0721435546875, -1.99981689453125, -1.927490234375, -1.85516357421875, -1.7828369140625, -1.71051025390625, -1.63818359375, -1.56585693359375, -1.4935302734375, -1.42120361328125, -1.348876953125, -1.27655029296875, -1.2042236328125, -1.13189697265625, -1.0595703125, -0.98724365234375, -0.9149169921875, -0.84259033203125, -0.770263671875, -0.69793701171875, -0.6256103515625, -0.55328369140625, -0.48095703125, -0.40863037109375, -0.3363037109375, -0.26397705078125, -0.191650390625, -0.11932373046875, -0.0469970703125, 0.02532958984375, 0.09765625, 0.16998291015625, 0.2423095703125, 0.31463623046875, 0.386962890625, 0.45928955078125, 0.5316162109375, 0.60394287109375, 0.67626953125, 0.74859619140625, 0.8209228515625, 0.89324951171875, 0.965576171875, 1.03790283203125, 1.1102294921875, 1.18255615234375, 1.2548828125, 1.32720947265625, 1.3995361328125, 1.47186279296875, 1.544189453125, 1.61651611328125, 1.6888427734375, 1.76116943359375, 1.83349609375, 1.90582275390625, 1.9781494140625, 2.05047607421875, 2.122802734375, 2.19512939453125, 2.2674560546875, 2.33978271484375, 2.412109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 12.0, 19.0, 17.0, 53.0, 84.0, 173.0, 475.0, 1422.0, 6001.0, 38081.0, 918811.0, 3150955.0, 65417.0, 9265.0, 2202.0, 714.0, 265.0, 156.0, 67.0, 36.0, 23.0, 18.0, 7.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.875, -16.349609375, -15.82421875, -15.298828125, -14.7734375, -14.248046875, -13.72265625, -13.197265625, -12.671875, -12.146484375, -11.62109375, -11.095703125, -10.5703125, -10.044921875, -9.51953125, -8.994140625, -8.46875, -7.943359375, -7.41796875, -6.892578125, -6.3671875, -5.841796875, -5.31640625, -4.791015625, -4.265625, -3.740234375, -3.21484375, -2.689453125, -2.1640625, -1.638671875, -1.11328125, -0.587890625, -0.0625, 0.462890625, 0.98828125, 1.513671875, 2.0390625, 2.564453125, 3.08984375, 3.615234375, 4.140625, 4.666015625, 5.19140625, 5.716796875, 6.2421875, 6.767578125, 7.29296875, 7.818359375, 8.34375, 8.869140625, 9.39453125, 9.919921875, 10.4453125, 10.970703125, 11.49609375, 12.021484375, 12.546875, 13.072265625, 13.59765625, 14.123046875, 14.6484375, 15.173828125, 15.69921875, 16.224609375, 16.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 9.0, 6.0, 8.0, 13.0, 13.0, 28.0, 42.0, 45.0, 73.0, 77.0, 149.0, 194.0, 409.0, 850.0, 970.0, 430.0, 232.0, 163.0, 89.0, 64.0, 39.0, 31.0, 28.0, 16.0, 11.0, 17.0, 15.0, 10.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.943359375, -1.874114990234375, -1.80487060546875, -1.735626220703125, -1.6663818359375, -1.597137451171875, -1.52789306640625, -1.458648681640625, -1.389404296875, -1.320159912109375, -1.25091552734375, -1.181671142578125, -1.1124267578125, -1.043182373046875, -0.97393798828125, -0.904693603515625, -0.83544921875, -0.766204833984375, -0.69696044921875, -0.627716064453125, -0.5584716796875, -0.489227294921875, -0.41998291015625, -0.350738525390625, -0.281494140625, -0.212249755859375, -0.14300537109375, -0.073760986328125, -0.0045166015625, 0.064727783203125, 0.13397216796875, 0.203216552734375, 0.2724609375, 0.341705322265625, 0.41094970703125, 0.480194091796875, 0.5494384765625, 0.618682861328125, 0.68792724609375, 0.757171630859375, 0.826416015625, 0.895660400390625, 0.96490478515625, 1.034149169921875, 1.1033935546875, 1.172637939453125, 1.24188232421875, 1.311126708984375, 1.38037109375, 1.449615478515625, 1.51885986328125, 1.588104248046875, 1.6573486328125, 1.726593017578125, 1.79583740234375, 1.865081787109375, 1.934326171875, 2.003570556640625, 2.07281494140625, 2.142059326171875, 2.2113037109375, 2.280548095703125, 2.34979248046875, 2.419036865234375, 2.48828125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 24.0, 81.0, 262.0, 384.0, 187.0, 50.0, 10.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.276119232177734, -47.077842712402344, -45.87956619262695, -44.68128967285156, -43.48301696777344, -42.28474044799805, -41.086463928222656, -39.888187408447266, -38.689910888671875, -37.491634368896484, -36.293357849121094, -35.0950813293457, -33.89680480957031, -32.69853210449219, -31.500255584716797, -30.301979064941406, -29.103702545166016, -27.905426025390625, -26.707149505615234, -25.508874893188477, -24.310598373413086, -23.112321853637695, -21.914047241210938, -20.715770721435547, -19.517494201660156, -18.319217681884766, -17.120941162109375, -15.922666549682617, -14.724390029907227, -13.526113510131836, -12.327837944030762, -11.129562377929688, -9.931282043457031, -8.73300552368164, -7.534729957580566, -6.336453914642334, -5.138177871704102, -3.939901828765869, -2.7416257858276367, -1.5433502197265625, -0.3450736999511719, 0.8532023429870605, 2.051478385925293, 3.2497544288635254, 4.448030471801758, 5.64630651473999, 6.844582557678223, 8.042858123779297, 9.241134643554688, 10.439411163330078, 11.637686729431152, 12.835962295532227, 14.034238815307617, 15.232515335083008, 16.430789947509766, 17.629066467285156, 18.827342987060547, 20.025619506835938, 21.223896026611328, 22.422170639038086, 23.620447158813477, 24.818723678588867, 26.016998291015625, 27.215274810791016, 28.413551330566406]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 8.0, 15.0, 18.0, 18.0, 19.0, 27.0, 37.0, 44.0, 54.0, 56.0, 47.0, 62.0, 53.0, 55.0, 53.0, 56.0, 56.0, 53.0, 43.0, 34.0, 36.0, 31.0, 23.0, 27.0, 14.0, 15.0, 8.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.976312637329102, -12.615527153015137, -12.254741668701172, -11.893956184387207, -11.533170700073242, -11.172384262084961, -10.811599731445312, -10.450813293457031, -10.090027809143066, -9.729242324829102, -9.368456840515137, -9.007671356201172, -8.646885871887207, -8.286100387573242, -7.925314426422119, -7.564528465270996, -7.2037434577941895, -6.842957973480225, -6.48217248916626, -6.121386528015137, -5.760601043701172, -5.399815559387207, -5.039030075073242, -4.678244590759277, -4.3174591064453125, -3.9566736221313477, -3.5958878993988037, -3.235102415084839, -2.874316692352295, -2.51353120803833, -2.1527457237243652, -1.7919600009918213, -1.4311742782592773, -1.070388674736023, -0.7096031308174133, -0.3488175868988037, 0.011968016624450684, 0.3727536201477051, 0.7335391044616699, 1.0943248271942139, 1.4551103115081787, 1.815895915031433, 2.1766815185546875, 2.5374670028686523, 2.898252487182617, 3.259038209915161, 3.619823694229126, 3.98060941696167, 4.341394901275635, 4.7021803855896, 5.0629658699035645, 5.4237518310546875, 5.784537315368652, 6.145322799682617, 6.506108283996582, 6.866893768310547, 7.227679252624512, 7.588464736938477, 7.949250221252441, 8.310035705566406, 8.670821189880371, 9.031606674194336, 9.392393112182617, 9.753178596496582, 10.113964080810547]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 10.0, 4.0, 13.0, 14.0, 21.0, 29.0, 46.0, 82.0, 87.0, 177.0, 306.0, 652.0, 1694.0, 6262.0, 46950.0, 603299.0, 356699.0, 25432.0, 4257.0, 1281.0, 524.0, 256.0, 172.0, 96.0, 69.0, 37.0, 18.0, 16.0, 19.0, 15.0, 8.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.960693359375, -14.47607421875, -13.991455078125, -13.5068359375, -13.022216796875, -12.53759765625, -12.052978515625, -11.568359375, -11.083740234375, -10.59912109375, -10.114501953125, -9.6298828125, -9.145263671875, -8.66064453125, -8.176025390625, -7.69140625, -7.206787109375, -6.72216796875, -6.237548828125, -5.7529296875, -5.268310546875, -4.78369140625, -4.299072265625, -3.814453125, -3.329833984375, -2.84521484375, -2.360595703125, -1.8759765625, -1.391357421875, -0.90673828125, -0.422119140625, 0.0625, 0.547119140625, 1.03173828125, 1.516357421875, 2.0009765625, 2.485595703125, 2.97021484375, 3.454833984375, 3.939453125, 4.424072265625, 4.90869140625, 5.393310546875, 5.8779296875, 6.362548828125, 6.84716796875, 7.331787109375, 7.81640625, 8.301025390625, 8.78564453125, 9.270263671875, 9.7548828125, 10.239501953125, 10.72412109375, 11.208740234375, 11.693359375, 12.177978515625, 12.66259765625, 13.147216796875, 13.6318359375, 14.116455078125, 14.60107421875, 15.085693359375, 15.5703125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 33.0, 60.0, 91.0, 132.0, 156.0, 173.0, 119.0, 95.0, 57.0, 35.0, 17.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.804931640625, -2.71142578125, -2.617919921875, -2.5244140625, -2.430908203125, -2.33740234375, -2.243896484375, -2.150390625, -2.056884765625, -1.96337890625, -1.869873046875, -1.7763671875, -1.682861328125, -1.58935546875, -1.495849609375, -1.40234375, -1.308837890625, -1.21533203125, -1.121826171875, -1.0283203125, -0.934814453125, -0.84130859375, -0.747802734375, -0.654296875, -0.560791015625, -0.46728515625, -0.373779296875, -0.2802734375, -0.186767578125, -0.09326171875, 0.000244140625, 0.09375, 0.187255859375, 0.28076171875, 0.374267578125, 0.4677734375, 0.561279296875, 0.65478515625, 0.748291015625, 0.841796875, 0.935302734375, 1.02880859375, 1.122314453125, 1.2158203125, 1.309326171875, 1.40283203125, 1.496337890625, 1.58984375, 1.683349609375, 1.77685546875, 1.870361328125, 1.9638671875, 2.057373046875, 2.15087890625, 2.244384765625, 2.337890625, 2.431396484375, 2.52490234375, 2.618408203125, 2.7119140625, 2.805419921875, 2.89892578125, 2.992431640625, 3.0859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 9.0, 6.0, 8.0, 11.0, 13.0, 16.0, 30.0, 49.0, 52.0, 135.0, 196.0, 272.0, 442.0, 835.0, 1452.0, 2852.0, 6432.0, 17113.0, 54339.0, 202848.0, 448302.0, 221524.0, 59793.0, 18346.0, 6988.0, 3036.0, 1435.0, 815.0, 458.0, 270.0, 170.0, 123.0, 79.0, 36.0, 22.0, 15.0, 15.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.50628662109375, -6.2860107421875, -6.06573486328125, -5.845458984375, -5.62518310546875, -5.4049072265625, -5.18463134765625, -4.96435546875, -4.74407958984375, -4.5238037109375, -4.30352783203125, -4.083251953125, -3.86297607421875, -3.6427001953125, -3.42242431640625, -3.2021484375, -2.98187255859375, -2.7615966796875, -2.54132080078125, -2.321044921875, -2.10076904296875, -1.8804931640625, -1.66021728515625, -1.43994140625, -1.21966552734375, -0.9993896484375, -0.77911376953125, -0.558837890625, -0.33856201171875, -0.1182861328125, 0.10198974609375, 0.322265625, 0.54254150390625, 0.7628173828125, 0.98309326171875, 1.203369140625, 1.42364501953125, 1.6439208984375, 1.86419677734375, 2.08447265625, 2.30474853515625, 2.5250244140625, 2.74530029296875, 2.965576171875, 3.18585205078125, 3.4061279296875, 3.62640380859375, 3.8466796875, 4.06695556640625, 4.2872314453125, 4.50750732421875, 4.727783203125, 4.94805908203125, 5.1683349609375, 5.38861083984375, 5.60888671875, 5.82916259765625, 6.0494384765625, 6.26971435546875, 6.489990234375, 6.71026611328125, 6.9305419921875, 7.15081787109375, 7.37109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 12.0, 14.0, 20.0, 19.0, 24.0, 34.0, 41.0, 38.0, 53.0, 55.0, 59.0, 58.0, 51.0, 70.0, 57.0, 48.0, 50.0, 58.0, 38.0, 43.0, 24.0, 24.0, 25.0, 20.0, 12.0, 15.0, 5.0, 10.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.46697998046875, -7.2269287109375, -6.98687744140625, -6.746826171875, -6.50677490234375, -6.2667236328125, -6.02667236328125, -5.78662109375, -5.54656982421875, -5.3065185546875, -5.06646728515625, -4.826416015625, -4.58636474609375, -4.3463134765625, -4.10626220703125, -3.8662109375, -3.62615966796875, -3.3861083984375, -3.14605712890625, -2.906005859375, -2.66595458984375, -2.4259033203125, -2.18585205078125, -1.94580078125, -1.70574951171875, -1.4656982421875, -1.22564697265625, -0.985595703125, -0.74554443359375, -0.5054931640625, -0.26544189453125, -0.025390625, 0.21466064453125, 0.4547119140625, 0.69476318359375, 0.934814453125, 1.17486572265625, 1.4149169921875, 1.65496826171875, 1.89501953125, 2.13507080078125, 2.3751220703125, 2.61517333984375, 2.855224609375, 3.09527587890625, 3.3353271484375, 3.57537841796875, 3.8154296875, 4.05548095703125, 4.2955322265625, 4.53558349609375, 4.775634765625, 5.01568603515625, 5.2557373046875, 5.49578857421875, 5.73583984375, 5.97589111328125, 6.2159423828125, 6.45599365234375, 6.696044921875, 6.93609619140625, 7.1761474609375, 7.41619873046875, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 9.0, 10.0, 15.0, 23.0, 44.0, 75.0, 184.0, 495.0, 1993.0, 20477.0, 536480.0, 468695.0, 17345.0, 1844.0, 481.0, 173.0, 88.0, 51.0, 24.0, 18.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.374755859375, -12.03076171875, -11.686767578125, -11.3427734375, -10.998779296875, -10.65478515625, -10.310791015625, -9.966796875, -9.622802734375, -9.27880859375, -8.934814453125, -8.5908203125, -8.246826171875, -7.90283203125, -7.558837890625, -7.21484375, -6.870849609375, -6.52685546875, -6.182861328125, -5.8388671875, -5.494873046875, -5.15087890625, -4.806884765625, -4.462890625, -4.118896484375, -3.77490234375, -3.430908203125, -3.0869140625, -2.742919921875, -2.39892578125, -2.054931640625, -1.7109375, -1.366943359375, -1.02294921875, -0.678955078125, -0.3349609375, 0.009033203125, 0.35302734375, 0.697021484375, 1.041015625, 1.385009765625, 1.72900390625, 2.072998046875, 2.4169921875, 2.760986328125, 3.10498046875, 3.448974609375, 3.79296875, 4.136962890625, 4.48095703125, 4.824951171875, 5.1689453125, 5.512939453125, 5.85693359375, 6.200927734375, 6.544921875, 6.888916015625, 7.23291015625, 7.576904296875, 7.9208984375, 8.264892578125, 8.60888671875, 8.952880859375, 9.296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 11.0, 12.0, 13.0, 13.0, 26.0, 26.0, 27.0, 36.0, 40.0, 51.0, 66.0, 90.0, 76.0, 88.0, 78.0, 57.0, 57.0, 33.0, 32.0, 22.0, 32.0, 22.0, 11.0, 11.0, 12.0, 3.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.0005407333374023438, -0.0005267411470413208, -0.0005127489566802979, -0.0004987567663192749, -0.00048476457595825195, -0.000470772385597229, -0.00045678019523620605, -0.0004427880048751831, -0.00042879581451416016, -0.0004148036241531372, -0.00040081143379211426, -0.0003868192434310913, -0.00037282705307006836, -0.0003588348627090454, -0.00034484267234802246, -0.0003308504819869995, -0.00031685829162597656, -0.0003028661012649536, -0.00028887391090393066, -0.0002748817205429077, -0.00026088953018188477, -0.0002468973398208618, -0.00023290514945983887, -0.00021891295909881592, -0.00020492076873779297, -0.00019092857837677002, -0.00017693638801574707, -0.00016294419765472412, -0.00014895200729370117, -0.00013495981693267822, -0.00012096762657165527, -0.00010697543621063232, -9.298324584960938e-05, -7.899105548858643e-05, -6.499886512756348e-05, -5.100667476654053e-05, -3.701448440551758e-05, -2.302229404449463e-05, -9.03010368347168e-06, 4.9620866775512695e-06, 1.895427703857422e-05, 3.294646739959717e-05, 4.693865776062012e-05, 6.0930848121643066e-05, 7.492303848266602e-05, 8.891522884368896e-05, 0.00010290741920471191, 0.00011689960956573486, 0.0001308917999267578, 0.00014488399028778076, 0.0001588761806488037, 0.00017286837100982666, 0.0001868605613708496, 0.00020085275173187256, 0.0002148449420928955, 0.00022883713245391846, 0.0002428293228149414, 0.00025682151317596436, 0.0002708137035369873, 0.00028480589389801025, 0.0002987980842590332, 0.00031279027462005615, 0.0003267824649810791, 0.00034077465534210205, 0.000354766845703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 8.0, 7.0, 25.0, 38.0, 64.0, 113.0, 178.0, 344.0, 700.0, 1466.0, 3996.0, 13530.0, 60314.0, 314376.0, 505742.0, 112700.0, 23884.0, 6510.0, 2367.0, 1015.0, 503.0, 290.0, 131.0, 86.0, 57.0, 35.0, 28.0, 13.0, 13.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.7264404296875, -4.538818359375, -4.3511962890625, -4.16357421875, -3.9759521484375, -3.788330078125, -3.6007080078125, -3.4130859375, -3.2254638671875, -3.037841796875, -2.8502197265625, -2.66259765625, -2.4749755859375, -2.287353515625, -2.0997314453125, -1.912109375, -1.7244873046875, -1.536865234375, -1.3492431640625, -1.16162109375, -0.9739990234375, -0.786376953125, -0.5987548828125, -0.4111328125, -0.2235107421875, -0.035888671875, 0.1517333984375, 0.33935546875, 0.5269775390625, 0.714599609375, 0.9022216796875, 1.08984375, 1.2774658203125, 1.465087890625, 1.6527099609375, 1.84033203125, 2.0279541015625, 2.215576171875, 2.4031982421875, 2.5908203125, 2.7784423828125, 2.966064453125, 3.1536865234375, 3.34130859375, 3.5289306640625, 3.716552734375, 3.9041748046875, 4.091796875, 4.2794189453125, 4.467041015625, 4.6546630859375, 4.84228515625, 5.0299072265625, 5.217529296875, 5.4051513671875, 5.5927734375, 5.7803955078125, 5.968017578125, 6.1556396484375, 6.34326171875, 6.5308837890625, 6.718505859375, 6.9061279296875, 7.09375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 7.0, 17.0, 15.0, 22.0, 23.0, 33.0, 63.0, 82.0, 113.0, 94.0, 125.0, 101.0, 85.0, 62.0, 49.0, 32.0, 27.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640625, -4.47491455078125, -4.3092041015625, -4.14349365234375, -3.977783203125, -3.81207275390625, -3.6463623046875, -3.48065185546875, -3.31494140625, -3.14923095703125, -2.9835205078125, -2.81781005859375, -2.652099609375, -2.48638916015625, -2.3206787109375, -2.15496826171875, -1.9892578125, -1.82354736328125, -1.6578369140625, -1.49212646484375, -1.326416015625, -1.16070556640625, -0.9949951171875, -0.82928466796875, -0.66357421875, -0.49786376953125, -0.3321533203125, -0.16644287109375, -0.000732421875, 0.16497802734375, 0.3306884765625, 0.49639892578125, 0.662109375, 0.82781982421875, 0.9935302734375, 1.15924072265625, 1.324951171875, 1.49066162109375, 1.6563720703125, 1.82208251953125, 1.98779296875, 2.15350341796875, 2.3192138671875, 2.48492431640625, 2.650634765625, 2.81634521484375, 2.9820556640625, 3.14776611328125, 3.3134765625, 3.47918701171875, 3.6448974609375, 3.81060791015625, 3.976318359375, 4.14202880859375, 4.3077392578125, 4.47344970703125, 4.63916015625, 4.80487060546875, 4.9705810546875, 5.13629150390625, 5.302001953125, 5.46771240234375, 5.6334228515625, 5.79913330078125, 5.96484375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 9.0, 22.0, 47.0, 94.0, 193.0, 249.0, 177.0, 85.0, 51.0, 25.0, 12.0, 7.0, 9.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75575256347656, -69.32864379882812, -66.90152740478516, -64.47441864013672, -62.04730224609375, -59.62018966674805, -57.193077087402344, -54.765968322753906, -52.33885192871094, -49.911739349365234, -47.48462677001953, -45.05751419067383, -42.630401611328125, -40.20328903198242, -37.77617645263672, -35.34906768798828, -32.92195510864258, -30.494842529296875, -28.067729949951172, -25.64061737060547, -23.213504791259766, -20.786392211914062, -18.359281539916992, -15.932168960571289, -13.505056381225586, -11.077943801879883, -8.65083122253418, -6.223719596862793, -3.79660701751709, -1.3694944381713867, 1.0576171875, 3.484729766845703, 5.911842346191406, 8.33895492553711, 10.766067504882812, 13.1931791305542, 15.620291709899902, 18.047405242919922, 20.474515914916992, 22.901628494262695, 25.3287410736084, 27.7558536529541, 30.182966232299805, 32.610076904296875, 35.03718948364258, 37.46430206298828, 39.891414642333984, 42.31852722167969, 44.74563980102539, 47.172752380371094, 49.5998649597168, 52.0269775390625, 54.4540901184082, 56.881202697753906, 59.308311462402344, 61.73542785644531, 64.16253662109375, 66.58964538574219, 69.01676177978516, 71.4438705444336, 73.87098693847656, 76.298095703125, 78.72521209716797, 81.1523208618164, 83.57943725585938]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 19.0, 7.0, 8.0, 18.0, 25.0, 40.0, 35.0, 50.0, 58.0, 60.0, 59.0, 62.0, 64.0, 77.0, 67.0, 58.0, 56.0, 58.0, 47.0, 29.0, 14.0, 27.0, 13.0, 13.0, 8.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.577125549316406, -58.30147171020508, -56.025821685791016, -53.75016784667969, -51.47451400756836, -49.19886016845703, -46.92321014404297, -44.64755630493164, -42.37190246582031, -40.096248626708984, -37.82059860229492, -35.544944763183594, -33.269290924072266, -30.99363899230957, -28.717987060546875, -26.442333221435547, -24.166683197021484, -21.89103126525879, -19.61537742614746, -17.339725494384766, -15.064072608947754, -12.788419723510742, -10.512767791748047, -8.237114906311035, -5.961462020874023, -3.685809373855591, -1.4101567268371582, 0.8654956817626953, 3.141148567199707, 5.416801452636719, 7.692453384399414, 9.968106269836426, 12.243759155273438, 14.51941204071045, 16.79506492614746, 19.070716857910156, 21.346370697021484, 23.62202262878418, 25.897674560546875, 28.173328399658203, 30.4489803314209, 32.724632263183594, 35.00028610229492, 37.27593994140625, 39.55158996582031, 41.82724380493164, 44.10289764404297, 46.37854766845703, 48.65420150756836, 50.92985534667969, 53.20550537109375, 55.48115921020508, 57.756813049316406, 60.03246307373047, 62.3081169128418, 64.58377075195312, 66.85942077636719, 69.13507080078125, 71.41072845458984, 73.6863784790039, 75.96202850341797, 78.23768615722656, 80.51333618164062, 82.78898620605469, 85.06464385986328]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 7.0, 6.0, 10.0, 5.0, 13.0, 22.0, 22.0, 28.0, 51.0, 69.0, 148.0, 180.0, 318.0, 604.0, 1243.0, 2755.0, 7757.0, 29156.0, 258841.0, 3742478.0, 120877.0, 19736.0, 5713.0, 2036.0, 941.0, 467.0, 284.0, 166.0, 105.0, 66.0, 52.0, 29.0, 26.0, 19.0, 10.0, 12.0, 9.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.78125, -16.29296875, -15.8046875, -15.31640625, -14.828125, -14.33984375, -13.8515625, -13.36328125, -12.875, -12.38671875, -11.8984375, -11.41015625, -10.921875, -10.43359375, -9.9453125, -9.45703125, -8.96875, -8.48046875, -7.9921875, -7.50390625, -7.015625, -6.52734375, -6.0390625, -5.55078125, -5.0625, -4.57421875, -4.0859375, -3.59765625, -3.109375, -2.62109375, -2.1328125, -1.64453125, -1.15625, -0.66796875, -0.1796875, 0.30859375, 0.796875, 1.28515625, 1.7734375, 2.26171875, 2.75, 3.23828125, 3.7265625, 4.21484375, 4.703125, 5.19140625, 5.6796875, 6.16796875, 6.65625, 7.14453125, 7.6328125, 8.12109375, 8.609375, 9.09765625, 9.5859375, 10.07421875, 10.5625, 11.05078125, 11.5390625, 12.02734375, 12.515625, 13.00390625, 13.4921875, 13.98046875, 14.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 10.0, 5.0, 7.0, 13.0, 9.0, 11.0, 28.0, 39.0, 37.0, 42.0, 56.0, 55.0, 59.0, 61.0, 57.0, 65.0, 62.0, 56.0, 46.0, 56.0, 37.0, 37.0, 24.0, 28.0, 17.0, 19.0, 17.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.691741943359375, -1.64031982421875, -1.588897705078125, -1.5374755859375, -1.486053466796875, -1.43463134765625, -1.383209228515625, -1.331787109375, -1.280364990234375, -1.22894287109375, -1.177520751953125, -1.1260986328125, -1.074676513671875, -1.02325439453125, -0.971832275390625, -0.92041015625, -0.868988037109375, -0.81756591796875, -0.766143798828125, -0.7147216796875, -0.663299560546875, -0.61187744140625, -0.560455322265625, -0.509033203125, -0.457611083984375, -0.40618896484375, -0.354766845703125, -0.3033447265625, -0.251922607421875, -0.20050048828125, -0.149078369140625, -0.09765625, -0.046234130859375, 0.00518798828125, 0.056610107421875, 0.1080322265625, 0.159454345703125, 0.21087646484375, 0.262298583984375, 0.313720703125, 0.365142822265625, 0.41656494140625, 0.467987060546875, 0.5194091796875, 0.570831298828125, 0.62225341796875, 0.673675537109375, 0.72509765625, 0.776519775390625, 0.82794189453125, 0.879364013671875, 0.9307861328125, 0.982208251953125, 1.03363037109375, 1.085052490234375, 1.136474609375, 1.187896728515625, 1.23931884765625, 1.290740966796875, 1.3421630859375, 1.393585205078125, 1.44500732421875, 1.496429443359375, 1.5478515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 17.0, 30.0, 41.0, 108.0, 209.0, 438.0, 950.0, 2906.0, 13343.0, 162529.0, 3807024.0, 188491.0, 14094.0, 2731.0, 778.0, 286.0, 150.0, 80.0, 39.0, 16.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8984375, -10.4539794921875, -10.009521484375, -9.5650634765625, -9.12060546875, -8.6761474609375, -8.231689453125, -7.7872314453125, -7.3427734375, -6.8983154296875, -6.453857421875, -6.0093994140625, -5.56494140625, -5.1204833984375, -4.676025390625, -4.2315673828125, -3.787109375, -3.3426513671875, -2.898193359375, -2.4537353515625, -2.00927734375, -1.5648193359375, -1.120361328125, -0.6759033203125, -0.2314453125, 0.2130126953125, 0.657470703125, 1.1019287109375, 1.54638671875, 1.9908447265625, 2.435302734375, 2.8797607421875, 3.32421875, 3.7686767578125, 4.213134765625, 4.6575927734375, 5.10205078125, 5.5465087890625, 5.990966796875, 6.4354248046875, 6.8798828125, 7.3243408203125, 7.768798828125, 8.2132568359375, 8.65771484375, 9.1021728515625, 9.546630859375, 9.9910888671875, 10.435546875, 10.8800048828125, 11.324462890625, 11.7689208984375, 12.21337890625, 12.6578369140625, 13.102294921875, 13.5467529296875, 13.9912109375, 14.4356689453125, 14.880126953125, 15.3245849609375, 15.76904296875, 16.2135009765625, 16.657958984375, 17.1024169921875, 17.546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 14.0, 21.0, 22.0, 35.0, 54.0, 84.0, 128.0, 303.0, 786.0, 1400.0, 600.0, 239.0, 128.0, 83.0, 57.0, 27.0, 14.0, 17.0, 8.0, 5.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.43359375, -3.341583251953125, -3.24957275390625, -3.157562255859375, -3.0655517578125, -2.973541259765625, -2.88153076171875, -2.789520263671875, -2.697509765625, -2.605499267578125, -2.51348876953125, -2.421478271484375, -2.3294677734375, -2.237457275390625, -2.14544677734375, -2.053436279296875, -1.96142578125, -1.869415283203125, -1.77740478515625, -1.685394287109375, -1.5933837890625, -1.501373291015625, -1.40936279296875, -1.317352294921875, -1.225341796875, -1.133331298828125, -1.04132080078125, -0.949310302734375, -0.8572998046875, -0.765289306640625, -0.67327880859375, -0.581268310546875, -0.4892578125, -0.397247314453125, -0.30523681640625, -0.213226318359375, -0.1212158203125, -0.029205322265625, 0.06280517578125, 0.154815673828125, 0.246826171875, 0.338836669921875, 0.43084716796875, 0.522857666015625, 0.6148681640625, 0.706878662109375, 0.79888916015625, 0.890899658203125, 0.98291015625, 1.074920654296875, 1.16693115234375, 1.258941650390625, 1.3509521484375, 1.442962646484375, 1.53497314453125, 1.626983642578125, 1.718994140625, 1.811004638671875, 1.90301513671875, 1.995025634765625, 2.0870361328125, 2.179046630859375, 2.27105712890625, 2.363067626953125, 2.455078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 6.0, 6.0, 9.0, 25.0, 37.0, 59.0, 97.0, 148.0, 178.0, 162.0, 140.0, 67.0, 34.0, 13.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.280060768127441, -9.776605606079102, -9.273150444030762, -8.769695281982422, -8.266240119934082, -7.762784957885742, -7.2593302726745605, -6.755875110626221, -6.252419948577881, -5.748964786529541, -5.245509624481201, -4.7420549392700195, -4.23859977722168, -3.7351443767547607, -3.231689453125, -2.72823429107666, -2.2247791290283203, -1.7213239669799805, -1.2178689241409302, -0.7144138813018799, -0.21095871925354004, 0.2924964427947998, 0.7959513664245605, 1.2994065284729004, 1.8028616905212402, 2.30631685256958, 2.80977201461792, 3.3132269382476807, 3.8166821002960205, 4.320137023925781, 4.823592185974121, 5.327047348022461, 5.830501556396484, 6.333956718444824, 6.837411880493164, 7.340867042541504, 7.844322204589844, 8.347777366638184, 8.851232528686523, 9.354686737060547, 9.858142852783203, 10.361598014831543, 10.865053176879883, 11.368508338928223, 11.871963500976562, 12.375418663024902, 12.878873825073242, 13.382328033447266, 13.885783195495605, 14.389238357543945, 14.892693519592285, 15.396148681640625, 15.899603843688965, 16.403059005737305, 16.906513214111328, 17.409969329833984, 17.913423538208008, 18.41687774658203, 18.920333862304688, 19.42378807067871, 19.927244186401367, 20.43069839477539, 20.934154510498047, 21.43760871887207, 21.941064834594727]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 11.0, 17.0, 19.0, 23.0, 27.0, 29.0, 37.0, 51.0, 47.0, 47.0, 50.0, 55.0, 60.0, 47.0, 66.0, 51.0, 58.0, 50.0, 35.0, 31.0, 28.0, 26.0, 24.0, 13.0, 21.0, 9.0, 9.0, 12.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.051424026489258, -8.704498291015625, -8.357573509216309, -8.010648727416992, -7.663722991943359, -7.316797733306885, -6.96987247467041, -6.6229472160339355, -6.276021957397461, -5.929096698760986, -5.582171440124512, -5.235246181488037, -4.8883209228515625, -4.541395664215088, -4.194470405578613, -3.8475451469421387, -3.500619888305664, -3.1536946296691895, -2.806769371032715, -2.4598441123962402, -2.1129188537597656, -1.765993595123291, -1.4190683364868164, -1.0721430778503418, -0.7252178192138672, -0.3782925605773926, -0.03136730194091797, 0.31555795669555664, 0.6624832153320312, 1.0094084739685059, 1.3563337326049805, 1.703258991241455, 2.0501842498779297, 2.3971095085144043, 2.744034767150879, 3.0909600257873535, 3.437885284423828, 3.7848105430603027, 4.131735801696777, 4.478661060333252, 4.825586318969727, 5.172511577606201, 5.519436836242676, 5.86636209487915, 6.213287353515625, 6.5602126121521, 6.907137870788574, 7.254063129425049, 7.600988388061523, 7.947913646697998, 8.294838905334473, 8.641763687133789, 8.988689422607422, 9.335615158081055, 9.682539939880371, 10.029464721679688, 10.37639045715332, 10.723316192626953, 11.07024097442627, 11.417165756225586, 11.764091491699219, 12.111017227172852, 12.457942008972168, 12.804866790771484, 13.151792526245117]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 28.0, 34.0, 56.0, 95.0, 139.0, 209.0, 314.0, 605.0, 1031.0, 1927.0, 3617.0, 7211.0, 15460.0, 35983.0, 95376.0, 267143.0, 359980.0, 159155.0, 56161.0, 22844.0, 10347.0, 5024.0, 2500.0, 1407.0, 733.0, 414.0, 246.0, 171.0, 107.0, 65.0, 49.0, 34.0, 22.0, 12.0, 11.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.2152099609375, -6.043701171875, -5.8721923828125, -5.70068359375, -5.5291748046875, -5.357666015625, -5.1861572265625, -5.0146484375, -4.8431396484375, -4.671630859375, -4.5001220703125, -4.32861328125, -4.1571044921875, -3.985595703125, -3.8140869140625, -3.642578125, -3.4710693359375, -3.299560546875, -3.1280517578125, -2.95654296875, -2.7850341796875, -2.613525390625, -2.4420166015625, -2.2705078125, -2.0989990234375, -1.927490234375, -1.7559814453125, -1.58447265625, -1.4129638671875, -1.241455078125, -1.0699462890625, -0.8984375, -0.7269287109375, -0.555419921875, -0.3839111328125, -0.21240234375, -0.0408935546875, 0.130615234375, 0.3021240234375, 0.4736328125, 0.6451416015625, 0.816650390625, 0.9881591796875, 1.15966796875, 1.3311767578125, 1.502685546875, 1.6741943359375, 1.845703125, 2.0172119140625, 2.188720703125, 2.3602294921875, 2.53173828125, 2.7032470703125, 2.874755859375, 3.0462646484375, 3.2177734375, 3.3892822265625, 3.560791015625, 3.7322998046875, 3.90380859375, 4.0753173828125, 4.246826171875, 4.4183349609375, 4.58984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 6.0, 5.0, 9.0, 11.0, 19.0, 18.0, 32.0, 37.0, 49.0, 55.0, 58.0, 67.0, 68.0, 70.0, 67.0, 57.0, 54.0, 60.0, 40.0, 35.0, 32.0, 29.0, 22.0, 24.0, 18.0, 12.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9033203125, -1.8485870361328125, -1.793853759765625, -1.7391204833984375, -1.68438720703125, -1.6296539306640625, -1.574920654296875, -1.5201873779296875, -1.4654541015625, -1.4107208251953125, -1.355987548828125, -1.3012542724609375, -1.24652099609375, -1.1917877197265625, -1.137054443359375, -1.0823211669921875, -1.027587890625, -0.9728546142578125, -0.918121337890625, -0.8633880615234375, -0.80865478515625, -0.7539215087890625, -0.699188232421875, -0.6444549560546875, -0.5897216796875, -0.5349884033203125, -0.480255126953125, -0.4255218505859375, -0.37078857421875, -0.3160552978515625, -0.261322021484375, -0.2065887451171875, -0.15185546875, -0.0971221923828125, -0.042388916015625, 0.0123443603515625, 0.06707763671875, 0.1218109130859375, 0.176544189453125, 0.2312774658203125, 0.2860107421875, 0.3407440185546875, 0.395477294921875, 0.4502105712890625, 0.50494384765625, 0.5596771240234375, 0.614410400390625, 0.6691436767578125, 0.723876953125, 0.7786102294921875, 0.833343505859375, 0.8880767822265625, 0.94281005859375, 0.9975433349609375, 1.052276611328125, 1.1070098876953125, 1.1617431640625, 1.2164764404296875, 1.271209716796875, 1.3259429931640625, 1.38067626953125, 1.4354095458984375, 1.490142822265625, 1.5448760986328125, 1.599609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 17.0, 22.0, 21.0, 23.0, 24.0, 52.0, 80.0, 130.0, 172.0, 297.0, 533.0, 898.0, 1763.0, 3264.0, 6570.0, 15107.0, 39041.0, 126720.0, 371539.0, 323598.0, 100820.0, 32600.0, 12902.0, 5869.0, 2845.0, 1526.0, 820.0, 511.0, 284.0, 166.0, 104.0, 69.0, 37.0, 27.0, 31.0, 17.0, 9.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.96160888671875, -5.7747802734375, -5.58795166015625, -5.401123046875, -5.21429443359375, -5.0274658203125, -4.84063720703125, -4.65380859375, -4.46697998046875, -4.2801513671875, -4.09332275390625, -3.906494140625, -3.71966552734375, -3.5328369140625, -3.34600830078125, -3.1591796875, -2.97235107421875, -2.7855224609375, -2.59869384765625, -2.411865234375, -2.22503662109375, -2.0382080078125, -1.85137939453125, -1.66455078125, -1.47772216796875, -1.2908935546875, -1.10406494140625, -0.917236328125, -0.73040771484375, -0.5435791015625, -0.35675048828125, -0.169921875, 0.01690673828125, 0.2037353515625, 0.39056396484375, 0.577392578125, 0.76422119140625, 0.9510498046875, 1.13787841796875, 1.32470703125, 1.51153564453125, 1.6983642578125, 1.88519287109375, 2.072021484375, 2.25885009765625, 2.4456787109375, 2.63250732421875, 2.8193359375, 3.00616455078125, 3.1929931640625, 3.37982177734375, 3.566650390625, 3.75347900390625, 3.9403076171875, 4.12713623046875, 4.31396484375, 4.50079345703125, 4.6876220703125, 4.87445068359375, 5.061279296875, 5.24810791015625, 5.4349365234375, 5.62176513671875, 5.80859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 2.0, 8.0, 16.0, 15.0, 24.0, 28.0, 35.0, 27.0, 34.0, 25.0, 37.0, 56.0, 58.0, 59.0, 50.0, 56.0, 42.0, 48.0, 51.0, 42.0, 31.0, 37.0, 24.0, 30.0, 20.0, 20.0, 17.0, 13.0, 10.0, 9.0, 4.0, 6.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.51171875, -6.285400390625, -6.05908203125, -5.832763671875, -5.6064453125, -5.380126953125, -5.15380859375, -4.927490234375, -4.701171875, -4.474853515625, -4.24853515625, -4.022216796875, -3.7958984375, -3.569580078125, -3.34326171875, -3.116943359375, -2.890625, -2.664306640625, -2.43798828125, -2.211669921875, -1.9853515625, -1.759033203125, -1.53271484375, -1.306396484375, -1.080078125, -0.853759765625, -0.62744140625, -0.401123046875, -0.1748046875, 0.051513671875, 0.27783203125, 0.504150390625, 0.73046875, 0.956787109375, 1.18310546875, 1.409423828125, 1.6357421875, 1.862060546875, 2.08837890625, 2.314697265625, 2.541015625, 2.767333984375, 2.99365234375, 3.219970703125, 3.4462890625, 3.672607421875, 3.89892578125, 4.125244140625, 4.3515625, 4.577880859375, 4.80419921875, 5.030517578125, 5.2568359375, 5.483154296875, 5.70947265625, 5.935791015625, 6.162109375, 6.388427734375, 6.61474609375, 6.841064453125, 7.0673828125, 7.293701171875, 7.52001953125, 7.746337890625, 7.97265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 11.0, 24.0, 34.0, 49.0, 87.0, 152.0, 336.0, 711.0, 1985.0, 6638.0, 27845.0, 139660.0, 493827.0, 297390.0, 60753.0, 13207.0, 3630.0, 1175.0, 447.0, 236.0, 125.0, 68.0, 30.0, 31.0, 19.0, 14.0, 10.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.753814697265625, -2.65802001953125, -2.562225341796875, -2.4664306640625, -2.370635986328125, -2.27484130859375, -2.179046630859375, -2.083251953125, -1.987457275390625, -1.89166259765625, -1.795867919921875, -1.7000732421875, -1.604278564453125, -1.50848388671875, -1.412689208984375, -1.31689453125, -1.221099853515625, -1.12530517578125, -1.029510498046875, -0.9337158203125, -0.837921142578125, -0.74212646484375, -0.646331787109375, -0.550537109375, -0.454742431640625, -0.35894775390625, -0.263153076171875, -0.1673583984375, -0.071563720703125, 0.02423095703125, 0.120025634765625, 0.2158203125, 0.311614990234375, 0.40740966796875, 0.503204345703125, 0.5989990234375, 0.694793701171875, 0.79058837890625, 0.886383056640625, 0.982177734375, 1.077972412109375, 1.17376708984375, 1.269561767578125, 1.3653564453125, 1.461151123046875, 1.55694580078125, 1.652740478515625, 1.74853515625, 1.844329833984375, 1.94012451171875, 2.035919189453125, 2.1317138671875, 2.227508544921875, 2.32330322265625, 2.419097900390625, 2.514892578125, 2.610687255859375, 2.70648193359375, 2.802276611328125, 2.8980712890625, 2.993865966796875, 3.08966064453125, 3.185455322265625, 3.28125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 13.0, 18.0, 21.0, 21.0, 18.0, 42.0, 47.0, 49.0, 72.0, 94.0, 111.0, 96.0, 83.0, 59.0, 44.0, 41.0, 32.0, 23.0, 24.0, 23.0, 19.0, 11.0, 4.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004715919494628906, -0.0004580691456794739, -0.00044454634189605713, -0.0004310235381126404, -0.00041750073432922363, -0.0004039779305458069, -0.00039045512676239014, -0.0003769323229789734, -0.00036340951919555664, -0.0003498867154121399, -0.00033636391162872314, -0.0003228411078453064, -0.00030931830406188965, -0.0002957955002784729, -0.00028227269649505615, -0.0002687498927116394, -0.00025522708892822266, -0.0002417042851448059, -0.00022818148136138916, -0.0002146586775779724, -0.00020113587379455566, -0.00018761307001113892, -0.00017409026622772217, -0.00016056746244430542, -0.00014704465866088867, -0.00013352185487747192, -0.00011999905109405518, -0.00010647624731063843, -9.295344352722168e-05, -7.943063974380493e-05, -6.590783596038818e-05, -5.2385032176971436e-05, -3.886222839355469e-05, -2.533942461013794e-05, -1.1816620826721191e-05, 1.7061829566955566e-06, 1.5228986740112305e-05, 2.8751790523529053e-05, 4.22745943069458e-05, 5.579739809036255e-05, 6.93202018737793e-05, 8.284300565719604e-05, 9.636580944061279e-05, 0.00010988861322402954, 0.0001234114170074463, 0.00013693422079086304, 0.00015045702457427979, 0.00016397982835769653, 0.00017750263214111328, 0.00019102543592453003, 0.00020454823970794678, 0.00021807104349136353, 0.00023159384727478027, 0.000245116651058197, 0.00025863945484161377, 0.0002721622586250305, 0.00028568506240844727, 0.000299207866191864, 0.00031273066997528076, 0.0003262534737586975, 0.00033977627754211426, 0.000353299081325531, 0.00036682188510894775, 0.0003803446888923645, 0.00039386749267578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 10.0, 9.0, 12.0, 12.0, 34.0, 30.0, 50.0, 59.0, 100.0, 130.0, 247.0, 343.0, 614.0, 1011.0, 1905.0, 3568.0, 7388.0, 16133.0, 38410.0, 93903.0, 226083.0, 337679.0, 186131.0, 76321.0, 31409.0, 13490.0, 6297.0, 3108.0, 1596.0, 1005.0, 501.0, 315.0, 220.0, 133.0, 85.0, 58.0, 47.0, 34.0, 15.0, 20.0, 11.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.85546875, -1.794403076171875, -1.73333740234375, -1.672271728515625, -1.6112060546875, -1.550140380859375, -1.48907470703125, -1.428009033203125, -1.366943359375, -1.305877685546875, -1.24481201171875, -1.183746337890625, -1.1226806640625, -1.061614990234375, -1.00054931640625, -0.939483642578125, -0.87841796875, -0.817352294921875, -0.75628662109375, -0.695220947265625, -0.6341552734375, -0.573089599609375, -0.51202392578125, -0.450958251953125, -0.389892578125, -0.328826904296875, -0.26776123046875, -0.206695556640625, -0.1456298828125, -0.084564208984375, -0.02349853515625, 0.037567138671875, 0.0986328125, 0.159698486328125, 0.22076416015625, 0.281829833984375, 0.3428955078125, 0.403961181640625, 0.46502685546875, 0.526092529296875, 0.587158203125, 0.648223876953125, 0.70928955078125, 0.770355224609375, 0.8314208984375, 0.892486572265625, 0.95355224609375, 1.014617919921875, 1.07568359375, 1.136749267578125, 1.19781494140625, 1.258880615234375, 1.3199462890625, 1.381011962890625, 1.44207763671875, 1.503143310546875, 1.564208984375, 1.625274658203125, 1.68634033203125, 1.747406005859375, 1.8084716796875, 1.869537353515625, 1.93060302734375, 1.991668701171875, 2.052734375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 4.0, 11.0, 17.0, 25.0, 21.0, 26.0, 32.0, 46.0, 63.0, 75.0, 87.0, 73.0, 75.0, 72.0, 69.0, 58.0, 42.0, 41.0, 42.0, 30.0, 20.0, 17.0, 18.0, 8.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.46221923828125, -2.3834228515625, -2.30462646484375, -2.225830078125, -2.14703369140625, -2.0682373046875, -1.98944091796875, -1.91064453125, -1.83184814453125, -1.7530517578125, -1.67425537109375, -1.595458984375, -1.51666259765625, -1.4378662109375, -1.35906982421875, -1.2802734375, -1.20147705078125, -1.1226806640625, -1.04388427734375, -0.965087890625, -0.88629150390625, -0.8074951171875, -0.72869873046875, -0.64990234375, -0.57110595703125, -0.4923095703125, -0.41351318359375, -0.334716796875, -0.25592041015625, -0.1771240234375, -0.09832763671875, -0.01953125, 0.05926513671875, 0.1380615234375, 0.21685791015625, 0.295654296875, 0.37445068359375, 0.4532470703125, 0.53204345703125, 0.61083984375, 0.68963623046875, 0.7684326171875, 0.84722900390625, 0.926025390625, 1.00482177734375, 1.0836181640625, 1.16241455078125, 1.2412109375, 1.32000732421875, 1.3988037109375, 1.47760009765625, 1.556396484375, 1.63519287109375, 1.7139892578125, 1.79278564453125, 1.87158203125, 1.95037841796875, 2.0291748046875, 2.10797119140625, 2.186767578125, 2.26556396484375, 2.3443603515625, 2.42315673828125, 2.501953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 8.0, 11.0, 23.0, 28.0, 59.0, 103.0, 151.0, 186.0, 160.0, 103.0, 68.0, 37.0, 28.0, 8.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.593894958496094, -59.95233154296875, -58.31076431274414, -56.6692008972168, -55.02763366699219, -53.386070251464844, -51.7445068359375, -50.10293960571289, -48.46137619018555, -46.8198127746582, -45.178245544433594, -43.53668212890625, -41.89511489868164, -40.2535514831543, -38.61198425292969, -36.970420837402344, -35.328857421875, -33.687294006347656, -32.04572677612305, -30.404163360595703, -28.762598037719727, -27.12103271484375, -25.479467391967773, -23.837902069091797, -22.196334838867188, -20.55476951599121, -18.913204193115234, -17.27164077758789, -15.630075454711914, -13.988510131835938, -12.346944808959961, -10.7053804397583, -9.06381607055664, -7.422251224517822, -5.780686378479004, -4.139121055603027, -2.497556209564209, -0.8559913635253906, 0.7855739593505859, 2.427138328552246, 4.068703651428223, 5.710268497467041, 7.351833343505859, 8.993398666381836, 10.634963989257812, 12.276528358459473, 13.91809368133545, 15.55965805053711, 17.201223373413086, 18.842788696289062, 20.48435401916504, 22.125919342041016, 23.76748275756836, 25.409048080444336, 27.050613403320312, 28.692176818847656, 30.333744049072266, 31.975309371948242, 33.61687469482422, 35.25843811035156, 36.90000534057617, 38.541568756103516, 40.183135986328125, 41.82469940185547, 43.46626281738281]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 12.0, 15.0, 27.0, 25.0, 28.0, 37.0, 45.0, 43.0, 63.0, 69.0, 57.0, 75.0, 81.0, 55.0, 52.0, 47.0, 46.0, 41.0, 40.0, 37.0, 25.0, 19.0, 25.0, 10.0, 11.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-69.49290466308594, -67.4550552368164, -65.41720581054688, -63.37936019897461, -61.34151077270508, -59.30366134643555, -57.26581573486328, -55.22796630859375, -53.19011688232422, -51.15226745605469, -49.114418029785156, -47.07657241821289, -45.03872299194336, -43.00087356567383, -40.96302795410156, -38.92517852783203, -36.8873291015625, -34.84947967529297, -32.81163024902344, -30.773784637451172, -28.73593521118164, -26.69808578491211, -24.66023826599121, -22.622390747070312, -20.58454132080078, -18.54669189453125, -16.50884437561035, -14.470995903015137, -12.433147430419922, -10.395298957824707, -8.357450485229492, -6.319602012634277, -4.281749725341797, -2.243901252746582, -0.2060527801513672, 1.8317956924438477, 3.8696441650390625, 5.907492637634277, 7.945341110229492, 9.983189582824707, 12.021038055419922, 14.058886528015137, 16.09673500061035, 18.13458251953125, 20.17243194580078, 22.210281372070312, 24.24812889099121, 26.28597640991211, 28.32382583618164, 30.361675262451172, 32.39952087402344, 34.43737030029297, 36.4752197265625, 38.51306915283203, 40.55091857910156, 42.58876419067383, 44.62661361694336, 46.66446304321289, 48.702308654785156, 50.74015808105469, 52.77800750732422, 54.81585693359375, 56.85370635986328, 58.89155197143555, 60.92940139770508]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 11.0, 14.0, 16.0, 31.0, 37.0, 49.0, 72.0, 101.0, 163.0, 266.0, 467.0, 836.0, 1698.0, 3869.0, 10114.0, 39717.0, 485025.0, 3525638.0, 97343.0, 17981.0, 5628.0, 2418.0, 1201.0, 615.0, 343.0, 202.0, 130.0, 79.0, 65.0, 44.0, 27.0, 24.0, 13.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7813720703125, -8.500244140625, -8.2191162109375, -7.93798828125, -7.6568603515625, -7.375732421875, -7.0946044921875, -6.8134765625, -6.5323486328125, -6.251220703125, -5.9700927734375, -5.68896484375, -5.4078369140625, -5.126708984375, -4.8455810546875, -4.564453125, -4.2833251953125, -4.002197265625, -3.7210693359375, -3.43994140625, -3.1588134765625, -2.877685546875, -2.5965576171875, -2.3154296875, -2.0343017578125, -1.753173828125, -1.4720458984375, -1.19091796875, -0.9097900390625, -0.628662109375, -0.3475341796875, -0.06640625, 0.2147216796875, 0.495849609375, 0.7769775390625, 1.05810546875, 1.3392333984375, 1.620361328125, 1.9014892578125, 2.1826171875, 2.4637451171875, 2.744873046875, 3.0260009765625, 3.30712890625, 3.5882568359375, 3.869384765625, 4.1505126953125, 4.431640625, 4.7127685546875, 4.993896484375, 5.2750244140625, 5.55615234375, 5.8372802734375, 6.118408203125, 6.3995361328125, 6.6806640625, 6.9617919921875, 7.242919921875, 7.5240478515625, 7.80517578125, 8.0863037109375, 8.367431640625, 8.6485595703125, 8.9296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 8.0, 7.0, 12.0, 20.0, 29.0, 27.0, 27.0, 48.0, 35.0, 42.0, 63.0, 61.0, 70.0, 65.0, 62.0, 63.0, 49.0, 50.0, 54.0, 40.0, 30.0, 26.0, 20.0, 18.0, 14.0, 17.0, 7.0, 4.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7254638671875, -1.670654296875, -1.6158447265625, -1.56103515625, -1.5062255859375, -1.451416015625, -1.3966064453125, -1.341796875, -1.2869873046875, -1.232177734375, -1.1773681640625, -1.12255859375, -1.0677490234375, -1.012939453125, -0.9581298828125, -0.9033203125, -0.8485107421875, -0.793701171875, -0.7388916015625, -0.68408203125, -0.6292724609375, -0.574462890625, -0.5196533203125, -0.46484375, -0.4100341796875, -0.355224609375, -0.3004150390625, -0.24560546875, -0.1907958984375, -0.135986328125, -0.0811767578125, -0.0263671875, 0.0284423828125, 0.083251953125, 0.1380615234375, 0.19287109375, 0.2476806640625, 0.302490234375, 0.3572998046875, 0.412109375, 0.4669189453125, 0.521728515625, 0.5765380859375, 0.63134765625, 0.6861572265625, 0.740966796875, 0.7957763671875, 0.8505859375, 0.9053955078125, 0.960205078125, 1.0150146484375, 1.06982421875, 1.1246337890625, 1.179443359375, 1.2342529296875, 1.2890625, 1.3438720703125, 1.398681640625, 1.4534912109375, 1.50830078125, 1.5631103515625, 1.617919921875, 1.6727294921875, 1.7275390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 9.0, 20.0, 36.0, 84.0, 129.0, 300.0, 767.0, 2975.0, 26419.0, 2361640.0, 1773366.0, 24282.0, 2994.0, 742.0, 251.0, 115.0, 63.0, 41.0, 23.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.230224609375, -11.83544921875, -11.440673828125, -11.0458984375, -10.651123046875, -10.25634765625, -9.861572265625, -9.466796875, -9.072021484375, -8.67724609375, -8.282470703125, -7.8876953125, -7.492919921875, -7.09814453125, -6.703369140625, -6.30859375, -5.913818359375, -5.51904296875, -5.124267578125, -4.7294921875, -4.334716796875, -3.93994140625, -3.545166015625, -3.150390625, -2.755615234375, -2.36083984375, -1.966064453125, -1.5712890625, -1.176513671875, -0.78173828125, -0.386962890625, 0.0078125, 0.402587890625, 0.79736328125, 1.192138671875, 1.5869140625, 1.981689453125, 2.37646484375, 2.771240234375, 3.166015625, 3.560791015625, 3.95556640625, 4.350341796875, 4.7451171875, 5.139892578125, 5.53466796875, 5.929443359375, 6.32421875, 6.718994140625, 7.11376953125, 7.508544921875, 7.9033203125, 8.298095703125, 8.69287109375, 9.087646484375, 9.482421875, 9.877197265625, 10.27197265625, 10.666748046875, 11.0615234375, 11.456298828125, 11.85107421875, 12.245849609375, 12.640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 15.0, 19.0, 35.0, 51.0, 95.0, 216.0, 458.0, 1504.0, 1013.0, 322.0, 152.0, 69.0, 55.0, 23.0, 14.0, 9.0, 6.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.42828369140625, -2.3409423828125, -2.25360107421875, -2.166259765625, -2.07891845703125, -1.9915771484375, -1.90423583984375, -1.81689453125, -1.72955322265625, -1.6422119140625, -1.55487060546875, -1.467529296875, -1.38018798828125, -1.2928466796875, -1.20550537109375, -1.1181640625, -1.03082275390625, -0.9434814453125, -0.85614013671875, -0.768798828125, -0.68145751953125, -0.5941162109375, -0.50677490234375, -0.41943359375, -0.33209228515625, -0.2447509765625, -0.15740966796875, -0.070068359375, 0.01727294921875, 0.1046142578125, 0.19195556640625, 0.279296875, 0.36663818359375, 0.4539794921875, 0.54132080078125, 0.628662109375, 0.71600341796875, 0.8033447265625, 0.89068603515625, 0.97802734375, 1.06536865234375, 1.1527099609375, 1.24005126953125, 1.327392578125, 1.41473388671875, 1.5020751953125, 1.58941650390625, 1.6767578125, 1.76409912109375, 1.8514404296875, 1.93878173828125, 2.026123046875, 2.11346435546875, 2.2008056640625, 2.28814697265625, 2.37548828125, 2.46282958984375, 2.5501708984375, 2.63751220703125, 2.724853515625, 2.81219482421875, 2.8995361328125, 2.98687744140625, 3.07421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 10.0, 9.0, 36.0, 50.0, 127.0, 165.0, 205.0, 153.0, 116.0, 75.0, 24.0, 15.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.854011535644531, -9.370630264282227, -8.887248992919922, -8.403867721557617, -7.9204864501953125, -7.437105178833008, -6.953723430633545, -6.47034215927124, -5.9869608879089355, -5.503579616546631, -5.020198345184326, -4.536816596984863, -4.053435325622559, -3.570054292678833, -3.086672782897949, -2.6032915115356445, -2.11991024017334, -1.6365289688110352, -1.153147578239441, -0.6697661876678467, -0.186384916305542, 0.2969963550567627, 0.7803778648376465, 1.2637591361999512, 1.7471404075622559, 2.2305216789245605, 2.7139029502868652, 3.197284460067749, 3.6806657314300537, 4.1640472412109375, 4.647428512573242, 5.130809783935547, 5.614191055297852, 6.097572326660156, 6.580953598022461, 7.064334869384766, 7.54771614074707, 8.031097412109375, 8.51447868347168, 8.997859954833984, 9.481241226196289, 9.964622497558594, 10.448003768920898, 10.931385040283203, 11.414766311645508, 11.898147583007812, 12.381528854370117, 12.864910125732422, 13.348292350769043, 13.831673622131348, 14.315054893493652, 14.798436164855957, 15.281817436218262, 15.765198707580566, 16.248580932617188, 16.731962203979492, 17.215343475341797, 17.6987247467041, 18.182106018066406, 18.66548728942871, 19.148868560791016, 19.63224983215332, 20.115631103515625, 20.59901237487793, 21.082393646240234]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 6.0, 18.0, 11.0, 18.0, 36.0, 24.0, 30.0, 21.0, 40.0, 47.0, 56.0, 45.0, 54.0, 61.0, 70.0, 57.0, 61.0, 53.0, 52.0, 34.0, 36.0, 36.0, 24.0, 23.0, 18.0, 28.0, 14.0, 5.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.16443157196045, -8.89543342590332, -8.626435279846191, -8.357437133789062, -8.08843994140625, -7.819441318511963, -7.550443649291992, -7.281445503234863, -7.012447357177734, -6.7434492111206055, -6.474451065063477, -6.205453395843506, -5.936455249786377, -5.667457103729248, -5.398459434509277, -5.129461288452148, -4.8604631423950195, -4.591464996337891, -4.322466850280762, -4.053469181060791, -3.784471035003662, -3.515472888946533, -3.2464749813079834, -2.9774770736694336, -2.7084789276123047, -2.439480781555176, -2.170482873916626, -1.9014848470687866, -1.6324868202209473, -1.363488793373108, -1.0944907665252686, -0.8254927396774292, -0.5564937591552734, -0.2874957323074341, -0.018497705459594727, 0.25050032138824463, 0.519498348236084, 0.7884963750839233, 1.0574944019317627, 1.326492428779602, 1.5954904556274414, 1.8644884824752808, 2.13348650932312, 2.40248441696167, 2.671482563018799, 2.9404807090759277, 3.2094786167144775, 3.4784765243530273, 3.7474746704101562, 4.016472816467285, 4.285470962524414, 4.554468631744385, 4.823466777801514, 5.092464923858643, 5.361462593078613, 5.630460739135742, 5.899458885192871, 6.16845703125, 6.437455177307129, 6.7064528465271, 6.9754509925842285, 7.244449138641357, 7.513446807861328, 7.782444953918457, 8.051443099975586]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 15.0, 23.0, 19.0, 37.0, 45.0, 63.0, 97.0, 153.0, 265.0, 442.0, 683.0, 1183.0, 2291.0, 4251.0, 8584.0, 18208.0, 39923.0, 96758.0, 229141.0, 325032.0, 184050.0, 75089.0, 32139.0, 14618.0, 7185.0, 3607.0, 1952.0, 1040.0, 587.0, 392.0, 222.0, 140.0, 103.0, 68.0, 46.0, 32.0, 15.0, 18.0, 8.0, 4.0, 4.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.09869384765625, -3.9591064453125, -3.81951904296875, -3.679931640625, -3.54034423828125, -3.4007568359375, -3.26116943359375, -3.12158203125, -2.98199462890625, -2.8424072265625, -2.70281982421875, -2.563232421875, -2.42364501953125, -2.2840576171875, -2.14447021484375, -2.0048828125, -1.86529541015625, -1.7257080078125, -1.58612060546875, -1.446533203125, -1.30694580078125, -1.1673583984375, -1.02777099609375, -0.88818359375, -0.74859619140625, -0.6090087890625, -0.46942138671875, -0.329833984375, -0.19024658203125, -0.0506591796875, 0.08892822265625, 0.228515625, 0.36810302734375, 0.5076904296875, 0.64727783203125, 0.786865234375, 0.92645263671875, 1.0660400390625, 1.20562744140625, 1.34521484375, 1.48480224609375, 1.6243896484375, 1.76397705078125, 1.903564453125, 2.04315185546875, 2.1827392578125, 2.32232666015625, 2.4619140625, 2.60150146484375, 2.7410888671875, 2.88067626953125, 3.020263671875, 3.15985107421875, 3.2994384765625, 3.43902587890625, 3.57861328125, 3.71820068359375, 3.8577880859375, 3.99737548828125, 4.136962890625, 4.27655029296875, 4.4161376953125, 4.55572509765625, 4.6953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 4.0, 13.0, 8.0, 10.0, 21.0, 20.0, 36.0, 32.0, 34.0, 45.0, 54.0, 48.0, 55.0, 76.0, 55.0, 53.0, 77.0, 54.0, 57.0, 39.0, 36.0, 33.0, 21.0, 28.0, 25.0, 15.0, 10.0, 13.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.015625, -1.9605560302734375, -1.905487060546875, -1.8504180908203125, -1.79534912109375, -1.7402801513671875, -1.685211181640625, -1.6301422119140625, -1.5750732421875, -1.5200042724609375, -1.464935302734375, -1.4098663330078125, -1.35479736328125, -1.2997283935546875, -1.244659423828125, -1.1895904541015625, -1.134521484375, -1.0794525146484375, -1.024383544921875, -0.9693145751953125, -0.91424560546875, -0.8591766357421875, -0.804107666015625, -0.7490386962890625, -0.6939697265625, -0.6389007568359375, -0.583831787109375, -0.5287628173828125, -0.47369384765625, -0.4186248779296875, -0.363555908203125, -0.3084869384765625, -0.25341796875, -0.1983489990234375, -0.143280029296875, -0.0882110595703125, -0.03314208984375, 0.0219268798828125, 0.076995849609375, 0.1320648193359375, 0.1871337890625, 0.2422027587890625, 0.297271728515625, 0.3523406982421875, 0.40740966796875, 0.4624786376953125, 0.517547607421875, 0.5726165771484375, 0.627685546875, 0.6827545166015625, 0.737823486328125, 0.7928924560546875, 0.84796142578125, 0.9030303955078125, 0.958099365234375, 1.0131683349609375, 1.0682373046875, 1.1233062744140625, 1.178375244140625, 1.2334442138671875, 1.28851318359375, 1.3435821533203125, 1.398651123046875, 1.4537200927734375, 1.5087890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 16.0, 10.0, 13.0, 16.0, 17.0, 29.0, 56.0, 55.0, 78.0, 117.0, 187.0, 274.0, 527.0, 896.0, 1703.0, 3590.0, 8272.0, 21191.0, 61576.0, 207698.0, 418782.0, 219740.0, 65217.0, 22184.0, 8558.0, 3617.0, 1763.0, 868.0, 546.0, 325.0, 218.0, 108.0, 91.0, 54.0, 36.0, 26.0, 21.0, 18.0, 15.0, 17.0, 5.0, 4.0, 11.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.30078125, -5.13262939453125, -4.9644775390625, -4.79632568359375, -4.628173828125, -4.46002197265625, -4.2918701171875, -4.12371826171875, -3.95556640625, -3.78741455078125, -3.6192626953125, -3.45111083984375, -3.282958984375, -3.11480712890625, -2.9466552734375, -2.77850341796875, -2.6103515625, -2.44219970703125, -2.2740478515625, -2.10589599609375, -1.937744140625, -1.76959228515625, -1.6014404296875, -1.43328857421875, -1.26513671875, -1.09698486328125, -0.9288330078125, -0.76068115234375, -0.592529296875, -0.42437744140625, -0.2562255859375, -0.08807373046875, 0.080078125, 0.24822998046875, 0.4163818359375, 0.58453369140625, 0.752685546875, 0.92083740234375, 1.0889892578125, 1.25714111328125, 1.42529296875, 1.59344482421875, 1.7615966796875, 1.92974853515625, 2.097900390625, 2.26605224609375, 2.4342041015625, 2.60235595703125, 2.7705078125, 2.93865966796875, 3.1068115234375, 3.27496337890625, 3.443115234375, 3.61126708984375, 3.7794189453125, 3.94757080078125, 4.11572265625, 4.28387451171875, 4.4520263671875, 4.62017822265625, 4.788330078125, 4.95648193359375, 5.1246337890625, 5.29278564453125, 5.4609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 12.0, 7.0, 12.0, 15.0, 19.0, 23.0, 24.0, 31.0, 31.0, 43.0, 40.0, 42.0, 52.0, 54.0, 50.0, 56.0, 54.0, 50.0, 49.0, 47.0, 35.0, 49.0, 27.0, 39.0, 14.0, 22.0, 23.0, 14.0, 10.0, 13.0, 10.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.765625, -6.5382080078125, -6.310791015625, -6.0833740234375, -5.85595703125, -5.6285400390625, -5.401123046875, -5.1737060546875, -4.9462890625, -4.7188720703125, -4.491455078125, -4.2640380859375, -4.03662109375, -3.8092041015625, -3.581787109375, -3.3543701171875, -3.126953125, -2.8995361328125, -2.672119140625, -2.4447021484375, -2.21728515625, -1.9898681640625, -1.762451171875, -1.5350341796875, -1.3076171875, -1.0802001953125, -0.852783203125, -0.6253662109375, -0.39794921875, -0.1705322265625, 0.056884765625, 0.2843017578125, 0.51171875, 0.7391357421875, 0.966552734375, 1.1939697265625, 1.42138671875, 1.6488037109375, 1.876220703125, 2.1036376953125, 2.3310546875, 2.5584716796875, 2.785888671875, 3.0133056640625, 3.24072265625, 3.4681396484375, 3.695556640625, 3.9229736328125, 4.150390625, 4.3778076171875, 4.605224609375, 4.8326416015625, 5.06005859375, 5.2874755859375, 5.514892578125, 5.7423095703125, 5.9697265625, 6.1971435546875, 6.424560546875, 6.6519775390625, 6.87939453125, 7.1068115234375, 7.334228515625, 7.5616455078125, 7.7890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 16.0, 18.0, 22.0, 45.0, 53.0, 94.0, 127.0, 268.0, 541.0, 1228.0, 2917.0, 8367.0, 27119.0, 100605.0, 344890.0, 389959.0, 123354.0, 32816.0, 9778.0, 3522.0, 1438.0, 601.0, 331.0, 160.0, 100.0, 70.0, 30.0, 23.0, 13.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8966827392578125, -1.831451416015625, -1.7662200927734375, -1.70098876953125, -1.6357574462890625, -1.570526123046875, -1.5052947998046875, -1.4400634765625, -1.3748321533203125, -1.309600830078125, -1.2443695068359375, -1.17913818359375, -1.1139068603515625, -1.048675537109375, -0.9834442138671875, -0.918212890625, -0.8529815673828125, -0.787750244140625, -0.7225189208984375, -0.65728759765625, -0.5920562744140625, -0.526824951171875, -0.4615936279296875, -0.3963623046875, -0.3311309814453125, -0.265899658203125, -0.2006683349609375, -0.13543701171875, -0.0702056884765625, -0.004974365234375, 0.0602569580078125, 0.12548828125, 0.1907196044921875, 0.255950927734375, 0.3211822509765625, 0.38641357421875, 0.4516448974609375, 0.516876220703125, 0.5821075439453125, 0.6473388671875, 0.7125701904296875, 0.777801513671875, 0.8430328369140625, 0.90826416015625, 0.9734954833984375, 1.038726806640625, 1.1039581298828125, 1.169189453125, 1.2344207763671875, 1.299652099609375, 1.3648834228515625, 1.43011474609375, 1.4953460693359375, 1.560577392578125, 1.6258087158203125, 1.6910400390625, 1.7562713623046875, 1.821502685546875, 1.8867340087890625, 1.95196533203125, 2.0171966552734375, 2.082427978515625, 2.1476593017578125, 2.212890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 2.0, 4.0, 12.0, 21.0, 9.0, 18.0, 17.0, 24.0, 28.0, 42.0, 36.0, 55.0, 59.0, 54.0, 68.0, 75.0, 72.0, 60.0, 41.0, 40.0, 37.0, 44.0, 30.0, 27.0, 11.0, 10.0, 13.0, 8.0, 14.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002741813659667969, -0.0002656318247318268, -0.0002570822834968567, -0.0002485327422618866, -0.0002399832010269165, -0.0002314336597919464, -0.00022288411855697632, -0.00021433457732200623, -0.00020578503608703613, -0.00019723549485206604, -0.00018868595361709595, -0.00018013641238212585, -0.00017158687114715576, -0.00016303732991218567, -0.00015448778867721558, -0.00014593824744224548, -0.0001373887062072754, -0.0001288391649723053, -0.0001202896237373352, -0.00011174008250236511, -0.00010319054126739502, -9.464100003242493e-05, -8.609145879745483e-05, -7.754191756248474e-05, -6.899237632751465e-05, -6.0442835092544556e-05, -5.189329385757446e-05, -4.334375262260437e-05, -3.479421138763428e-05, -2.6244670152664185e-05, -1.7695128917694092e-05, -9.145587682723999e-06, -5.960464477539062e-07, 7.953494787216187e-06, 1.650303602218628e-05, 2.5052577257156372e-05, 3.3602118492126465e-05, 4.215165972709656e-05, 5.070120096206665e-05, 5.925074219703674e-05, 6.780028343200684e-05, 7.634982466697693e-05, 8.489936590194702e-05, 9.344890713691711e-05, 0.00010199844837188721, 0.0001105479896068573, 0.00011909753084182739, 0.00012764707207679749, 0.00013619661331176758, 0.00014474615454673767, 0.00015329569578170776, 0.00016184523701667786, 0.00017039477825164795, 0.00017894431948661804, 0.00018749386072158813, 0.00019604340195655823, 0.00020459294319152832, 0.0002131424844264984, 0.0002216920256614685, 0.0002302415668964386, 0.0002387911081314087, 0.0002473406493663788, 0.0002558901906013489, 0.00026443973183631897, 0.00027298927307128906]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 9.0, 30.0, 30.0, 42.0, 80.0, 123.0, 228.0, 404.0, 748.0, 1576.0, 3698.0, 10076.0, 30341.0, 104126.0, 351967.0, 376234.0, 116383.0, 33702.0, 11027.0, 4154.0, 1720.0, 830.0, 411.0, 228.0, 122.0, 86.0, 53.0, 29.0, 31.0, 12.0, 14.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7135009765625, -1.647705078125, -1.5819091796875, -1.51611328125, -1.4503173828125, -1.384521484375, -1.3187255859375, -1.2529296875, -1.1871337890625, -1.121337890625, -1.0555419921875, -0.98974609375, -0.9239501953125, -0.858154296875, -0.7923583984375, -0.7265625, -0.6607666015625, -0.594970703125, -0.5291748046875, -0.46337890625, -0.3975830078125, -0.331787109375, -0.2659912109375, -0.2001953125, -0.1343994140625, -0.068603515625, -0.0028076171875, 0.06298828125, 0.1287841796875, 0.194580078125, 0.2603759765625, 0.326171875, 0.3919677734375, 0.457763671875, 0.5235595703125, 0.58935546875, 0.6551513671875, 0.720947265625, 0.7867431640625, 0.8525390625, 0.9183349609375, 0.984130859375, 1.0499267578125, 1.11572265625, 1.1815185546875, 1.247314453125, 1.3131103515625, 1.37890625, 1.4447021484375, 1.510498046875, 1.5762939453125, 1.64208984375, 1.7078857421875, 1.773681640625, 1.8394775390625, 1.9052734375, 1.9710693359375, 2.036865234375, 2.1026611328125, 2.16845703125, 2.2342529296875, 2.300048828125, 2.3658447265625, 2.431640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 8.0, 6.0, 9.0, 22.0, 25.0, 19.0, 32.0, 35.0, 49.0, 50.0, 76.0, 64.0, 61.0, 79.0, 67.0, 64.0, 51.0, 50.0, 42.0, 23.0, 36.0, 18.0, 18.0, 14.0, 12.0, 3.0, 11.0, 8.0, 13.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.9635009765625, -1.907470703125, -1.8514404296875, -1.79541015625, -1.7393798828125, -1.683349609375, -1.6273193359375, -1.5712890625, -1.5152587890625, -1.459228515625, -1.4031982421875, -1.34716796875, -1.2911376953125, -1.235107421875, -1.1790771484375, -1.123046875, -1.0670166015625, -1.010986328125, -0.9549560546875, -0.89892578125, -0.8428955078125, -0.786865234375, -0.7308349609375, -0.6748046875, -0.6187744140625, -0.562744140625, -0.5067138671875, -0.45068359375, -0.3946533203125, -0.338623046875, -0.2825927734375, -0.2265625, -0.1705322265625, -0.114501953125, -0.0584716796875, -0.00244140625, 0.0535888671875, 0.109619140625, 0.1656494140625, 0.2216796875, 0.2777099609375, 0.333740234375, 0.3897705078125, 0.44580078125, 0.5018310546875, 0.557861328125, 0.6138916015625, 0.669921875, 0.7259521484375, 0.781982421875, 0.8380126953125, 0.89404296875, 0.9500732421875, 1.006103515625, 1.0621337890625, 1.1181640625, 1.1741943359375, 1.230224609375, 1.2862548828125, 1.34228515625, 1.3983154296875, 1.454345703125, 1.5103759765625, 1.56640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 17.0, 18.0, 37.0, 62.0, 95.0, 165.0, 185.0, 134.0, 107.0, 82.0, 32.0, 30.0, 14.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.86506271362305, -47.368404388427734, -45.871742248535156, -44.375083923339844, -42.87842559814453, -41.38176727294922, -39.88510513305664, -38.38844680786133, -36.89178466796875, -35.39512634277344, -33.89846420288086, -32.40180587768555, -30.905147552490234, -29.40848731994629, -27.911827087402344, -26.41516876220703, -24.91851043701172, -23.421850204467773, -21.92519187927246, -20.428531646728516, -18.931873321533203, -17.435213088989258, -15.938552856445312, -14.441893577575684, -12.945234298706055, -11.448575019836426, -9.951915740966797, -8.455255508422852, -6.958596229553223, -5.461936950683594, -3.9652767181396484, -2.4686174392700195, -0.9719619750976562, 0.5246975421905518, 2.0213570594787598, 3.518016815185547, 5.014676094055176, 6.511335372924805, 8.00799560546875, 9.504654884338379, 11.001314163208008, 12.497973442077637, 13.994632720947266, 15.491292953491211, 16.987953186035156, 18.48461151123047, 19.981271743774414, 21.47793197631836, 22.974590301513672, 24.471250534057617, 25.96790885925293, 27.464569091796875, 28.961227416992188, 30.457887649536133, 31.954547882080078, 33.45120620727539, 34.94786834716797, 36.44452667236328, 37.94118881225586, 39.43784713745117, 40.934505462646484, 42.43116760253906, 43.927825927734375, 45.42448425292969, 46.921142578125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 11.0, 12.0, 13.0, 7.0, 24.0, 31.0, 31.0, 42.0, 49.0, 47.0, 62.0, 70.0, 63.0, 73.0, 75.0, 60.0, 58.0, 48.0, 52.0, 29.0, 32.0, 32.0, 26.0, 9.0, 17.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.17780303955078, -53.426483154296875, -51.67516326904297, -49.92384338378906, -48.17251968383789, -46.421199798583984, -44.66987991333008, -42.91856002807617, -41.167236328125, -39.415916442871094, -37.66459655761719, -35.91327667236328, -34.16195297241211, -32.4106330871582, -30.659313201904297, -28.90799331665039, -27.156673431396484, -25.405353546142578, -23.65403175354004, -21.902711868286133, -20.151390075683594, -18.400070190429688, -16.64875030517578, -14.897429466247559, -13.146108627319336, -11.394787788391113, -9.64346694946289, -7.892147064208984, -6.140826225280762, -4.389505386352539, -2.638185501098633, -0.8868646621704102, 0.8644561767578125, 2.615776777267456, 4.3670973777771, 6.118417739868164, 7.869738578796387, 9.62105941772461, 11.372379302978516, 13.123700141906738, 14.875020980834961, 16.626340866088867, 18.377662658691406, 20.128982543945312, 21.88030242919922, 23.631624221801758, 25.382944107055664, 27.134265899658203, 28.88558578491211, 30.636905670166016, 32.38822555541992, 34.139549255371094, 35.890869140625, 37.642189025878906, 39.39350891113281, 41.14482879638672, 42.896148681640625, 44.64746856689453, 46.39878845214844, 48.150108337402344, 49.901432037353516, 51.65275192260742, 53.40407180786133, 55.155391693115234, 56.906715393066406]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 11.0, 29.0, 35.0, 42.0, 57.0, 97.0, 119.0, 208.0, 353.0, 584.0, 1004.0, 2001.0, 4070.0, 10403.0, 32414.0, 167025.0, 3304588.0, 580365.0, 62875.0, 16456.0, 5816.0, 2564.0, 1330.0, 696.0, 359.0, 267.0, 163.0, 107.0, 73.0, 48.0, 32.0, 16.0, 12.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9375, -7.6873779296875, -7.437255859375, -7.1871337890625, -6.93701171875, -6.6868896484375, -6.436767578125, -6.1866455078125, -5.9365234375, -5.6864013671875, -5.436279296875, -5.1861572265625, -4.93603515625, -4.6859130859375, -4.435791015625, -4.1856689453125, -3.935546875, -3.6854248046875, -3.435302734375, -3.1851806640625, -2.93505859375, -2.6849365234375, -2.434814453125, -2.1846923828125, -1.9345703125, -1.6844482421875, -1.434326171875, -1.1842041015625, -0.93408203125, -0.6839599609375, -0.433837890625, -0.1837158203125, 0.06640625, 0.3165283203125, 0.566650390625, 0.8167724609375, 1.06689453125, 1.3170166015625, 1.567138671875, 1.8172607421875, 2.0673828125, 2.3175048828125, 2.567626953125, 2.8177490234375, 3.06787109375, 3.3179931640625, 3.568115234375, 3.8182373046875, 4.068359375, 4.3184814453125, 4.568603515625, 4.8187255859375, 5.06884765625, 5.3189697265625, 5.569091796875, 5.8192138671875, 6.0693359375, 6.3194580078125, 6.569580078125, 6.8197021484375, 7.06982421875, 7.3199462890625, 7.570068359375, 7.8201904296875, 8.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 10.0, 10.0, 14.0, 19.0, 24.0, 16.0, 30.0, 41.0, 37.0, 47.0, 62.0, 55.0, 74.0, 50.0, 60.0, 56.0, 64.0, 45.0, 49.0, 35.0, 37.0, 32.0, 25.0, 19.0, 17.0, 16.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7728424072265625, -1.718536376953125, -1.6642303466796875, -1.60992431640625, -1.5556182861328125, -1.501312255859375, -1.4470062255859375, -1.3927001953125, -1.3383941650390625, -1.284088134765625, -1.2297821044921875, -1.17547607421875, -1.1211700439453125, -1.066864013671875, -1.0125579833984375, -0.958251953125, -0.9039459228515625, -0.849639892578125, -0.7953338623046875, -0.74102783203125, -0.6867218017578125, -0.632415771484375, -0.5781097412109375, -0.5238037109375, -0.4694976806640625, -0.415191650390625, -0.3608856201171875, -0.30657958984375, -0.2522735595703125, -0.197967529296875, -0.1436614990234375, -0.08935546875, -0.0350494384765625, 0.019256591796875, 0.0735626220703125, 0.12786865234375, 0.1821746826171875, 0.236480712890625, 0.2907867431640625, 0.3450927734375, 0.3993988037109375, 0.453704833984375, 0.5080108642578125, 0.56231689453125, 0.6166229248046875, 0.670928955078125, 0.7252349853515625, 0.779541015625, 0.8338470458984375, 0.888153076171875, 0.9424591064453125, 0.99676513671875, 1.0510711669921875, 1.105377197265625, 1.1596832275390625, 1.2139892578125, 1.2682952880859375, 1.322601318359375, 1.3769073486328125, 1.43121337890625, 1.4855194091796875, 1.539825439453125, 1.5941314697265625, 1.6484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 14.0, 21.0, 41.0, 67.0, 112.0, 272.0, 752.0, 3854.0, 114591.0, 4044471.0, 27093.0, 2124.0, 530.0, 184.0, 70.0, 40.0, 31.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.890625, -27.216064453125, -26.54150390625, -25.866943359375, -25.1923828125, -24.517822265625, -23.84326171875, -23.168701171875, -22.494140625, -21.819580078125, -21.14501953125, -20.470458984375, -19.7958984375, -19.121337890625, -18.44677734375, -17.772216796875, -17.09765625, -16.423095703125, -15.74853515625, -15.073974609375, -14.3994140625, -13.724853515625, -13.05029296875, -12.375732421875, -11.701171875, -11.026611328125, -10.35205078125, -9.677490234375, -9.0029296875, -8.328369140625, -7.65380859375, -6.979248046875, -6.3046875, -5.630126953125, -4.95556640625, -4.281005859375, -3.6064453125, -2.931884765625, -2.25732421875, -1.582763671875, -0.908203125, -0.233642578125, 0.44091796875, 1.115478515625, 1.7900390625, 2.464599609375, 3.13916015625, 3.813720703125, 4.48828125, 5.162841796875, 5.83740234375, 6.511962890625, 7.1865234375, 7.861083984375, 8.53564453125, 9.210205078125, 9.884765625, 10.559326171875, 11.23388671875, 11.908447265625, 12.5830078125, 13.257568359375, 13.93212890625, 14.606689453125, 15.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 14.0, 21.0, 45.0, 83.0, 168.0, 463.0, 1630.0, 1128.0, 279.0, 103.0, 54.0, 31.0, 18.0, 9.0, 5.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.2254638671875, -7.048583984375, -6.8717041015625, -6.69482421875, -6.5179443359375, -6.341064453125, -6.1641845703125, -5.9873046875, -5.8104248046875, -5.633544921875, -5.4566650390625, -5.27978515625, -5.1029052734375, -4.926025390625, -4.7491455078125, -4.572265625, -4.3953857421875, -4.218505859375, -4.0416259765625, -3.86474609375, -3.6878662109375, -3.510986328125, -3.3341064453125, -3.1572265625, -2.9803466796875, -2.803466796875, -2.6265869140625, -2.44970703125, -2.2728271484375, -2.095947265625, -1.9190673828125, -1.7421875, -1.5653076171875, -1.388427734375, -1.2115478515625, -1.03466796875, -0.8577880859375, -0.680908203125, -0.5040283203125, -0.3271484375, -0.1502685546875, 0.026611328125, 0.2034912109375, 0.38037109375, 0.5572509765625, 0.734130859375, 0.9110107421875, 1.087890625, 1.2647705078125, 1.441650390625, 1.6185302734375, 1.79541015625, 1.9722900390625, 2.149169921875, 2.3260498046875, 2.5029296875, 2.6798095703125, 2.856689453125, 3.0335693359375, 3.21044921875, 3.3873291015625, 3.564208984375, 3.7410888671875, 3.91796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 26.0, 63.0, 238.0, 382.0, 210.0, 61.0, 15.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1904067993164, -69.59600830078125, -68.0016098022461, -66.40721130371094, -64.81281280517578, -63.218414306640625, -61.62401580810547, -60.02961730957031, -58.435218811035156, -56.8408203125, -55.246421813964844, -53.65202331542969, -52.05762481689453, -50.463226318359375, -48.86882781982422, -47.27442932128906, -45.680030822753906, -44.08563232421875, -42.491233825683594, -40.89683532714844, -39.30243682861328, -37.708038330078125, -36.11363983154297, -34.51924133300781, -32.92483901977539, -31.330440521240234, -29.736042022705078, -28.141643524169922, -26.547245025634766, -24.95284652709961, -23.358448028564453, -21.764049530029297, -20.169649124145508, -18.57525062561035, -16.980852127075195, -15.386453628540039, -13.792055130004883, -12.197656631469727, -10.603257179260254, -9.008858680725098, -7.414460182189941, -5.820061683654785, -4.225663185119629, -2.6312642097473145, -1.0368657112121582, 0.557532787322998, 2.1519317626953125, 3.7463302612304688, 5.340728759765625, 6.935127258300781, 8.529525756835938, 10.123924255371094, 11.71832275390625, 13.312721252441406, 14.907120704650879, 16.50151824951172, 18.095916748046875, 19.69031524658203, 21.284713745117188, 22.879112243652344, 24.4735107421875, 26.067909240722656, 27.662307739257812, 29.25670623779297, 30.851106643676758]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 4.0, 12.0, 14.0, 23.0, 19.0, 27.0, 36.0, 50.0, 48.0, 49.0, 44.0, 74.0, 59.0, 59.0, 63.0, 54.0, 57.0, 41.0, 49.0, 40.0, 47.0, 31.0, 25.0, 17.0, 10.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.38701057434082, -18.855302810668945, -18.32359504699707, -17.791887283325195, -17.26017951965332, -16.728471755981445, -16.19676399230957, -15.665056228637695, -15.13334846496582, -14.601640701293945, -14.06993293762207, -13.538225173950195, -13.00651741027832, -12.474809646606445, -11.94310188293457, -11.411394119262695, -10.87968635559082, -10.347978591918945, -9.81627082824707, -9.284563064575195, -8.75285530090332, -8.221147537231445, -7.68943977355957, -7.157732009887695, -6.62602424621582, -6.094316482543945, -5.56260871887207, -5.030900955200195, -4.49919319152832, -3.9674854278564453, -3.4357776641845703, -2.9040699005126953, -2.372361183166504, -1.840653419494629, -1.308945655822754, -0.7772378921508789, -0.2455301284790039, 0.2861776351928711, 0.8178853988647461, 1.349593162536621, 1.881300926208496, 2.413008689880371, 2.944716453552246, 3.476424217224121, 4.008131980895996, 4.539839744567871, 5.071547508239746, 5.603255271911621, 6.134963035583496, 6.666670799255371, 7.198378562927246, 7.730086326599121, 8.261794090270996, 8.793501853942871, 9.325209617614746, 9.856917381286621, 10.388625144958496, 10.920332908630371, 11.452040672302246, 11.983748435974121, 12.515456199645996, 13.047163963317871, 13.578871726989746, 14.110579490661621, 14.642287254333496]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 5.0, 3.0, 9.0, 9.0, 24.0, 27.0, 36.0, 50.0, 88.0, 155.0, 204.0, 338.0, 494.0, 832.0, 1535.0, 2878.0, 6287.0, 14477.0, 40192.0, 132380.0, 395572.0, 309727.0, 92525.0, 29441.0, 10971.0, 4821.0, 2279.0, 1255.0, 653.0, 423.0, 309.0, 208.0, 117.0, 73.0, 50.0, 36.0, 18.0, 13.0, 7.0, 6.0, 10.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.27734375, -7.06854248046875, -6.8597412109375, -6.65093994140625, -6.442138671875, -6.23333740234375, -6.0245361328125, -5.81573486328125, -5.60693359375, -5.39813232421875, -5.1893310546875, -4.98052978515625, -4.771728515625, -4.56292724609375, -4.3541259765625, -4.14532470703125, -3.9365234375, -3.72772216796875, -3.5189208984375, -3.31011962890625, -3.101318359375, -2.89251708984375, -2.6837158203125, -2.47491455078125, -2.26611328125, -2.05731201171875, -1.8485107421875, -1.63970947265625, -1.430908203125, -1.22210693359375, -1.0133056640625, -0.80450439453125, -0.595703125, -0.38690185546875, -0.1781005859375, 0.03070068359375, 0.239501953125, 0.44830322265625, 0.6571044921875, 0.86590576171875, 1.07470703125, 1.28350830078125, 1.4923095703125, 1.70111083984375, 1.909912109375, 2.11871337890625, 2.3275146484375, 2.53631591796875, 2.7451171875, 2.95391845703125, 3.1627197265625, 3.37152099609375, 3.580322265625, 3.78912353515625, 3.9979248046875, 4.20672607421875, 4.41552734375, 4.62432861328125, 4.8331298828125, 5.04193115234375, 5.250732421875, 5.45953369140625, 5.6683349609375, 5.87713623046875, 6.0859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 12.0, 13.0, 7.0, 28.0, 21.0, 35.0, 46.0, 51.0, 51.0, 61.0, 63.0, 77.0, 82.0, 67.0, 55.0, 60.0, 57.0, 38.0, 41.0, 32.0, 25.0, 23.0, 7.0, 12.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.193359375, -2.1304168701171875, -2.067474365234375, -2.0045318603515625, -1.94158935546875, -1.8786468505859375, -1.815704345703125, -1.7527618408203125, -1.6898193359375, -1.6268768310546875, -1.563934326171875, -1.5009918212890625, -1.43804931640625, -1.3751068115234375, -1.312164306640625, -1.2492218017578125, -1.186279296875, -1.1233367919921875, -1.060394287109375, -0.9974517822265625, -0.93450927734375, -0.8715667724609375, -0.808624267578125, -0.7456817626953125, -0.6827392578125, -0.6197967529296875, -0.556854248046875, -0.4939117431640625, -0.43096923828125, -0.3680267333984375, -0.305084228515625, -0.2421417236328125, -0.17919921875, -0.1162567138671875, -0.053314208984375, 0.0096282958984375, 0.07257080078125, 0.1355133056640625, 0.198455810546875, 0.2613983154296875, 0.3243408203125, 0.3872833251953125, 0.450225830078125, 0.5131683349609375, 0.57611083984375, 0.6390533447265625, 0.701995849609375, 0.7649383544921875, 0.827880859375, 0.8908233642578125, 0.953765869140625, 1.0167083740234375, 1.07965087890625, 1.1425933837890625, 1.205535888671875, 1.2684783935546875, 1.3314208984375, 1.3943634033203125, 1.457305908203125, 1.5202484130859375, 1.58319091796875, 1.6461334228515625, 1.709075927734375, 1.7720184326171875, 1.8349609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 16.0, 19.0, 28.0, 21.0, 32.0, 52.0, 75.0, 75.0, 107.0, 165.0, 274.0, 448.0, 736.0, 1294.0, 2267.0, 3997.0, 7376.0, 14387.0, 28845.0, 63616.0, 142922.0, 265582.0, 260735.0, 136784.0, 60299.0, 28172.0, 13785.0, 7100.0, 3869.0, 2165.0, 1267.0, 741.0, 443.0, 259.0, 165.0, 112.0, 69.0, 62.0, 57.0, 35.0, 25.0, 23.0, 14.0, 8.0, 12.0, 3.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.549163818359375, -3.43817138671875, -3.327178955078125, -3.2161865234375, -3.105194091796875, -2.99420166015625, -2.883209228515625, -2.772216796875, -2.661224365234375, -2.55023193359375, -2.439239501953125, -2.3282470703125, -2.217254638671875, -2.10626220703125, -1.995269775390625, -1.88427734375, -1.773284912109375, -1.66229248046875, -1.551300048828125, -1.4403076171875, -1.329315185546875, -1.21832275390625, -1.107330322265625, -0.996337890625, -0.885345458984375, -0.77435302734375, -0.663360595703125, -0.5523681640625, -0.441375732421875, -0.33038330078125, -0.219390869140625, -0.1083984375, 0.002593994140625, 0.11358642578125, 0.224578857421875, 0.3355712890625, 0.446563720703125, 0.55755615234375, 0.668548583984375, 0.779541015625, 0.890533447265625, 1.00152587890625, 1.112518310546875, 1.2235107421875, 1.334503173828125, 1.44549560546875, 1.556488037109375, 1.66748046875, 1.778472900390625, 1.88946533203125, 2.000457763671875, 2.1114501953125, 2.222442626953125, 2.33343505859375, 2.444427490234375, 2.555419921875, 2.666412353515625, 2.77740478515625, 2.888397216796875, 2.9993896484375, 3.110382080078125, 3.22137451171875, 3.332366943359375, 3.443359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 4.0, 7.0, 8.0, 14.0, 14.0, 8.0, 11.0, 17.0, 21.0, 23.0, 24.0, 33.0, 38.0, 42.0, 26.0, 33.0, 34.0, 40.0, 38.0, 41.0, 35.0, 44.0, 37.0, 45.0, 44.0, 42.0, 32.0, 32.0, 23.0, 33.0, 17.0, 23.0, 17.0, 22.0, 13.0, 7.0, 8.0, 4.0, 8.0, 7.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.33367919921875, -5.1595458984375, -4.98541259765625, -4.811279296875, -4.63714599609375, -4.4630126953125, -4.28887939453125, -4.11474609375, -3.94061279296875, -3.7664794921875, -3.59234619140625, -3.418212890625, -3.24407958984375, -3.0699462890625, -2.89581298828125, -2.7216796875, -2.54754638671875, -2.3734130859375, -2.19927978515625, -2.025146484375, -1.85101318359375, -1.6768798828125, -1.50274658203125, -1.32861328125, -1.15447998046875, -0.9803466796875, -0.80621337890625, -0.632080078125, -0.45794677734375, -0.2838134765625, -0.10968017578125, 0.064453125, 0.23858642578125, 0.4127197265625, 0.58685302734375, 0.760986328125, 0.93511962890625, 1.1092529296875, 1.28338623046875, 1.45751953125, 1.63165283203125, 1.8057861328125, 1.97991943359375, 2.154052734375, 2.32818603515625, 2.5023193359375, 2.67645263671875, 2.8505859375, 3.02471923828125, 3.1988525390625, 3.37298583984375, 3.547119140625, 3.72125244140625, 3.8953857421875, 4.06951904296875, 4.24365234375, 4.41778564453125, 4.5919189453125, 4.76605224609375, 4.940185546875, 5.11431884765625, 5.2884521484375, 5.46258544921875, 5.63671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 13.0, 22.0, 31.0, 48.0, 64.0, 113.0, 217.0, 343.0, 611.0, 1341.0, 3052.0, 7894.0, 23482.0, 80277.0, 286341.0, 431725.0, 149520.0, 41663.0, 13075.0, 4768.0, 1940.0, 865.0, 449.0, 252.0, 145.0, 83.0, 56.0, 39.0, 18.0, 13.0, 16.0, 14.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.1741943359375, -2.102294921875, -2.0303955078125, -1.95849609375, -1.8865966796875, -1.814697265625, -1.7427978515625, -1.6708984375, -1.5989990234375, -1.527099609375, -1.4552001953125, -1.38330078125, -1.3114013671875, -1.239501953125, -1.1676025390625, -1.095703125, -1.0238037109375, -0.951904296875, -0.8800048828125, -0.80810546875, -0.7362060546875, -0.664306640625, -0.5924072265625, -0.5205078125, -0.4486083984375, -0.376708984375, -0.3048095703125, -0.23291015625, -0.1610107421875, -0.089111328125, -0.0172119140625, 0.0546875, 0.1265869140625, 0.198486328125, 0.2703857421875, 0.34228515625, 0.4141845703125, 0.486083984375, 0.5579833984375, 0.6298828125, 0.7017822265625, 0.773681640625, 0.8455810546875, 0.91748046875, 0.9893798828125, 1.061279296875, 1.1331787109375, 1.205078125, 1.2769775390625, 1.348876953125, 1.4207763671875, 1.49267578125, 1.5645751953125, 1.636474609375, 1.7083740234375, 1.7802734375, 1.8521728515625, 1.924072265625, 1.9959716796875, 2.06787109375, 2.1397705078125, 2.211669921875, 2.2835693359375, 2.35546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 12.0, 12.0, 23.0, 21.0, 41.0, 46.0, 65.0, 81.0, 97.0, 108.0, 118.0, 56.0, 51.0, 52.0, 33.0, 31.0, 31.0, 18.0, 17.0, 10.0, 9.0, 5.0, 5.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00042629241943359375, -0.0004149340093135834, -0.000403575599193573, -0.0003922171890735626, -0.00038085877895355225, -0.00036950036883354187, -0.0003581419587135315, -0.0003467835485935211, -0.00033542513847351074, -0.00032406672835350037, -0.00031270831823349, -0.0003013499081134796, -0.00028999149799346924, -0.00027863308787345886, -0.0002672746777534485, -0.0002559162676334381, -0.00024455785751342773, -0.00023319944739341736, -0.00022184103727340698, -0.0002104826271533966, -0.00019912421703338623, -0.00018776580691337585, -0.00017640739679336548, -0.0001650489866733551, -0.00015369057655334473, -0.00014233216643333435, -0.00013097375631332397, -0.0001196153461933136, -0.00010825693607330322, -9.689852595329285e-05, -8.554011583328247e-05, -7.41817057132721e-05, -6.282329559326172e-05, -5.146488547325134e-05, -4.010647535324097e-05, -2.874806523323059e-05, -1.7389655113220215e-05, -6.031244993209839e-06, 5.327165126800537e-06, 1.6685575246810913e-05, 2.804398536682129e-05, 3.9402395486831665e-05, 5.076080560684204e-05, 6.211921572685242e-05, 7.347762584686279e-05, 8.483603596687317e-05, 9.619444608688354e-05, 0.00010755285620689392, 0.0001189112663269043, 0.00013026967644691467, 0.00014162808656692505, 0.00015298649668693542, 0.0001643449068069458, 0.00017570331692695618, 0.00018706172704696655, 0.00019842013716697693, 0.0002097785472869873, 0.00022113695740699768, 0.00023249536752700806, 0.00024385377764701843, 0.0002552121877670288, 0.0002665705978870392, 0.00027792900800704956, 0.00028928741812705994, 0.0003006458282470703]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 12.0, 14.0, 23.0, 23.0, 48.0, 64.0, 114.0, 194.0, 411.0, 825.0, 1877.0, 4817.0, 14341.0, 50950.0, 218170.0, 530001.0, 166793.0, 40841.0, 11773.0, 4086.0, 1601.0, 761.0, 333.0, 192.0, 93.0, 52.0, 43.0, 25.0, 26.0, 13.0, 5.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.478240966796875, -2.39398193359375, -2.309722900390625, -2.2254638671875, -2.141204833984375, -2.05694580078125, -1.972686767578125, -1.888427734375, -1.804168701171875, -1.71990966796875, -1.635650634765625, -1.5513916015625, -1.467132568359375, -1.38287353515625, -1.298614501953125, -1.21435546875, -1.130096435546875, -1.04583740234375, -0.961578369140625, -0.8773193359375, -0.793060302734375, -0.70880126953125, -0.624542236328125, -0.540283203125, -0.456024169921875, -0.37176513671875, -0.287506103515625, -0.2032470703125, -0.118988037109375, -0.03472900390625, 0.049530029296875, 0.1337890625, 0.218048095703125, 0.30230712890625, 0.386566162109375, 0.4708251953125, 0.555084228515625, 0.63934326171875, 0.723602294921875, 0.807861328125, 0.892120361328125, 0.97637939453125, 1.060638427734375, 1.1448974609375, 1.229156494140625, 1.31341552734375, 1.397674560546875, 1.48193359375, 1.566192626953125, 1.65045166015625, 1.734710693359375, 1.8189697265625, 1.903228759765625, 1.98748779296875, 2.071746826171875, 2.156005859375, 2.240264892578125, 2.32452392578125, 2.408782958984375, 2.4930419921875, 2.577301025390625, 2.66156005859375, 2.745819091796875, 2.830078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 3.0, 12.0, 13.0, 15.0, 30.0, 38.0, 38.0, 63.0, 79.0, 67.0, 100.0, 95.0, 83.0, 69.0, 59.0, 35.0, 46.0, 44.0, 22.0, 18.0, 12.0, 12.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.7845306396484375, -1.708709716796875, -1.6328887939453125, -1.55706787109375, -1.4812469482421875, -1.405426025390625, -1.3296051025390625, -1.2537841796875, -1.1779632568359375, -1.102142333984375, -1.0263214111328125, -0.95050048828125, -0.8746795654296875, -0.798858642578125, -0.7230377197265625, -0.647216796875, -0.5713958740234375, -0.495574951171875, -0.4197540283203125, -0.34393310546875, -0.2681121826171875, -0.192291259765625, -0.1164703369140625, -0.0406494140625, 0.0351715087890625, 0.110992431640625, 0.1868133544921875, 0.26263427734375, 0.3384552001953125, 0.414276123046875, 0.4900970458984375, 0.56591796875, 0.6417388916015625, 0.717559814453125, 0.7933807373046875, 0.86920166015625, 0.9450225830078125, 1.020843505859375, 1.0966644287109375, 1.1724853515625, 1.2483062744140625, 1.324127197265625, 1.3999481201171875, 1.47576904296875, 1.5515899658203125, 1.627410888671875, 1.7032318115234375, 1.779052734375, 1.8548736572265625, 1.930694580078125, 2.0065155029296875, 2.08233642578125, 2.1581573486328125, 2.233978271484375, 2.3097991943359375, 2.3856201171875, 2.4614410400390625, 2.537261962890625, 2.6130828857421875, 2.68890380859375, 2.7647247314453125, 2.840545654296875, 2.9163665771484375, 2.9921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 24.0, 40.0, 39.0, 97.0, 161.0, 202.0, 195.0, 99.0, 56.0, 34.0, 19.0, 9.0, 5.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.545568466186523, -21.862661361694336, -20.17975425720215, -18.49684715270996, -16.813940048217773, -15.131033897399902, -13.448126792907715, -11.765219688415527, -10.08231258392334, -8.399405479431152, -6.716498374938965, -5.0335917472839355, -3.350684642791748, -1.6677780151367188, 0.01512908935546875, 1.6980361938476562, 3.3809432983398438, 5.063850402832031, 6.746757507324219, 8.429664611816406, 10.112571716308594, 11.795477867126465, 13.478384971618652, 15.16129207611084, 16.844200134277344, 18.52710723876953, 20.21001434326172, 21.892921447753906, 23.575828552246094, 25.25873565673828, 26.94164276123047, 28.624549865722656, 30.307453155517578, 31.990360260009766, 33.67326736450195, 35.35617446899414, 37.03908157348633, 38.721988677978516, 40.4048957824707, 42.08780288696289, 43.77070999145508, 45.453617095947266, 47.13652420043945, 48.81943130493164, 50.50233840942383, 52.185245513916016, 53.8681526184082, 55.55105972290039, 57.23396301269531, 58.9168701171875, 60.59977722167969, 62.282684326171875, 63.96559143066406, 65.64849853515625, 67.33140563964844, 69.01431274414062, 70.69721984863281, 72.380126953125, 74.06303405761719, 75.74594116210938, 77.42884826660156, 79.11175537109375, 80.79466247558594, 82.47756958007812, 84.16047668457031]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 11.0, 11.0, 17.0, 19.0, 23.0, 23.0, 25.0, 19.0, 34.0, 32.0, 35.0, 46.0, 51.0, 51.0, 34.0, 43.0, 53.0, 62.0, 46.0, 36.0, 45.0, 30.0, 36.0, 28.0, 24.0, 25.0, 20.0, 18.0, 18.0, 20.0, 7.0, 7.0, 14.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.64718246459961, -33.43120193481445, -32.2152214050293, -30.999238967895508, -29.78325843811035, -28.567277908325195, -27.351295471191406, -26.13531494140625, -24.919334411621094, -23.703353881835938, -22.48737335205078, -21.271390914916992, -20.055410385131836, -18.83942985534668, -17.62344741821289, -16.407466888427734, -15.191486358642578, -13.975505828857422, -12.75952434539795, -11.543542861938477, -10.32756233215332, -9.111581802368164, -7.895600318908691, -6.679618835449219, -5.4636383056640625, -4.247657299041748, -3.0316762924194336, -1.8156952857971191, -0.5997142791748047, 0.6162667274475098, 1.8322477340698242, 3.048229217529297, 4.264213562011719, 5.480194568634033, 6.696175575256348, 7.912156581878662, 9.128137588500977, 10.344118118286133, 11.560099601745605, 12.776081085205078, 13.992061614990234, 15.20804214477539, 16.424022674560547, 17.640005111694336, 18.855985641479492, 20.07196617126465, 21.287948608398438, 22.503929138183594, 23.71990966796875, 24.935890197753906, 26.151870727539062, 27.36785316467285, 28.583833694458008, 29.799814224243164, 31.015796661376953, 32.23177719116211, 33.447757720947266, 34.66373825073242, 35.87971878051758, 37.095699310302734, 38.311683654785156, 39.52766418457031, 40.74364471435547, 41.959625244140625, 43.17560577392578]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 12.0, 8.0, 10.0, 13.0, 17.0, 24.0, 50.0, 61.0, 75.0, 125.0, 217.0, 331.0, 578.0, 1009.0, 1878.0, 4160.0, 10891.0, 38706.0, 507142.0, 3526531.0, 74888.0, 16606.0, 5733.0, 2395.0, 1239.0, 614.0, 329.0, 232.0, 144.0, 88.0, 50.0, 32.0, 33.0, 15.0, 7.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.53125, -9.27490234375, -9.0185546875, -8.76220703125, -8.505859375, -8.24951171875, -7.9931640625, -7.73681640625, -7.48046875, -7.22412109375, -6.9677734375, -6.71142578125, -6.455078125, -6.19873046875, -5.9423828125, -5.68603515625, -5.4296875, -5.17333984375, -4.9169921875, -4.66064453125, -4.404296875, -4.14794921875, -3.8916015625, -3.63525390625, -3.37890625, -3.12255859375, -2.8662109375, -2.60986328125, -2.353515625, -2.09716796875, -1.8408203125, -1.58447265625, -1.328125, -1.07177734375, -0.8154296875, -0.55908203125, -0.302734375, -0.04638671875, 0.2099609375, 0.46630859375, 0.72265625, 0.97900390625, 1.2353515625, 1.49169921875, 1.748046875, 2.00439453125, 2.2607421875, 2.51708984375, 2.7734375, 3.02978515625, 3.2861328125, 3.54248046875, 3.798828125, 4.05517578125, 4.3115234375, 4.56787109375, 4.82421875, 5.08056640625, 5.3369140625, 5.59326171875, 5.849609375, 6.10595703125, 6.3623046875, 6.61865234375, 6.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 1.0, 12.0, 16.0, 18.0, 21.0, 18.0, 35.0, 49.0, 39.0, 52.0, 61.0, 72.0, 65.0, 81.0, 68.0, 49.0, 49.0, 52.0, 57.0, 36.0, 33.0, 28.0, 23.0, 16.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.28863525390625, -2.2218017578125, -2.15496826171875, -2.088134765625, -2.02130126953125, -1.9544677734375, -1.88763427734375, -1.82080078125, -1.75396728515625, -1.6871337890625, -1.62030029296875, -1.553466796875, -1.48663330078125, -1.4197998046875, -1.35296630859375, -1.2861328125, -1.21929931640625, -1.1524658203125, -1.08563232421875, -1.018798828125, -0.95196533203125, -0.8851318359375, -0.81829833984375, -0.75146484375, -0.68463134765625, -0.6177978515625, -0.55096435546875, -0.484130859375, -0.41729736328125, -0.3504638671875, -0.28363037109375, -0.216796875, -0.14996337890625, -0.0831298828125, -0.01629638671875, 0.050537109375, 0.11737060546875, 0.1842041015625, 0.25103759765625, 0.31787109375, 0.38470458984375, 0.4515380859375, 0.51837158203125, 0.585205078125, 0.65203857421875, 0.7188720703125, 0.78570556640625, 0.8525390625, 0.91937255859375, 0.9862060546875, 1.05303955078125, 1.119873046875, 1.18670654296875, 1.2535400390625, 1.32037353515625, 1.38720703125, 1.45404052734375, 1.5208740234375, 1.58770751953125, 1.654541015625, 1.72137451171875, 1.7882080078125, 1.85504150390625, 1.921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 9.0, 15.0, 27.0, 26.0, 49.0, 70.0, 96.0, 150.0, 305.0, 516.0, 1242.0, 3550.0, 12083.0, 66014.0, 1867701.0, 2157029.0, 68074.0, 11731.0, 3268.0, 1169.0, 513.0, 273.0, 148.0, 61.0, 49.0, 33.0, 24.0, 16.0, 12.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -7.0482177734375, -6.834716796875, -6.6212158203125, -6.40771484375, -6.1942138671875, -5.980712890625, -5.7672119140625, -5.5537109375, -5.3402099609375, -5.126708984375, -4.9132080078125, -4.69970703125, -4.4862060546875, -4.272705078125, -4.0592041015625, -3.845703125, -3.6322021484375, -3.418701171875, -3.2052001953125, -2.99169921875, -2.7781982421875, -2.564697265625, -2.3511962890625, -2.1376953125, -1.9241943359375, -1.710693359375, -1.4971923828125, -1.28369140625, -1.0701904296875, -0.856689453125, -0.6431884765625, -0.4296875, -0.2161865234375, -0.002685546875, 0.2108154296875, 0.42431640625, 0.6378173828125, 0.851318359375, 1.0648193359375, 1.2783203125, 1.4918212890625, 1.705322265625, 1.9188232421875, 2.13232421875, 2.3458251953125, 2.559326171875, 2.7728271484375, 2.986328125, 3.1998291015625, 3.413330078125, 3.6268310546875, 3.84033203125, 4.0538330078125, 4.267333984375, 4.4808349609375, 4.6943359375, 4.9078369140625, 5.121337890625, 5.3348388671875, 5.54833984375, 5.7618408203125, 5.975341796875, 6.1888427734375, 6.40234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 6.0, 9.0, 11.0, 14.0, 26.0, 29.0, 62.0, 125.0, 296.0, 1000.0, 1730.0, 459.0, 156.0, 65.0, 39.0, 13.0, 11.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.986328125, -3.884674072265625, -3.78302001953125, -3.681365966796875, -3.5797119140625, -3.478057861328125, -3.37640380859375, -3.274749755859375, -3.173095703125, -3.071441650390625, -2.96978759765625, -2.868133544921875, -2.7664794921875, -2.664825439453125, -2.56317138671875, -2.461517333984375, -2.35986328125, -2.258209228515625, -2.15655517578125, -2.054901123046875, -1.9532470703125, -1.851593017578125, -1.74993896484375, -1.648284912109375, -1.546630859375, -1.444976806640625, -1.34332275390625, -1.241668701171875, -1.1400146484375, -1.038360595703125, -0.93670654296875, -0.835052490234375, -0.7333984375, -0.631744384765625, -0.53009033203125, -0.428436279296875, -0.3267822265625, -0.225128173828125, -0.12347412109375, -0.021820068359375, 0.079833984375, 0.181488037109375, 0.28314208984375, 0.384796142578125, 0.4864501953125, 0.588104248046875, 0.68975830078125, 0.791412353515625, 0.89306640625, 0.994720458984375, 1.09637451171875, 1.198028564453125, 1.2996826171875, 1.401336669921875, 1.50299072265625, 1.604644775390625, 1.706298828125, 1.807952880859375, 1.90960693359375, 2.011260986328125, 2.1129150390625, 2.214569091796875, 2.31622314453125, 2.417877197265625, 2.51953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 25.0, 28.0, 53.0, 80.0, 102.0, 108.0, 148.0, 134.0, 97.0, 69.0, 59.0, 27.0, 15.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.840119361877441, -15.464123725891113, -15.088129043579102, -14.712133407592773, -14.336138725280762, -13.960143089294434, -13.584148406982422, -13.208152770996094, -12.832158088684082, -12.456162452697754, -12.080167770385742, -11.704172134399414, -11.328177452087402, -10.952181816101074, -10.576187133789062, -10.200191497802734, -9.824195861816406, -9.448200225830078, -9.072205543518066, -8.696209907531738, -8.320215225219727, -7.944220066070557, -7.568224906921387, -7.192229270935059, -6.816234588623047, -6.440239429473877, -6.064244270324707, -5.688249111175537, -5.312253952026367, -4.936258792877197, -4.560263633728027, -4.184267997741699, -3.8082733154296875, -3.4322781562805176, -3.0562829971313477, -2.6802878379821777, -2.304292678833008, -1.9282974004745483, -1.5523021221160889, -1.176306962966919, -0.800311803817749, -0.4243166148662567, -0.048321425914764404, 0.3276737928390503, 0.7036689519882202, 1.0796641111373901, 1.4556593894958496, 1.8316545486450195, 2.2076497077941895, 2.5836448669433594, 2.9596400260925293, 3.335635185241699, 3.711630344390869, 4.087625503540039, 4.463621139526367, 4.839615821838379, 5.215611457824707, 5.591606616973877, 5.967601776123047, 6.343596935272217, 6.719592094421387, 7.095587253570557, 7.471582412719727, 7.847578048706055, 8.223572731018066]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 8.0, 7.0, 15.0, 18.0, 26.0, 30.0, 44.0, 58.0, 55.0, 56.0, 66.0, 64.0, 76.0, 69.0, 71.0, 70.0, 58.0, 48.0, 31.0, 32.0, 27.0, 25.0, 18.0, 5.0, 10.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.930217742919922, -9.551583290100098, -9.172948837280273, -8.794315338134766, -8.415680885314941, -8.037046432495117, -7.658412456512451, -7.279778480529785, -6.901144027709961, -6.522509574890137, -6.143875598907471, -5.765241622924805, -5.3866071701049805, -5.007972717285156, -4.62933874130249, -4.250704765319824, -3.8720703125, -3.493436098098755, -3.1148018836975098, -2.7361676692962646, -2.3575334548950195, -1.9788992404937744, -1.6002650260925293, -1.2216308116912842, -0.8429965972900391, -0.46436238288879395, -0.08572816848754883, 0.2929060459136963, 0.6715402603149414, 1.0501744747161865, 1.4288086891174316, 1.8074429035186768, 2.186077117919922, 2.564711332321167, 2.943345546722412, 3.3219797611236572, 3.7006139755249023, 4.079248428344727, 4.457882404327393, 4.836516380310059, 5.215150833129883, 5.593785285949707, 5.972419261932373, 6.351053237915039, 6.729687690734863, 7.1083221435546875, 7.4869561195373535, 7.8655900955200195, 8.244224548339844, 8.622859001159668, 9.001493453979492, 9.380126953125, 9.758761405944824, 10.137395858764648, 10.516029357910156, 10.89466381072998, 11.273298263549805, 11.651932716369629, 12.030567169189453, 12.409200668334961, 12.787835121154785, 13.16646957397461, 13.545103073120117, 13.923737525939941, 14.302371978759766]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 7.0, 13.0, 8.0, 21.0, 26.0, 39.0, 55.0, 73.0, 127.0, 199.0, 260.0, 417.0, 625.0, 1104.0, 1968.0, 3774.0, 7562.0, 15938.0, 37399.0, 96100.0, 252980.0, 354030.0, 166116.0, 61603.0, 24817.0, 11085.0, 5343.0, 2860.0, 1509.0, 893.0, 534.0, 361.0, 235.0, 136.0, 103.0, 76.0, 47.0, 33.0, 16.0, 22.0, 12.0, 10.0, 9.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.453125, -5.27874755859375, -5.1043701171875, -4.92999267578125, -4.755615234375, -4.58123779296875, -4.4068603515625, -4.23248291015625, -4.05810546875, -3.88372802734375, -3.7093505859375, -3.53497314453125, -3.360595703125, -3.18621826171875, -3.0118408203125, -2.83746337890625, -2.6630859375, -2.48870849609375, -2.3143310546875, -2.13995361328125, -1.965576171875, -1.79119873046875, -1.6168212890625, -1.44244384765625, -1.26806640625, -1.09368896484375, -0.9193115234375, -0.74493408203125, -0.570556640625, -0.39617919921875, -0.2218017578125, -0.04742431640625, 0.126953125, 0.30133056640625, 0.4757080078125, 0.65008544921875, 0.824462890625, 0.99884033203125, 1.1732177734375, 1.34759521484375, 1.52197265625, 1.69635009765625, 1.8707275390625, 2.04510498046875, 2.219482421875, 2.39385986328125, 2.5682373046875, 2.74261474609375, 2.9169921875, 3.09136962890625, 3.2657470703125, 3.44012451171875, 3.614501953125, 3.78887939453125, 3.9632568359375, 4.13763427734375, 4.31201171875, 4.48638916015625, 4.6607666015625, 4.83514404296875, 5.009521484375, 5.18389892578125, 5.3582763671875, 5.53265380859375, 5.70703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 15.0, 11.0, 16.0, 28.0, 23.0, 33.0, 35.0, 51.0, 51.0, 62.0, 65.0, 63.0, 72.0, 56.0, 45.0, 69.0, 54.0, 41.0, 38.0, 32.0, 34.0, 31.0, 10.0, 13.0, 8.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2890625, -2.2258148193359375, -2.162567138671875, -2.0993194580078125, -2.03607177734375, -1.9728240966796875, -1.909576416015625, -1.8463287353515625, -1.7830810546875, -1.7198333740234375, -1.656585693359375, -1.5933380126953125, -1.53009033203125, -1.4668426513671875, -1.403594970703125, -1.3403472900390625, -1.277099609375, -1.2138519287109375, -1.150604248046875, -1.0873565673828125, -1.02410888671875, -0.9608612060546875, -0.897613525390625, -0.8343658447265625, -0.7711181640625, -0.7078704833984375, -0.644622802734375, -0.5813751220703125, -0.51812744140625, -0.4548797607421875, -0.391632080078125, -0.3283843994140625, -0.26513671875, -0.2018890380859375, -0.138641357421875, -0.0753936767578125, -0.01214599609375, 0.0511016845703125, 0.114349365234375, 0.1775970458984375, 0.2408447265625, 0.3040924072265625, 0.367340087890625, 0.4305877685546875, 0.49383544921875, 0.5570831298828125, 0.620330810546875, 0.6835784912109375, 0.746826171875, 0.8100738525390625, 0.873321533203125, 0.9365692138671875, 0.99981689453125, 1.0630645751953125, 1.126312255859375, 1.1895599365234375, 1.2528076171875, 1.3160552978515625, 1.379302978515625, 1.4425506591796875, 1.50579833984375, 1.5690460205078125, 1.632293701171875, 1.6955413818359375, 1.7587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 14.0, 14.0, 21.0, 24.0, 52.0, 69.0, 80.0, 122.0, 174.0, 235.0, 400.0, 606.0, 1035.0, 1870.0, 3605.0, 7631.0, 17562.0, 45713.0, 122110.0, 281510.0, 316204.0, 151916.0, 56993.0, 21868.0, 9302.0, 4154.0, 2124.0, 1113.0, 672.0, 417.0, 285.0, 184.0, 126.0, 105.0, 62.0, 49.0, 46.0, 24.0, 15.0, 8.0, 2.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.22265625, -4.098876953125, -3.97509765625, -3.851318359375, -3.7275390625, -3.603759765625, -3.47998046875, -3.356201171875, -3.232421875, -3.108642578125, -2.98486328125, -2.861083984375, -2.7373046875, -2.613525390625, -2.48974609375, -2.365966796875, -2.2421875, -2.118408203125, -1.99462890625, -1.870849609375, -1.7470703125, -1.623291015625, -1.49951171875, -1.375732421875, -1.251953125, -1.128173828125, -1.00439453125, -0.880615234375, -0.7568359375, -0.633056640625, -0.50927734375, -0.385498046875, -0.26171875, -0.137939453125, -0.01416015625, 0.109619140625, 0.2333984375, 0.357177734375, 0.48095703125, 0.604736328125, 0.728515625, 0.852294921875, 0.97607421875, 1.099853515625, 1.2236328125, 1.347412109375, 1.47119140625, 1.594970703125, 1.71875, 1.842529296875, 1.96630859375, 2.090087890625, 2.2138671875, 2.337646484375, 2.46142578125, 2.585205078125, 2.708984375, 2.832763671875, 2.95654296875, 3.080322265625, 3.2041015625, 3.327880859375, 3.45166015625, 3.575439453125, 3.69921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 10.0, 12.0, 26.0, 31.0, 26.0, 29.0, 27.0, 29.0, 34.0, 31.0, 34.0, 47.0, 48.0, 47.0, 35.0, 40.0, 44.0, 41.0, 51.0, 34.0, 40.0, 35.0, 28.0, 28.0, 34.0, 25.0, 19.0, 9.0, 20.0, 12.0, 9.0, 7.0, 3.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62890625, -5.43878173828125, -5.2486572265625, -5.05853271484375, -4.868408203125, -4.67828369140625, -4.4881591796875, -4.29803466796875, -4.10791015625, -3.91778564453125, -3.7276611328125, -3.53753662109375, -3.347412109375, -3.15728759765625, -2.9671630859375, -2.77703857421875, -2.5869140625, -2.39678955078125, -2.2066650390625, -2.01654052734375, -1.826416015625, -1.63629150390625, -1.4461669921875, -1.25604248046875, -1.06591796875, -0.87579345703125, -0.6856689453125, -0.49554443359375, -0.305419921875, -0.11529541015625, 0.0748291015625, 0.26495361328125, 0.455078125, 0.64520263671875, 0.8353271484375, 1.02545166015625, 1.215576171875, 1.40570068359375, 1.5958251953125, 1.78594970703125, 1.97607421875, 2.16619873046875, 2.3563232421875, 2.54644775390625, 2.736572265625, 2.92669677734375, 3.1168212890625, 3.30694580078125, 3.4970703125, 3.68719482421875, 3.8773193359375, 4.06744384765625, 4.257568359375, 4.44769287109375, 4.6378173828125, 4.82794189453125, 5.01806640625, 5.20819091796875, 5.3983154296875, 5.58843994140625, 5.778564453125, 5.96868896484375, 6.1588134765625, 6.34893798828125, 6.5390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 7.0, 18.0, 34.0, 43.0, 73.0, 156.0, 301.0, 691.0, 1509.0, 3927.0, 11632.0, 38310.0, 168405.0, 527110.0, 224924.0, 49225.0, 13972.0, 4859.0, 1833.0, 774.0, 363.0, 181.0, 94.0, 47.0, 23.0, 15.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.3203125, -3.2385101318359375, -3.156707763671875, -3.0749053955078125, -2.99310302734375, -2.9113006591796875, -2.829498291015625, -2.7476959228515625, -2.6658935546875, -2.5840911865234375, -2.502288818359375, -2.4204864501953125, -2.33868408203125, -2.2568817138671875, -2.175079345703125, -2.0932769775390625, -2.011474609375, -1.9296722412109375, -1.847869873046875, -1.7660675048828125, -1.68426513671875, -1.6024627685546875, -1.520660400390625, -1.4388580322265625, -1.3570556640625, -1.2752532958984375, -1.193450927734375, -1.1116485595703125, -1.02984619140625, -0.9480438232421875, -0.866241455078125, -0.7844390869140625, -0.70263671875, -0.6208343505859375, -0.539031982421875, -0.4572296142578125, -0.37542724609375, -0.2936248779296875, -0.211822509765625, -0.1300201416015625, -0.0482177734375, 0.0335845947265625, 0.115386962890625, 0.1971893310546875, 0.27899169921875, 0.3607940673828125, 0.442596435546875, 0.5243988037109375, 0.606201171875, 0.6880035400390625, 0.769805908203125, 0.8516082763671875, 0.93341064453125, 1.0152130126953125, 1.097015380859375, 1.1788177490234375, 1.2606201171875, 1.3424224853515625, 1.424224853515625, 1.5060272216796875, 1.58782958984375, 1.6696319580078125, 1.751434326171875, 1.8332366943359375, 1.9150390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 11.0, 11.0, 11.0, 14.0, 16.0, 15.0, 27.0, 28.0, 37.0, 58.0, 60.0, 80.0, 76.0, 108.0, 100.0, 75.0, 51.0, 33.0, 24.0, 31.0, 26.0, 23.0, 19.0, 21.0, 11.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036144256591796875, -0.00034914538264274597, -0.0003368481993675232, -0.0003245510160923004, -0.00031225383281707764, -0.00029995664954185486, -0.0002876594662666321, -0.0002753622829914093, -0.0002630650997161865, -0.00025076791644096375, -0.00023847073316574097, -0.0002261735498905182, -0.0002138763666152954, -0.00020157918334007263, -0.00018928200006484985, -0.00017698481678962708, -0.0001646876335144043, -0.00015239045023918152, -0.00014009326696395874, -0.00012779608368873596, -0.00011549890041351318, -0.0001032017171382904, -9.090453386306763e-05, -7.860735058784485e-05, -6.631016731262207e-05, -5.401298403739929e-05, -4.1715800762176514e-05, -2.9418617486953735e-05, -1.7121434211730957e-05, -4.824250936508179e-06, 7.4729323387146e-06, 1.9770115613937378e-05, 3.2067298889160156e-05, 4.4364482164382935e-05, 5.666166543960571e-05, 6.895884871482849e-05, 8.125603199005127e-05, 9.355321526527405e-05, 0.00010585039854049683, 0.0001181475818157196, 0.00013044476509094238, 0.00014274194836616516, 0.00015503913164138794, 0.00016733631491661072, 0.0001796334981918335, 0.00019193068146705627, 0.00020422786474227905, 0.00021652504801750183, 0.0002288222312927246, 0.0002411194145679474, 0.00025341659784317017, 0.00026571378111839294, 0.0002780109643936157, 0.0002903081476688385, 0.0003026053309440613, 0.00031490251421928406, 0.00032719969749450684, 0.0003394968807697296, 0.0003517940640449524, 0.00036409124732017517, 0.00037638843059539795, 0.00038868561387062073, 0.0004009827971458435, 0.0004132799804210663, 0.00042557716369628906]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 4.0, 8.0, 9.0, 16.0, 31.0, 35.0, 83.0, 105.0, 164.0, 282.0, 493.0, 941.0, 1901.0, 4013.0, 9735.0, 25404.0, 86266.0, 411044.0, 386180.0, 80480.0, 24288.0, 9276.0, 3874.0, 1783.0, 906.0, 471.0, 291.0, 176.0, 84.0, 67.0, 37.0, 25.0, 27.0, 18.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.673828125, -2.592742919921875, -2.51165771484375, -2.430572509765625, -2.3494873046875, -2.268402099609375, -2.18731689453125, -2.106231689453125, -2.025146484375, -1.944061279296875, -1.86297607421875, -1.781890869140625, -1.7008056640625, -1.619720458984375, -1.53863525390625, -1.457550048828125, -1.37646484375, -1.295379638671875, -1.21429443359375, -1.133209228515625, -1.0521240234375, -0.971038818359375, -0.88995361328125, -0.808868408203125, -0.727783203125, -0.646697998046875, -0.56561279296875, -0.484527587890625, -0.4034423828125, -0.322357177734375, -0.24127197265625, -0.160186767578125, -0.0791015625, 0.001983642578125, 0.08306884765625, 0.164154052734375, 0.2452392578125, 0.326324462890625, 0.40740966796875, 0.488494873046875, 0.569580078125, 0.650665283203125, 0.73175048828125, 0.812835693359375, 0.8939208984375, 0.975006103515625, 1.05609130859375, 1.137176513671875, 1.21826171875, 1.299346923828125, 1.38043212890625, 1.461517333984375, 1.5426025390625, 1.623687744140625, 1.70477294921875, 1.785858154296875, 1.866943359375, 1.948028564453125, 2.02911376953125, 2.110198974609375, 2.1912841796875, 2.272369384765625, 2.35345458984375, 2.434539794921875, 2.515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 8.0, 11.0, 16.0, 18.0, 25.0, 41.0, 53.0, 59.0, 81.0, 119.0, 98.0, 109.0, 82.0, 59.0, 55.0, 36.0, 20.0, 16.0, 19.0, 7.0, 13.0, 11.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.650390625, -2.5714111328125, -2.492431640625, -2.4134521484375, -2.33447265625, -2.2554931640625, -2.176513671875, -2.0975341796875, -2.0185546875, -1.9395751953125, -1.860595703125, -1.7816162109375, -1.70263671875, -1.6236572265625, -1.544677734375, -1.4656982421875, -1.38671875, -1.3077392578125, -1.228759765625, -1.1497802734375, -1.07080078125, -0.9918212890625, -0.912841796875, -0.8338623046875, -0.7548828125, -0.6759033203125, -0.596923828125, -0.5179443359375, -0.43896484375, -0.3599853515625, -0.281005859375, -0.2020263671875, -0.123046875, -0.0440673828125, 0.034912109375, 0.1138916015625, 0.19287109375, 0.2718505859375, 0.350830078125, 0.4298095703125, 0.5087890625, 0.5877685546875, 0.666748046875, 0.7457275390625, 0.82470703125, 0.9036865234375, 0.982666015625, 1.0616455078125, 1.140625, 1.2196044921875, 1.298583984375, 1.3775634765625, 1.45654296875, 1.5355224609375, 1.614501953125, 1.6934814453125, 1.7724609375, 1.8514404296875, 1.930419921875, 2.0093994140625, 2.08837890625, 2.1673583984375, 2.246337890625, 2.3253173828125, 2.404296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 21.0, 32.0, 69.0, 93.0, 140.0, 162.0, 157.0, 122.0, 72.0, 48.0, 28.0, 17.0, 11.0, 10.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.831026077270508, -24.46232795715332, -23.0936279296875, -21.724929809570312, -20.356229782104492, -18.987531661987305, -17.618831634521484, -16.250133514404297, -14.881434440612793, -13.512735366821289, -12.144036293029785, -10.775337219238281, -9.406639099121094, -8.037939071655273, -6.669240951538086, -5.300541877746582, -3.931842803955078, -2.563143730163574, -1.1944448947906494, 0.1742539405822754, 1.5429530143737793, 2.911652088165283, 4.280350685119629, 5.649049758911133, 7.017748832702637, 8.38644790649414, 9.755146980285645, 11.123846054077148, 12.492544174194336, 13.861244201660156, 15.229942321777344, 16.59864044189453, 17.96733856201172, 19.336036682128906, 20.704736709594727, 22.073434829711914, 23.442134857177734, 24.810832977294922, 26.17953109741211, 27.54823112487793, 28.91693115234375, 30.285629272460938, 31.654329299926758, 33.02302932739258, 34.391727447509766, 35.76042556762695, 37.12912368774414, 38.497825622558594, 39.86652374267578, 41.23522186279297, 42.603919982910156, 43.97262191772461, 45.3413200378418, 46.710018157958984, 48.07871627807617, 49.447418212890625, 50.81611251831055, 52.184810638427734, 53.55350875854492, 54.922210693359375, 56.29090881347656, 57.65960693359375, 59.02830505371094, 60.397003173828125, 61.76570510864258]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 14.0, 9.0, 8.0, 17.0, 20.0, 19.0, 14.0, 33.0, 26.0, 27.0, 33.0, 32.0, 35.0, 46.0, 44.0, 40.0, 43.0, 53.0, 48.0, 45.0, 47.0, 43.0, 43.0, 25.0, 31.0, 21.0, 24.0, 25.0, 24.0, 13.0, 20.0, 18.0, 16.0, 8.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.673675537109375, -31.614837646484375, -30.555999755859375, -29.497161865234375, -28.438323974609375, -27.379486083984375, -26.320650100708008, -25.261812210083008, -24.202974319458008, -23.144136428833008, -22.085298538208008, -21.026460647583008, -19.96762466430664, -18.90878677368164, -17.84994888305664, -16.79111099243164, -15.73227310180664, -14.67343521118164, -13.61459732055664, -12.555760383605957, -11.496922492980957, -10.438084602355957, -9.379247665405273, -8.320409774780273, -7.261571884155273, -6.202733993530273, -5.143896579742432, -4.08505916595459, -3.02622127532959, -1.9673833847045898, -0.908545970916748, 0.15029144287109375, 1.2091331481933594, 2.2679708003997803, 3.326808452606201, 4.385645866394043, 5.444483757019043, 6.503321647644043, 7.562159061431885, 8.620996475219727, 9.679834365844727, 10.738672256469727, 11.797510147094727, 12.85634708404541, 13.91518497467041, 14.97402286529541, 16.032859802246094, 17.091697692871094, 18.150535583496094, 19.209373474121094, 20.268211364746094, 21.327049255371094, 22.385887145996094, 23.444725036621094, 24.50356101989746, 25.56239891052246, 26.62123680114746, 27.68007469177246, 28.73891258239746, 29.79775047302246, 30.856586456298828, 31.915424346923828, 32.97426223754883, 34.03310012817383, 35.09193801879883]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 1.0, 3.0, 16.0, 8.0, 7.0, 22.0, 28.0, 41.0, 65.0, 104.0, 175.0, 250.0, 418.0, 721.0, 1378.0, 2966.0, 7252.0, 22370.0, 117006.0, 3573442.0, 408697.0, 40813.0, 10976.0, 3966.0, 1653.0, 806.0, 435.0, 263.0, 164.0, 79.0, 44.0, 31.0, 24.0, 23.0, 11.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.296875, -8.04327392578125, -7.7896728515625, -7.53607177734375, -7.282470703125, -7.02886962890625, -6.7752685546875, -6.52166748046875, -6.26806640625, -6.01446533203125, -5.7608642578125, -5.50726318359375, -5.253662109375, -5.00006103515625, -4.7464599609375, -4.49285888671875, -4.2392578125, -3.98565673828125, -3.7320556640625, -3.47845458984375, -3.224853515625, -2.97125244140625, -2.7176513671875, -2.46405029296875, -2.21044921875, -1.95684814453125, -1.7032470703125, -1.44964599609375, -1.196044921875, -0.94244384765625, -0.6888427734375, -0.43524169921875, -0.181640625, 0.07196044921875, 0.3255615234375, 0.57916259765625, 0.832763671875, 1.08636474609375, 1.3399658203125, 1.59356689453125, 1.84716796875, 2.10076904296875, 2.3543701171875, 2.60797119140625, 2.861572265625, 3.11517333984375, 3.3687744140625, 3.62237548828125, 3.8759765625, 4.12957763671875, 4.3831787109375, 4.63677978515625, 4.890380859375, 5.14398193359375, 5.3975830078125, 5.65118408203125, 5.90478515625, 6.15838623046875, 6.4119873046875, 6.66558837890625, 6.919189453125, 7.17279052734375, 7.4263916015625, 7.67999267578125, 7.93359375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 6.0, 17.0, 18.0, 17.0, 31.0, 28.0, 41.0, 41.0, 52.0, 60.0, 59.0, 59.0, 63.0, 77.0, 53.0, 49.0, 58.0, 49.0, 45.0, 31.0, 38.0, 20.0, 20.0, 14.0, 12.0, 3.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.20745849609375, -2.1395263671875, -2.07159423828125, -2.003662109375, -1.93572998046875, -1.8677978515625, -1.79986572265625, -1.73193359375, -1.66400146484375, -1.5960693359375, -1.52813720703125, -1.460205078125, -1.39227294921875, -1.3243408203125, -1.25640869140625, -1.1884765625, -1.12054443359375, -1.0526123046875, -0.98468017578125, -0.916748046875, -0.84881591796875, -0.7808837890625, -0.71295166015625, -0.64501953125, -0.57708740234375, -0.5091552734375, -0.44122314453125, -0.373291015625, -0.30535888671875, -0.2374267578125, -0.16949462890625, -0.1015625, -0.03363037109375, 0.0343017578125, 0.10223388671875, 0.170166015625, 0.23809814453125, 0.3060302734375, 0.37396240234375, 0.44189453125, 0.50982666015625, 0.5777587890625, 0.64569091796875, 0.713623046875, 0.78155517578125, 0.8494873046875, 0.91741943359375, 0.9853515625, 1.05328369140625, 1.1212158203125, 1.18914794921875, 1.257080078125, 1.32501220703125, 1.3929443359375, 1.46087646484375, 1.52880859375, 1.59674072265625, 1.6646728515625, 1.73260498046875, 1.800537109375, 1.86846923828125, 1.9364013671875, 2.00433349609375, 2.072265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 13.0, 11.0, 14.0, 16.0, 33.0, 60.0, 102.0, 116.0, 224.0, 392.0, 804.0, 1883.0, 5342.0, 21015.0, 145889.0, 3416514.0, 545648.0, 42261.0, 9000.0, 2742.0, 1048.0, 503.0, 226.0, 147.0, 118.0, 64.0, 33.0, 17.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.69140625, -6.48040771484375, -6.2694091796875, -6.05841064453125, -5.847412109375, -5.63641357421875, -5.4254150390625, -5.21441650390625, -5.00341796875, -4.79241943359375, -4.5814208984375, -4.37042236328125, -4.159423828125, -3.94842529296875, -3.7374267578125, -3.52642822265625, -3.3154296875, -3.10443115234375, -2.8934326171875, -2.68243408203125, -2.471435546875, -2.26043701171875, -2.0494384765625, -1.83843994140625, -1.62744140625, -1.41644287109375, -1.2054443359375, -0.99444580078125, -0.783447265625, -0.57244873046875, -0.3614501953125, -0.15045166015625, 0.060546875, 0.27154541015625, 0.4825439453125, 0.69354248046875, 0.904541015625, 1.11553955078125, 1.3265380859375, 1.53753662109375, 1.74853515625, 1.95953369140625, 2.1705322265625, 2.38153076171875, 2.592529296875, 2.80352783203125, 3.0145263671875, 3.22552490234375, 3.4365234375, 3.64752197265625, 3.8585205078125, 4.06951904296875, 4.280517578125, 4.49151611328125, 4.7025146484375, 4.91351318359375, 5.12451171875, 5.33551025390625, 5.5465087890625, 5.75750732421875, 5.968505859375, 6.17950439453125, 6.3905029296875, 6.60150146484375, 6.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 11.0, 8.0, 22.0, 20.0, 23.0, 63.0, 127.0, 348.0, 1320.0, 1474.0, 353.0, 151.0, 66.0, 28.0, 22.0, 16.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.656097412109375, -4.52313232421875, -4.390167236328125, -4.2572021484375, -4.124237060546875, -3.99127197265625, -3.858306884765625, -3.725341796875, -3.592376708984375, -3.45941162109375, -3.326446533203125, -3.1934814453125, -3.060516357421875, -2.92755126953125, -2.794586181640625, -2.66162109375, -2.528656005859375, -2.39569091796875, -2.262725830078125, -2.1297607421875, -1.996795654296875, -1.86383056640625, -1.730865478515625, -1.597900390625, -1.464935302734375, -1.33197021484375, -1.199005126953125, -1.0660400390625, -0.933074951171875, -0.80010986328125, -0.667144775390625, -0.5341796875, -0.401214599609375, -0.26824951171875, -0.135284423828125, -0.0023193359375, 0.130645751953125, 0.26361083984375, 0.396575927734375, 0.529541015625, 0.662506103515625, 0.79547119140625, 0.928436279296875, 1.0614013671875, 1.194366455078125, 1.32733154296875, 1.460296630859375, 1.59326171875, 1.726226806640625, 1.85919189453125, 1.992156982421875, 2.1251220703125, 2.258087158203125, 2.39105224609375, 2.524017333984375, 2.656982421875, 2.789947509765625, 2.92291259765625, 3.055877685546875, 3.1888427734375, 3.321807861328125, 3.45477294921875, 3.587738037109375, 3.720703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 21.0, 58.0, 132.0, 282.0, 278.0, 145.0, 54.0, 18.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.2313232421875, -41.24857711791992, -40.265830993652344, -39.283084869384766, -38.30033493041992, -37.317588806152344, -36.334842681884766, -35.35209655761719, -34.36935043334961, -33.38660430908203, -32.40385818481445, -31.421110153198242, -30.438364028930664, -29.455615997314453, -28.472869873046875, -27.490123748779297, -26.50737762451172, -25.52463150024414, -24.54188346862793, -23.55913734436035, -22.576391220092773, -21.593643188476562, -20.610897064208984, -19.628150939941406, -18.645402908325195, -17.662656784057617, -16.679908752441406, -15.697162628173828, -14.71441650390625, -13.731669425964355, -12.748922348022461, -11.766176223754883, -10.783430099487305, -9.80068302154541, -8.817936897277832, -7.8351898193359375, -6.852443695068359, -5.869696617126465, -4.8869500160217285, -3.904203414916992, -2.921456813812256, -1.9387102127075195, -0.9559634923934937, 0.026783227920532227, 1.0095298290252686, 1.992276668548584, 2.9750232696533203, 3.9577698707580566, 4.940516471862793, 5.923263072967529, 6.906009674072266, 7.88875675201416, 8.871502876281738, 9.854249954223633, 10.836996078491211, 11.819743156433105, 12.802490234375, 13.785237312316895, 14.767983436584473, 15.750730514526367, 16.733476638793945, 17.716224670410156, 18.698970794677734, 19.681716918945312, 20.66446304321289]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 11.0, 12.0, 12.0, 21.0, 26.0, 32.0, 36.0, 48.0, 46.0, 61.0, 56.0, 51.0, 72.0, 65.0, 67.0, 58.0, 52.0, 44.0, 42.0, 38.0, 45.0, 24.0, 28.0, 16.0, 12.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.574504852294922, -13.1665678024292, -12.758630752563477, -12.350693702697754, -11.942756652832031, -11.534820556640625, -11.126882553100586, -10.71894645690918, -10.311009407043457, -9.903072357177734, -9.495135307312012, -9.087198257446289, -8.679261207580566, -8.271324157714844, -7.863387584686279, -7.455451011657715, -7.047513484954834, -6.639576435089111, -6.231639385223389, -5.823702812194824, -5.415765762329102, -5.007828712463379, -4.599891662597656, -4.191954612731934, -3.78401780128479, -3.3760807514190674, -2.968143939971924, -2.560206890106201, -2.1522698402404785, -1.744333028793335, -1.3363959789276123, -0.9284591674804688, -0.5205221176147461, -0.1125851571559906, 0.2953518033027649, 0.7032887935638428, 1.1112257242202759, 1.519162654876709, 1.9270997047424316, 2.335036516189575, 2.742973566055298, 3.1509106159210205, 3.558847427368164, 3.9667844772338867, 4.374721527099609, 4.782658576965332, 5.190595626831055, 5.598532199859619, 6.006469249725342, 6.4144062995910645, 6.822343349456787, 7.230279922485352, 7.638216972351074, 8.046154022216797, 8.45409107208252, 8.862028121948242, 9.269965171813965, 9.677902221679688, 10.08583927154541, 10.493776321411133, 10.901713371276855, 11.309650421142578, 11.717586517333984, 12.125523567199707, 12.53346061706543]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 12.0, 18.0, 17.0, 22.0, 30.0, 41.0, 77.0, 121.0, 206.0, 315.0, 520.0, 916.0, 1765.0, 3649.0, 8391.0, 22328.0, 66893.0, 232637.0, 463233.0, 166488.0, 50314.0, 17284.0, 6730.0, 3065.0, 1456.0, 810.0, 465.0, 260.0, 158.0, 102.0, 62.0, 48.0, 40.0, 23.0, 18.0, 9.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.47265625, -7.272705078125, -7.07275390625, -6.872802734375, -6.6728515625, -6.472900390625, -6.27294921875, -6.072998046875, -5.873046875, -5.673095703125, -5.47314453125, -5.273193359375, -5.0732421875, -4.873291015625, -4.67333984375, -4.473388671875, -4.2734375, -4.073486328125, -3.87353515625, -3.673583984375, -3.4736328125, -3.273681640625, -3.07373046875, -2.873779296875, -2.673828125, -2.473876953125, -2.27392578125, -2.073974609375, -1.8740234375, -1.674072265625, -1.47412109375, -1.274169921875, -1.07421875, -0.874267578125, -0.67431640625, -0.474365234375, -0.2744140625, -0.074462890625, 0.12548828125, 0.325439453125, 0.525390625, 0.725341796875, 0.92529296875, 1.125244140625, 1.3251953125, 1.525146484375, 1.72509765625, 1.925048828125, 2.125, 2.324951171875, 2.52490234375, 2.724853515625, 2.9248046875, 3.124755859375, 3.32470703125, 3.524658203125, 3.724609375, 3.924560546875, 4.12451171875, 4.324462890625, 4.5244140625, 4.724365234375, 4.92431640625, 5.124267578125, 5.32421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 10.0, 15.0, 17.0, 23.0, 33.0, 26.0, 43.0, 45.0, 66.0, 48.0, 51.0, 68.0, 64.0, 66.0, 61.0, 40.0, 55.0, 41.0, 42.0, 43.0, 33.0, 25.0, 10.0, 18.0, 5.0, 4.0, 8.0, 8.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.305511474609375, -2.23992919921875, -2.174346923828125, -2.1087646484375, -2.043182373046875, -1.97760009765625, -1.912017822265625, -1.846435546875, -1.780853271484375, -1.71527099609375, -1.649688720703125, -1.5841064453125, -1.518524169921875, -1.45294189453125, -1.387359619140625, -1.32177734375, -1.256195068359375, -1.19061279296875, -1.125030517578125, -1.0594482421875, -0.993865966796875, -0.92828369140625, -0.862701416015625, -0.797119140625, -0.731536865234375, -0.66595458984375, -0.600372314453125, -0.5347900390625, -0.469207763671875, -0.40362548828125, -0.338043212890625, -0.2724609375, -0.206878662109375, -0.14129638671875, -0.075714111328125, -0.0101318359375, 0.055450439453125, 0.12103271484375, 0.186614990234375, 0.252197265625, 0.317779541015625, 0.38336181640625, 0.448944091796875, 0.5145263671875, 0.580108642578125, 0.64569091796875, 0.711273193359375, 0.77685546875, 0.842437744140625, 0.90802001953125, 0.973602294921875, 1.0391845703125, 1.104766845703125, 1.17034912109375, 1.235931396484375, 1.301513671875, 1.367095947265625, 1.43267822265625, 1.498260498046875, 1.5638427734375, 1.629425048828125, 1.69500732421875, 1.760589599609375, 1.826171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 18.0, 15.0, 24.0, 26.0, 40.0, 66.0, 89.0, 144.0, 213.0, 353.0, 563.0, 946.0, 1825.0, 4139.0, 9964.0, 28068.0, 87995.0, 301775.0, 412486.0, 134369.0, 40561.0, 14036.0, 5520.0, 2314.0, 1191.0, 665.0, 368.0, 248.0, 165.0, 123.0, 87.0, 44.0, 29.0, 24.0, 19.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.430908203125, -5.27197265625, -5.113037109375, -4.9541015625, -4.795166015625, -4.63623046875, -4.477294921875, -4.318359375, -4.159423828125, -4.00048828125, -3.841552734375, -3.6826171875, -3.523681640625, -3.36474609375, -3.205810546875, -3.046875, -2.887939453125, -2.72900390625, -2.570068359375, -2.4111328125, -2.252197265625, -2.09326171875, -1.934326171875, -1.775390625, -1.616455078125, -1.45751953125, -1.298583984375, -1.1396484375, -0.980712890625, -0.82177734375, -0.662841796875, -0.50390625, -0.344970703125, -0.18603515625, -0.027099609375, 0.1318359375, 0.290771484375, 0.44970703125, 0.608642578125, 0.767578125, 0.926513671875, 1.08544921875, 1.244384765625, 1.4033203125, 1.562255859375, 1.72119140625, 1.880126953125, 2.0390625, 2.197998046875, 2.35693359375, 2.515869140625, 2.6748046875, 2.833740234375, 2.99267578125, 3.151611328125, 3.310546875, 3.469482421875, 3.62841796875, 3.787353515625, 3.9462890625, 4.105224609375, 4.26416015625, 4.423095703125, 4.58203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 9.0, 12.0, 15.0, 15.0, 13.0, 29.0, 24.0, 24.0, 33.0, 39.0, 43.0, 28.0, 53.0, 57.0, 59.0, 51.0, 68.0, 54.0, 59.0, 43.0, 35.0, 29.0, 30.0, 31.0, 28.0, 21.0, 19.0, 15.0, 13.0, 8.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.125, -8.89300537109375, -8.6610107421875, -8.42901611328125, -8.197021484375, -7.96502685546875, -7.7330322265625, -7.50103759765625, -7.26904296875, -7.03704833984375, -6.8050537109375, -6.57305908203125, -6.341064453125, -6.10906982421875, -5.8770751953125, -5.64508056640625, -5.4130859375, -5.18109130859375, -4.9490966796875, -4.71710205078125, -4.485107421875, -4.25311279296875, -4.0211181640625, -3.78912353515625, -3.55712890625, -3.32513427734375, -3.0931396484375, -2.86114501953125, -2.629150390625, -2.39715576171875, -2.1651611328125, -1.93316650390625, -1.701171875, -1.46917724609375, -1.2371826171875, -1.00518798828125, -0.773193359375, -0.54119873046875, -0.3092041015625, -0.07720947265625, 0.15478515625, 0.38677978515625, 0.6187744140625, 0.85076904296875, 1.082763671875, 1.31475830078125, 1.5467529296875, 1.77874755859375, 2.0107421875, 2.24273681640625, 2.4747314453125, 2.70672607421875, 2.938720703125, 3.17071533203125, 3.4027099609375, 3.63470458984375, 3.86669921875, 4.09869384765625, 4.3306884765625, 4.56268310546875, 4.794677734375, 5.02667236328125, 5.2586669921875, 5.49066162109375, 5.72265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 6.0, 16.0, 34.0, 77.0, 191.0, 741.0, 4570.0, 60069.0, 867809.0, 106629.0, 7075.0, 943.0, 241.0, 79.0, 46.0, 11.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.28057861328125, -6.1041259765625, -5.92767333984375, -5.751220703125, -5.57476806640625, -5.3983154296875, -5.22186279296875, -5.04541015625, -4.86895751953125, -4.6925048828125, -4.51605224609375, -4.339599609375, -4.16314697265625, -3.9866943359375, -3.81024169921875, -3.6337890625, -3.45733642578125, -3.2808837890625, -3.10443115234375, -2.927978515625, -2.75152587890625, -2.5750732421875, -2.39862060546875, -2.22216796875, -2.04571533203125, -1.8692626953125, -1.69281005859375, -1.516357421875, -1.33990478515625, -1.1634521484375, -0.98699951171875, -0.810546875, -0.63409423828125, -0.4576416015625, -0.28118896484375, -0.104736328125, 0.07171630859375, 0.2481689453125, 0.42462158203125, 0.60107421875, 0.77752685546875, 0.9539794921875, 1.13043212890625, 1.306884765625, 1.48333740234375, 1.6597900390625, 1.83624267578125, 2.0126953125, 2.18914794921875, 2.3656005859375, 2.54205322265625, 2.718505859375, 2.89495849609375, 3.0714111328125, 3.24786376953125, 3.42431640625, 3.60076904296875, 3.7772216796875, 3.95367431640625, 4.130126953125, 4.30657958984375, 4.4830322265625, 4.65948486328125, 4.8359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 12.0, 9.0, 17.0, 24.0, 24.0, 53.0, 118.0, 267.0, 238.0, 111.0, 43.0, 31.0, 18.0, 14.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012483596801757812, -0.0012205541133880615, -0.0011927485466003418, -0.001164942979812622, -0.0011371374130249023, -0.0011093318462371826, -0.0010815262794494629, -0.0010537207126617432, -0.0010259151458740234, -0.0009981095790863037, -0.000970304012298584, -0.0009424984455108643, -0.0009146928787231445, -0.0008868873119354248, -0.0008590817451477051, -0.0008312761783599854, -0.0008034706115722656, -0.0007756650447845459, -0.0007478594779968262, -0.0007200539112091064, -0.0006922483444213867, -0.000664442777633667, -0.0006366372108459473, -0.0006088316440582275, -0.0005810260772705078, -0.0005532205104827881, -0.0005254149436950684, -0.0004976093769073486, -0.0004698038101196289, -0.0004419982433319092, -0.00041419267654418945, -0.0003863871097564697, -0.00035858154296875, -0.0003307759761810303, -0.00030297040939331055, -0.0002751648426055908, -0.0002473592758178711, -0.00021955370903015137, -0.00019174814224243164, -0.00016394257545471191, -0.0001361370086669922, -0.00010833144187927246, -8.052587509155273e-05, -5.272030830383301e-05, -2.491474151611328e-05, 2.8908252716064453e-06, 3.069639205932617e-05, 5.85019588470459e-05, 8.630752563476562e-05, 0.00011411309242248535, 0.00014191865921020508, 0.0001697242259979248, 0.00019752979278564453, 0.00022533535957336426, 0.000253140926361084, 0.0002809464931488037, 0.00030875205993652344, 0.00033655762672424316, 0.0003643631935119629, 0.0003921687602996826, 0.00041997432708740234, 0.00044777989387512207, 0.0004755854606628418, 0.0005033910274505615, 0.0005311965942382812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 16.0, 31.0, 40.0, 54.0, 105.0, 196.0, 382.0, 790.0, 2050.0, 6139.0, 23173.0, 116370.0, 728699.0, 134486.0, 25458.0, 6587.0, 2160.0, 892.0, 420.0, 202.0, 107.0, 70.0, 38.0, 20.0, 12.0, 10.0, 5.0, 5.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.139373779296875, -3.03656005859375, -2.933746337890625, -2.8309326171875, -2.728118896484375, -2.62530517578125, -2.522491455078125, -2.419677734375, -2.316864013671875, -2.21405029296875, -2.111236572265625, -2.0084228515625, -1.905609130859375, -1.80279541015625, -1.699981689453125, -1.59716796875, -1.494354248046875, -1.39154052734375, -1.288726806640625, -1.1859130859375, -1.083099365234375, -0.98028564453125, -0.877471923828125, -0.774658203125, -0.671844482421875, -0.56903076171875, -0.466217041015625, -0.3634033203125, -0.260589599609375, -0.15777587890625, -0.054962158203125, 0.0478515625, 0.150665283203125, 0.25347900390625, 0.356292724609375, 0.4591064453125, 0.561920166015625, 0.66473388671875, 0.767547607421875, 0.870361328125, 0.973175048828125, 1.07598876953125, 1.178802490234375, 1.2816162109375, 1.384429931640625, 1.48724365234375, 1.590057373046875, 1.69287109375, 1.795684814453125, 1.89849853515625, 2.001312255859375, 2.1041259765625, 2.206939697265625, 2.30975341796875, 2.412567138671875, 2.515380859375, 2.618194580078125, 2.72100830078125, 2.823822021484375, 2.9266357421875, 3.029449462890625, 3.13226318359375, 3.235076904296875, 3.337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 13.0, 17.0, 23.0, 35.0, 50.0, 80.0, 131.0, 156.0, 143.0, 120.0, 71.0, 43.0, 32.0, 22.0, 13.0, 13.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.365386962890625, -3.24835205078125, -3.131317138671875, -3.0142822265625, -2.897247314453125, -2.78021240234375, -2.663177490234375, -2.546142578125, -2.429107666015625, -2.31207275390625, -2.195037841796875, -2.0780029296875, -1.960968017578125, -1.84393310546875, -1.726898193359375, -1.60986328125, -1.492828369140625, -1.37579345703125, -1.258758544921875, -1.1417236328125, -1.024688720703125, -0.90765380859375, -0.790618896484375, -0.673583984375, -0.556549072265625, -0.43951416015625, -0.322479248046875, -0.2054443359375, -0.088409423828125, 0.02862548828125, 0.145660400390625, 0.2626953125, 0.379730224609375, 0.49676513671875, 0.613800048828125, 0.7308349609375, 0.847869873046875, 0.96490478515625, 1.081939697265625, 1.198974609375, 1.316009521484375, 1.43304443359375, 1.550079345703125, 1.6671142578125, 1.784149169921875, 1.90118408203125, 2.018218994140625, 2.13525390625, 2.252288818359375, 2.36932373046875, 2.486358642578125, 2.6033935546875, 2.720428466796875, 2.83746337890625, 2.954498291015625, 3.071533203125, 3.188568115234375, 3.30560302734375, 3.422637939453125, 3.5396728515625, 3.656707763671875, 3.77374267578125, 3.890777587890625, 4.0078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 16.0, 21.0, 33.0, 35.0, 67.0, 93.0, 111.0, 93.0, 122.0, 106.0, 68.0, 80.0, 49.0, 23.0, 22.0, 12.0, 9.0, 2.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.47974395751953, -35.41631317138672, -34.35288619995117, -33.289459228515625, -32.22602844238281, -31.162599563598633, -30.099170684814453, -29.035741806030273, -27.972312927246094, -26.908884048461914, -25.845455169677734, -24.782026290893555, -23.718597412109375, -22.655168533325195, -21.591739654541016, -20.528310775756836, -19.464881896972656, -18.401453018188477, -17.338024139404297, -16.274595260620117, -15.211166381835938, -14.147737503051758, -13.084308624267578, -12.020879745483398, -10.957450866699219, -9.894021987915039, -8.83059310913086, -7.76716423034668, -6.7037353515625, -5.64030647277832, -4.576877593994141, -3.513448715209961, -2.4500160217285156, -1.386587142944336, -0.32315826416015625, 0.7402706146240234, 1.8036994934082031, 2.867128372192383, 3.9305572509765625, 4.993986129760742, 6.057415008544922, 7.120843887329102, 8.184272766113281, 9.247701644897461, 10.31113052368164, 11.37455940246582, 12.43798828125, 13.50141716003418, 14.56484603881836, 15.628274917602539, 16.69170379638672, 17.7551326751709, 18.818561553955078, 19.881990432739258, 20.945419311523438, 22.008848190307617, 23.072277069091797, 24.135705947875977, 25.199134826660156, 26.262563705444336, 27.325992584228516, 28.389421463012695, 29.452850341796875, 30.516279220581055, 31.579708099365234]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 10.0, 15.0, 17.0, 17.0, 23.0, 22.0, 18.0, 30.0, 22.0, 38.0, 25.0, 39.0, 22.0, 41.0, 48.0, 27.0, 40.0, 43.0, 32.0, 32.0, 40.0, 45.0, 28.0, 34.0, 29.0, 32.0, 21.0, 21.0, 29.0, 12.0, 24.0, 16.0, 16.0, 12.0, 9.0, 8.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.645950317382812, -26.70466423034668, -25.763378143310547, -24.822093963623047, -23.880807876586914, -22.93952178955078, -21.99823570251465, -21.056949615478516, -20.115665435791016, -19.174379348754883, -18.23309326171875, -17.29180908203125, -16.350522994995117, -15.409236907958984, -14.467950820922852, -13.526664733886719, -12.585378646850586, -11.644092559814453, -10.702807426452637, -9.761521339416504, -8.820236206054688, -7.878950119018555, -6.937664031982422, -5.996378421783447, -5.055092811584473, -4.113807201385498, -3.1725213527679443, -2.2312355041503906, -1.289949893951416, -0.3486642837524414, 0.5926218032836914, 1.533907413482666, 2.4751930236816406, 3.4164786338806152, 4.35776424407959, 5.299050331115723, 6.240335941314697, 7.181621551513672, 8.122907638549805, 9.064193725585938, 10.005478858947754, 10.946764945983887, 11.888050079345703, 12.829336166381836, 13.770622253417969, 14.711907386779785, 15.653193473815918, 16.594478607177734, 17.535764694213867, 18.47705078125, 19.418336868286133, 20.359622955322266, 21.300907135009766, 22.2421932220459, 23.18347930908203, 24.124765396118164, 25.066051483154297, 26.00733757019043, 26.948623657226562, 27.889907836914062, 28.831193923950195, 29.772480010986328, 30.71376609802246, 31.655052185058594, 32.596336364746094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 14.0, 14.0, 19.0, 26.0, 31.0, 54.0, 57.0, 88.0, 143.0, 157.0, 269.0, 401.0, 584.0, 1033.0, 1776.0, 3392.0, 6477.0, 15118.0, 47308.0, 328796.0, 3576877.0, 155656.0, 32728.0, 11760.0, 5040.0, 2672.0, 1471.0, 854.0, 500.0, 295.0, 201.0, 160.0, 86.0, 60.0, 32.0, 25.0, 33.0, 14.0, 14.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.67578125, -6.4814453125, -6.287109375, -6.0927734375, -5.8984375, -5.7041015625, -5.509765625, -5.3154296875, -5.12109375, -4.9267578125, -4.732421875, -4.5380859375, -4.34375, -4.1494140625, -3.955078125, -3.7607421875, -3.56640625, -3.3720703125, -3.177734375, -2.9833984375, -2.7890625, -2.5947265625, -2.400390625, -2.2060546875, -2.01171875, -1.8173828125, -1.623046875, -1.4287109375, -1.234375, -1.0400390625, -0.845703125, -0.6513671875, -0.45703125, -0.2626953125, -0.068359375, 0.1259765625, 0.3203125, 0.5146484375, 0.708984375, 0.9033203125, 1.09765625, 1.2919921875, 1.486328125, 1.6806640625, 1.875, 2.0693359375, 2.263671875, 2.4580078125, 2.65234375, 2.8466796875, 3.041015625, 3.2353515625, 3.4296875, 3.6240234375, 3.818359375, 4.0126953125, 4.20703125, 4.4013671875, 4.595703125, 4.7900390625, 4.984375, 5.1787109375, 5.373046875, 5.5673828125, 5.76171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 3.0, 9.0, 5.0, 7.0, 11.0, 21.0, 12.0, 17.0, 36.0, 32.0, 30.0, 40.0, 47.0, 41.0, 66.0, 58.0, 67.0, 51.0, 55.0, 60.0, 46.0, 47.0, 53.0, 34.0, 33.0, 22.0, 17.0, 18.0, 18.0, 14.0, 8.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.116851806640625, -2.05010986328125, -1.983367919921875, -1.9166259765625, -1.849884033203125, -1.78314208984375, -1.716400146484375, -1.649658203125, -1.582916259765625, -1.51617431640625, -1.449432373046875, -1.3826904296875, -1.315948486328125, -1.24920654296875, -1.182464599609375, -1.11572265625, -1.048980712890625, -0.98223876953125, -0.915496826171875, -0.8487548828125, -0.782012939453125, -0.71527099609375, -0.648529052734375, -0.581787109375, -0.515045166015625, -0.44830322265625, -0.381561279296875, -0.3148193359375, -0.248077392578125, -0.18133544921875, -0.114593505859375, -0.0478515625, 0.018890380859375, 0.08563232421875, 0.152374267578125, 0.2191162109375, 0.285858154296875, 0.35260009765625, 0.419342041015625, 0.486083984375, 0.552825927734375, 0.61956787109375, 0.686309814453125, 0.7530517578125, 0.819793701171875, 0.88653564453125, 0.953277587890625, 1.02001953125, 1.086761474609375, 1.15350341796875, 1.220245361328125, 1.2869873046875, 1.353729248046875, 1.42047119140625, 1.487213134765625, 1.553955078125, 1.620697021484375, 1.68743896484375, 1.754180908203125, 1.8209228515625, 1.887664794921875, 1.95440673828125, 2.021148681640625, 2.087890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 13.0, 11.0, 35.0, 57.0, 93.0, 157.0, 285.0, 615.0, 1402.0, 3947.0, 15756.0, 152667.0, 3812713.0, 182984.0, 16902.0, 3972.0, 1418.0, 571.0, 303.0, 171.0, 85.0, 50.0, 30.0, 18.0, 10.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.927734375, -5.67578125, -5.423828125, -5.171875, -4.919921875, -4.66796875, -4.416015625, -4.1640625, -3.912109375, -3.66015625, -3.408203125, -3.15625, -2.904296875, -2.65234375, -2.400390625, -2.1484375, -1.896484375, -1.64453125, -1.392578125, -1.140625, -0.888671875, -0.63671875, -0.384765625, -0.1328125, 0.119140625, 0.37109375, 0.623046875, 0.875, 1.126953125, 1.37890625, 1.630859375, 1.8828125, 2.134765625, 2.38671875, 2.638671875, 2.890625, 3.142578125, 3.39453125, 3.646484375, 3.8984375, 4.150390625, 4.40234375, 4.654296875, 4.90625, 5.158203125, 5.41015625, 5.662109375, 5.9140625, 6.166015625, 6.41796875, 6.669921875, 6.921875, 7.173828125, 7.42578125, 7.677734375, 7.9296875, 8.181640625, 8.43359375, 8.685546875, 8.9375, 9.189453125, 9.44140625, 9.693359375, 9.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 8.0, 11.0, 18.0, 31.0, 58.0, 115.0, 300.0, 1704.0, 1274.0, 294.0, 115.0, 58.0, 29.0, 18.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.2186279296875, -3.111083984375, -3.0035400390625, -2.89599609375, -2.7884521484375, -2.680908203125, -2.5733642578125, -2.4658203125, -2.3582763671875, -2.250732421875, -2.1431884765625, -2.03564453125, -1.9281005859375, -1.820556640625, -1.7130126953125, -1.60546875, -1.4979248046875, -1.390380859375, -1.2828369140625, -1.17529296875, -1.0677490234375, -0.960205078125, -0.8526611328125, -0.7451171875, -0.6375732421875, -0.530029296875, -0.4224853515625, -0.31494140625, -0.2073974609375, -0.099853515625, 0.0076904296875, 0.115234375, 0.2227783203125, 0.330322265625, 0.4378662109375, 0.54541015625, 0.6529541015625, 0.760498046875, 0.8680419921875, 0.9755859375, 1.0831298828125, 1.190673828125, 1.2982177734375, 1.40576171875, 1.5133056640625, 1.620849609375, 1.7283935546875, 1.8359375, 1.9434814453125, 2.051025390625, 2.1585693359375, 2.26611328125, 2.3736572265625, 2.481201171875, 2.5887451171875, 2.6962890625, 2.8038330078125, 2.911376953125, 3.0189208984375, 3.12646484375, 3.2340087890625, 3.341552734375, 3.4490966796875, 3.556640625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 18.0, 26.0, 66.0, 124.0, 168.0, 183.0, 169.0, 113.0, 68.0, 24.0, 20.0, 10.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.105419158935547, -25.56537437438965, -25.02532958984375, -24.48528480529785, -23.945240020751953, -23.405195236206055, -22.865150451660156, -22.32510757446289, -21.78506088256836, -21.24501609802246, -20.704971313476562, -20.164926528930664, -19.624881744384766, -19.084836959838867, -18.54479217529297, -18.004749298095703, -17.464704513549805, -16.924659729003906, -16.384614944458008, -15.84457015991211, -15.304525375366211, -14.764480590820312, -14.22443675994873, -13.684391975402832, -13.144347190856934, -12.604302406311035, -12.064257621765137, -11.524212837219238, -10.984169006347656, -10.444124221801758, -9.90407943725586, -9.364034652709961, -8.823991775512695, -8.283946990966797, -7.743902206420898, -7.203857898712158, -6.66381311416626, -6.123768329620361, -5.583724021911621, -5.043679237365723, -4.503634452819824, -3.963589668273926, -3.4235451221466064, -2.883500576019287, -2.3434557914733887, -1.8034110069274902, -1.263366460800171, -0.7233219146728516, -0.18327713012695312, 0.35676753520965576, 0.8968122005462646, 1.4368568658828735, 1.9769015312194824, 2.516946315765381, 3.0569908618927, 3.5970354080200195, 4.137080192565918, 4.677124977111816, 5.217169761657715, 5.757214069366455, 6.2972588539123535, 6.837303638458252, 7.377347946166992, 7.917392730712891, 8.457437515258789]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 13.0, 10.0, 16.0, 21.0, 25.0, 30.0, 19.0, 56.0, 38.0, 54.0, 52.0, 49.0, 59.0, 53.0, 63.0, 67.0, 60.0, 46.0, 24.0, 43.0, 40.0, 33.0, 30.0, 24.0, 19.0, 14.0, 5.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.014872550964355, -8.690292358398438, -8.36571216583252, -8.041132926940918, -7.716552734375, -7.391972541809082, -7.067392349243164, -6.742812156677246, -6.418232440948486, -6.093652248382568, -5.769072532653809, -5.444492340087891, -5.119912147521973, -4.795332431793213, -4.470752239227295, -4.146172523498535, -3.821592330932617, -3.4970123767852783, -3.1724324226379395, -2.8478522300720215, -2.5232722759246826, -2.1986923217773438, -1.8741122484207153, -1.549532175064087, -1.224952220916748, -0.9003722071647644, -0.5757921934127808, -0.2512121796607971, 0.07336783409118652, 0.3979477882385254, 0.7225278615951538, 1.0471079349517822, 1.3716888427734375, 1.6962687969207764, 2.0208487510681152, 2.345428943634033, 2.670008897781372, 2.994588851928711, 3.319169044494629, 3.6437489986419678, 3.9683289527893066, 4.292909145355225, 4.617488861083984, 4.942069053649902, 5.26664924621582, 5.59122896194458, 5.915809154510498, 6.240388870239258, 6.564969062805176, 6.889549255371094, 7.2141289710998535, 7.5387091636657715, 7.863288879394531, 8.18786907196045, 8.512449264526367, 8.837029457092285, 9.161609649658203, 9.486189842224121, 9.810770034790039, 10.13534927368164, 10.459929466247559, 10.784509658813477, 11.109089851379395, 11.433670043945312, 11.758249282836914]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 16.0, 20.0, 32.0, 43.0, 80.0, 150.0, 224.0, 428.0, 989.0, 2532.0, 7878.0, 29398.0, 141391.0, 565348.0, 236185.0, 46437.0, 11300.0, 3539.0, 1336.0, 558.0, 238.0, 171.0, 81.0, 49.0, 36.0, 23.0, 15.0, 6.0, 11.0, 7.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3828125, -10.1070556640625, -9.831298828125, -9.5555419921875, -9.27978515625, -9.0040283203125, -8.728271484375, -8.4525146484375, -8.1767578125, -7.9010009765625, -7.625244140625, -7.3494873046875, -7.07373046875, -6.7979736328125, -6.522216796875, -6.2464599609375, -5.970703125, -5.6949462890625, -5.419189453125, -5.1434326171875, -4.86767578125, -4.5919189453125, -4.316162109375, -4.0404052734375, -3.7646484375, -3.4888916015625, -3.213134765625, -2.9373779296875, -2.66162109375, -2.3858642578125, -2.110107421875, -1.8343505859375, -1.55859375, -1.2828369140625, -1.007080078125, -0.7313232421875, -0.45556640625, -0.1798095703125, 0.095947265625, 0.3717041015625, 0.6474609375, 0.9232177734375, 1.198974609375, 1.4747314453125, 1.75048828125, 2.0262451171875, 2.302001953125, 2.5777587890625, 2.853515625, 3.1292724609375, 3.405029296875, 3.6807861328125, 3.95654296875, 4.2322998046875, 4.508056640625, 4.7838134765625, 5.0595703125, 5.3353271484375, 5.611083984375, 5.8868408203125, 6.16259765625, 6.4383544921875, 6.714111328125, 6.9898681640625, 7.265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 7.0, 9.0, 8.0, 10.0, 14.0, 28.0, 34.0, 24.0, 28.0, 44.0, 42.0, 46.0, 46.0, 68.0, 56.0, 57.0, 54.0, 57.0, 44.0, 56.0, 53.0, 42.0, 44.0, 23.0, 15.0, 20.0, 18.0, 11.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.443359375, -2.3759613037109375, -2.308563232421875, -2.2411651611328125, -2.17376708984375, -2.1063690185546875, -2.038970947265625, -1.9715728759765625, -1.9041748046875, -1.8367767333984375, -1.769378662109375, -1.7019805908203125, -1.63458251953125, -1.5671844482421875, -1.499786376953125, -1.4323883056640625, -1.364990234375, -1.2975921630859375, -1.230194091796875, -1.1627960205078125, -1.09539794921875, -1.0279998779296875, -0.960601806640625, -0.8932037353515625, -0.8258056640625, -0.7584075927734375, -0.691009521484375, -0.6236114501953125, -0.55621337890625, -0.4888153076171875, -0.421417236328125, -0.3540191650390625, -0.28662109375, -0.2192230224609375, -0.151824951171875, -0.0844268798828125, -0.01702880859375, 0.0503692626953125, 0.117767333984375, 0.1851654052734375, 0.2525634765625, 0.3199615478515625, 0.387359619140625, 0.4547576904296875, 0.52215576171875, 0.5895538330078125, 0.656951904296875, 0.7243499755859375, 0.791748046875, 0.8591461181640625, 0.926544189453125, 0.9939422607421875, 1.06134033203125, 1.1287384033203125, 1.196136474609375, 1.2635345458984375, 1.3309326171875, 1.3983306884765625, 1.465728759765625, 1.5331268310546875, 1.60052490234375, 1.6679229736328125, 1.735321044921875, 1.8027191162109375, 1.8701171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 11.0, 14.0, 19.0, 21.0, 37.0, 51.0, 50.0, 67.0, 100.0, 164.0, 200.0, 352.0, 609.0, 1059.0, 2428.0, 5564.0, 14414.0, 42164.0, 134124.0, 423427.0, 291972.0, 85748.0, 27744.0, 10007.0, 4055.0, 1838.0, 884.0, 509.0, 286.0, 169.0, 125.0, 104.0, 54.0, 42.0, 35.0, 23.0, 20.0, 15.0, 8.0, 3.0, 11.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.48333740234375, -4.3221435546875, -4.16094970703125, -3.999755859375, -3.83856201171875, -3.6773681640625, -3.51617431640625, -3.35498046875, -3.19378662109375, -3.0325927734375, -2.87139892578125, -2.710205078125, -2.54901123046875, -2.3878173828125, -2.22662353515625, -2.0654296875, -1.90423583984375, -1.7430419921875, -1.58184814453125, -1.420654296875, -1.25946044921875, -1.0982666015625, -0.93707275390625, -0.77587890625, -0.61468505859375, -0.4534912109375, -0.29229736328125, -0.131103515625, 0.03009033203125, 0.1912841796875, 0.35247802734375, 0.513671875, 0.67486572265625, 0.8360595703125, 0.99725341796875, 1.158447265625, 1.31964111328125, 1.4808349609375, 1.64202880859375, 1.80322265625, 1.96441650390625, 2.1256103515625, 2.28680419921875, 2.447998046875, 2.60919189453125, 2.7703857421875, 2.93157958984375, 3.0927734375, 3.25396728515625, 3.4151611328125, 3.57635498046875, 3.737548828125, 3.89874267578125, 4.0599365234375, 4.22113037109375, 4.38232421875, 4.54351806640625, 4.7047119140625, 4.86590576171875, 5.027099609375, 5.18829345703125, 5.3494873046875, 5.51068115234375, 5.671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 7.0, 4.0, 8.0, 9.0, 9.0, 14.0, 15.0, 26.0, 24.0, 24.0, 30.0, 31.0, 27.0, 38.0, 35.0, 41.0, 36.0, 45.0, 59.0, 38.0, 46.0, 38.0, 32.0, 41.0, 23.0, 35.0, 35.0, 34.0, 22.0, 26.0, 23.0, 24.0, 16.0, 13.0, 7.0, 10.0, 10.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.96875, -5.77081298828125, -5.5728759765625, -5.37493896484375, -5.177001953125, -4.97906494140625, -4.7811279296875, -4.58319091796875, -4.38525390625, -4.18731689453125, -3.9893798828125, -3.79144287109375, -3.593505859375, -3.39556884765625, -3.1976318359375, -2.99969482421875, -2.8017578125, -2.60382080078125, -2.4058837890625, -2.20794677734375, -2.010009765625, -1.81207275390625, -1.6141357421875, -1.41619873046875, -1.21826171875, -1.02032470703125, -0.8223876953125, -0.62445068359375, -0.426513671875, -0.22857666015625, -0.0306396484375, 0.16729736328125, 0.365234375, 0.56317138671875, 0.7611083984375, 0.95904541015625, 1.156982421875, 1.35491943359375, 1.5528564453125, 1.75079345703125, 1.94873046875, 2.14666748046875, 2.3446044921875, 2.54254150390625, 2.740478515625, 2.93841552734375, 3.1363525390625, 3.33428955078125, 3.5322265625, 3.73016357421875, 3.9281005859375, 4.12603759765625, 4.323974609375, 4.52191162109375, 4.7198486328125, 4.91778564453125, 5.11572265625, 5.31365966796875, 5.5115966796875, 5.70953369140625, 5.907470703125, 6.10540771484375, 6.3033447265625, 6.50128173828125, 6.69921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 13.0, 15.0, 28.0, 68.0, 165.0, 443.0, 1498.0, 7210.0, 58765.0, 829071.0, 134954.0, 13036.0, 2245.0, 641.0, 227.0, 93.0, 39.0, 20.0, 8.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.481689453125, -4.33056640625, -4.179443359375, -4.0283203125, -3.877197265625, -3.72607421875, -3.574951171875, -3.423828125, -3.272705078125, -3.12158203125, -2.970458984375, -2.8193359375, -2.668212890625, -2.51708984375, -2.365966796875, -2.21484375, -2.063720703125, -1.91259765625, -1.761474609375, -1.6103515625, -1.459228515625, -1.30810546875, -1.156982421875, -1.005859375, -0.854736328125, -0.70361328125, -0.552490234375, -0.4013671875, -0.250244140625, -0.09912109375, 0.052001953125, 0.203125, 0.354248046875, 0.50537109375, 0.656494140625, 0.8076171875, 0.958740234375, 1.10986328125, 1.260986328125, 1.412109375, 1.563232421875, 1.71435546875, 1.865478515625, 2.0166015625, 2.167724609375, 2.31884765625, 2.469970703125, 2.62109375, 2.772216796875, 2.92333984375, 3.074462890625, 3.2255859375, 3.376708984375, 3.52783203125, 3.678955078125, 3.830078125, 3.981201171875, 4.13232421875, 4.283447265625, 4.4345703125, 4.585693359375, 4.73681640625, 4.887939453125, 5.0390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 4.0, 17.0, 23.0, 22.0, 27.0, 63.0, 113.0, 199.0, 210.0, 105.0, 58.0, 37.0, 21.0, 19.0, 16.0, 14.0, 8.0, 3.0, 4.0, 6.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004558563232421875, -0.00043683499097824097, -0.00041781365871429443, -0.0003987923264503479, -0.00037977099418640137, -0.00036074966192245483, -0.0003417283296585083, -0.00032270699739456177, -0.00030368566513061523, -0.0002846643328666687, -0.00026564300060272217, -0.00024662166833877563, -0.0002276003360748291, -0.00020857900381088257, -0.00018955767154693604, -0.0001705363392829895, -0.00015151500701904297, -0.00013249367475509644, -0.0001134723424911499, -9.445101022720337e-05, -7.542967796325684e-05, -5.64083456993103e-05, -3.738701343536377e-05, -1.8365681171417236e-05, 6.556510925292969e-07, 1.967698335647583e-05, 3.869831562042236e-05, 5.7719647884368896e-05, 7.674098014831543e-05, 9.576231241226196e-05, 0.0001147836446762085, 0.00013380497694015503, 0.00015282630920410156, 0.0001718476414680481, 0.00019086897373199463, 0.00020989030599594116, 0.0002289116382598877, 0.00024793297052383423, 0.00026695430278778076, 0.0002859756350517273, 0.00030499696731567383, 0.00032401829957962036, 0.0003430396318435669, 0.00036206096410751343, 0.00038108229637145996, 0.0004001036286354065, 0.00041912496089935303, 0.00043814629316329956, 0.0004571676254272461, 0.0004761889576911926, 0.0004952102899551392, 0.0005142316222190857, 0.0005332529544830322, 0.0005522742867469788, 0.0005712956190109253, 0.0005903169512748718, 0.0006093382835388184, 0.0006283596158027649, 0.0006473809480667114, 0.000666402280330658, 0.0006854236125946045, 0.000704444944858551, 0.0007234662771224976, 0.0007424876093864441, 0.0007615089416503906]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 17.0, 27.0, 55.0, 76.0, 256.0, 910.0, 5416.0, 57465.0, 921528.0, 56178.0, 5283.0, 872.0, 251.0, 95.0, 59.0, 25.0, 20.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.87542724609375, -3.6766357421875, -3.47784423828125, -3.279052734375, -3.08026123046875, -2.8814697265625, -2.68267822265625, -2.48388671875, -2.28509521484375, -2.0863037109375, -1.88751220703125, -1.688720703125, -1.48992919921875, -1.2911376953125, -1.09234619140625, -0.8935546875, -0.69476318359375, -0.4959716796875, -0.29718017578125, -0.098388671875, 0.10040283203125, 0.2991943359375, 0.49798583984375, 0.69677734375, 0.89556884765625, 1.0943603515625, 1.29315185546875, 1.491943359375, 1.69073486328125, 1.8895263671875, 2.08831787109375, 2.287109375, 2.48590087890625, 2.6846923828125, 2.88348388671875, 3.082275390625, 3.28106689453125, 3.4798583984375, 3.67864990234375, 3.87744140625, 4.07623291015625, 4.2750244140625, 4.47381591796875, 4.672607421875, 4.87139892578125, 5.0701904296875, 5.26898193359375, 5.4677734375, 5.66656494140625, 5.8653564453125, 6.06414794921875, 6.262939453125, 6.46173095703125, 6.6605224609375, 6.85931396484375, 7.05810546875, 7.25689697265625, 7.4556884765625, 7.65447998046875, 7.853271484375, 8.05206298828125, 8.2508544921875, 8.44964599609375, 8.6484375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 11.0, 16.0, 35.0, 42.0, 89.0, 135.0, 228.0, 197.0, 105.0, 48.0, 26.0, 23.0, 19.0, 6.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -1.998992919921875, -1.86322021484375, -1.727447509765625, -1.5916748046875, -1.455902099609375, -1.32012939453125, -1.184356689453125, -1.048583984375, -0.912811279296875, -0.77703857421875, -0.641265869140625, -0.5054931640625, -0.369720458984375, -0.23394775390625, -0.098175048828125, 0.03759765625, 0.173370361328125, 0.30914306640625, 0.444915771484375, 0.5806884765625, 0.716461181640625, 0.85223388671875, 0.988006591796875, 1.123779296875, 1.259552001953125, 1.39532470703125, 1.531097412109375, 1.6668701171875, 1.802642822265625, 1.93841552734375, 2.074188232421875, 2.2099609375, 2.345733642578125, 2.48150634765625, 2.617279052734375, 2.7530517578125, 2.888824462890625, 3.02459716796875, 3.160369873046875, 3.296142578125, 3.431915283203125, 3.56768798828125, 3.703460693359375, 3.8392333984375, 3.975006103515625, 4.11077880859375, 4.246551513671875, 4.38232421875, 4.518096923828125, 4.65386962890625, 4.789642333984375, 4.9254150390625, 5.061187744140625, 5.19696044921875, 5.332733154296875, 5.468505859375, 5.604278564453125, 5.74005126953125, 5.875823974609375, 6.0115966796875, 6.147369384765625, 6.28314208984375, 6.418914794921875, 6.5546875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 24.0, 52.0, 79.0, 145.0, 186.0, 192.0, 144.0, 81.0, 38.0, 24.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.9426155090332, -61.23741912841797, -59.5322265625, -57.827030181884766, -56.12183380126953, -54.41664123535156, -52.71144485473633, -51.006248474121094, -49.301055908203125, -47.59585952758789, -45.89066696166992, -44.18547058105469, -42.48027801513672, -40.775081634521484, -39.06988525390625, -37.36469268798828, -35.65949630737305, -33.95429992675781, -32.249107360839844, -30.54391098022461, -28.838716506958008, -27.133522033691406, -25.428325653076172, -23.72313117980957, -22.01793670654297, -20.312742233276367, -18.607547760009766, -16.90235137939453, -15.19715690612793, -13.491962432861328, -11.78676700592041, -10.081571578979492, -8.376380920410156, -6.6711859703063965, -4.965991020202637, -3.260796070098877, -1.5556011199951172, 0.14959335327148438, 1.8547887802124023, 3.5599842071533203, 5.265178680419922, 6.970373630523682, 8.675568580627441, 10.38076400756836, 12.085958480834961, 13.791152954101562, 15.49634838104248, 17.2015438079834, 18.90673828125, 20.6119327545166, 22.317127227783203, 24.022323608398438, 25.72751808166504, 27.43271255493164, 29.137908935546875, 30.843103408813477, 32.54829788208008, 34.25349426269531, 35.95868682861328, 37.663883209228516, 39.36907958984375, 41.07427215576172, 42.77946853637695, 44.48466491699219, 46.189857482910156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 6.0, 9.0, 23.0, 16.0, 31.0, 28.0, 25.0, 36.0, 34.0, 37.0, 38.0, 44.0, 41.0, 43.0, 40.0, 41.0, 47.0, 42.0, 50.0, 41.0, 44.0, 27.0, 38.0, 17.0, 30.0, 22.0, 20.0, 23.0, 10.0, 16.0, 13.0, 10.0, 12.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53301239013672, -28.52191162109375, -27.510812759399414, -26.499711990356445, -25.48861312866211, -24.47751235961914, -23.466411590576172, -22.455310821533203, -21.444211959838867, -20.4331111907959, -19.422012329101562, -18.410911560058594, -17.399810791015625, -16.38871192932129, -15.37761116027832, -14.366511344909668, -13.355411529541016, -12.344311714172363, -11.333211898803711, -10.322111129760742, -9.31101131439209, -8.299911499023438, -7.288811206817627, -6.277710914611816, -5.266611099243164, -4.255511283874512, -3.244410991668701, -2.2333109378814697, -1.2222108840942383, -0.21111106872558594, 0.7999892234802246, 1.8110895156860352, 2.822193145751953, 3.8332931995391846, 4.844393253326416, 5.855493545532227, 6.866593360900879, 7.877693176269531, 8.8887939453125, 9.899893760681152, 10.910993576049805, 11.922093391418457, 12.93319320678711, 13.944293975830078, 14.95539379119873, 15.966493606567383, 16.97759437561035, 17.988693237304688, 18.999794006347656, 20.010894775390625, 21.02199363708496, 22.03309440612793, 23.044193267822266, 24.055294036865234, 25.066394805908203, 26.077495574951172, 27.088594436645508, 28.099695205688477, 29.110794067382812, 30.12189483642578, 31.13299560546875, 32.14409637451172, 33.15519332885742, 34.16629409790039, 35.17739486694336]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 10.0, 10.0, 11.0, 14.0, 19.0, 21.0, 27.0, 40.0, 41.0, 63.0, 130.0, 179.0, 212.0, 327.0, 482.0, 887.0, 1435.0, 2384.0, 4778.0, 10022.0, 26493.0, 128386.0, 3752016.0, 208590.0, 34040.0, 11834.0, 5153.0, 2729.0, 1498.0, 845.0, 540.0, 366.0, 232.0, 126.0, 89.0, 72.0, 46.0, 49.0, 23.0, 17.0, 19.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8515625, -9.58233642578125, -9.3131103515625, -9.04388427734375, -8.774658203125, -8.50543212890625, -8.2362060546875, -7.96697998046875, -7.69775390625, -7.42852783203125, -7.1593017578125, -6.89007568359375, -6.620849609375, -6.35162353515625, -6.0823974609375, -5.81317138671875, -5.5439453125, -5.27471923828125, -5.0054931640625, -4.73626708984375, -4.467041015625, -4.19781494140625, -3.9285888671875, -3.65936279296875, -3.39013671875, -3.12091064453125, -2.8516845703125, -2.58245849609375, -2.313232421875, -2.04400634765625, -1.7747802734375, -1.50555419921875, -1.236328125, -0.96710205078125, -0.6978759765625, -0.42864990234375, -0.159423828125, 0.10980224609375, 0.3790283203125, 0.64825439453125, 0.91748046875, 1.18670654296875, 1.4559326171875, 1.72515869140625, 1.994384765625, 2.26361083984375, 2.5328369140625, 2.80206298828125, 3.0712890625, 3.34051513671875, 3.6097412109375, 3.87896728515625, 4.148193359375, 4.41741943359375, 4.6866455078125, 4.95587158203125, 5.22509765625, 5.49432373046875, 5.7635498046875, 6.03277587890625, 6.302001953125, 6.57122802734375, 6.8404541015625, 7.10968017578125, 7.37890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 13.0, 6.0, 8.0, 11.0, 14.0, 22.0, 18.0, 35.0, 34.0, 33.0, 47.0, 45.0, 51.0, 53.0, 57.0, 58.0, 55.0, 56.0, 62.0, 48.0, 43.0, 39.0, 34.0, 30.0, 30.0, 27.0, 13.0, 12.0, 13.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.4086151123046875, -2.338714599609375, -2.2688140869140625, -2.19891357421875, -2.1290130615234375, -2.059112548828125, -1.9892120361328125, -1.9193115234375, -1.8494110107421875, -1.779510498046875, -1.7096099853515625, -1.63970947265625, -1.5698089599609375, -1.499908447265625, -1.4300079345703125, -1.360107421875, -1.2902069091796875, -1.220306396484375, -1.1504058837890625, -1.08050537109375, -1.0106048583984375, -0.940704345703125, -0.8708038330078125, -0.8009033203125, -0.7310028076171875, -0.661102294921875, -0.5912017822265625, -0.52130126953125, -0.4514007568359375, -0.381500244140625, -0.3115997314453125, -0.24169921875, -0.1717987060546875, -0.101898193359375, -0.0319976806640625, 0.03790283203125, 0.1078033447265625, 0.177703857421875, 0.2476043701171875, 0.3175048828125, 0.3874053955078125, 0.457305908203125, 0.5272064208984375, 0.59710693359375, 0.6670074462890625, 0.736907958984375, 0.8068084716796875, 0.876708984375, 0.9466094970703125, 1.016510009765625, 1.0864105224609375, 1.15631103515625, 1.2262115478515625, 1.296112060546875, 1.3660125732421875, 1.4359130859375, 1.5058135986328125, 1.575714111328125, 1.6456146240234375, 1.71551513671875, 1.7854156494140625, 1.855316162109375, 1.9252166748046875, 1.9951171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 7.0, 15.0, 17.0, 30.0, 64.0, 127.0, 301.0, 819.0, 2811.0, 13490.0, 214716.0, 3902110.0, 50846.0, 6429.0, 1550.0, 530.0, 202.0, 90.0, 53.0, 33.0, 17.0, 19.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.6519775390625, -7.233642578125, -6.8153076171875, -6.39697265625, -5.9786376953125, -5.560302734375, -5.1419677734375, -4.7236328125, -4.3052978515625, -3.886962890625, -3.4686279296875, -3.05029296875, -2.6319580078125, -2.213623046875, -1.7952880859375, -1.376953125, -0.9586181640625, -0.540283203125, -0.1219482421875, 0.29638671875, 0.7147216796875, 1.133056640625, 1.5513916015625, 1.9697265625, 2.3880615234375, 2.806396484375, 3.2247314453125, 3.64306640625, 4.0614013671875, 4.479736328125, 4.8980712890625, 5.31640625, 5.7347412109375, 6.153076171875, 6.5714111328125, 6.98974609375, 7.4080810546875, 7.826416015625, 8.2447509765625, 8.6630859375, 9.0814208984375, 9.499755859375, 9.9180908203125, 10.33642578125, 10.7547607421875, 11.173095703125, 11.5914306640625, 12.009765625, 12.4281005859375, 12.846435546875, 13.2647705078125, 13.68310546875, 14.1014404296875, 14.519775390625, 14.9381103515625, 15.3564453125, 15.7747802734375, 16.193115234375, 16.6114501953125, 17.02978515625, 17.4481201171875, 17.866455078125, 18.2847900390625, 18.703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 8.0, 19.0, 29.0, 41.0, 68.0, 190.0, 813.0, 2384.0, 276.0, 105.0, 44.0, 23.0, 19.0, 7.0, 5.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6640625, -3.53424072265625, -3.4044189453125, -3.27459716796875, -3.144775390625, -3.01495361328125, -2.8851318359375, -2.75531005859375, -2.62548828125, -2.49566650390625, -2.3658447265625, -2.23602294921875, -2.106201171875, -1.97637939453125, -1.8465576171875, -1.71673583984375, -1.5869140625, -1.45709228515625, -1.3272705078125, -1.19744873046875, -1.067626953125, -0.93780517578125, -0.8079833984375, -0.67816162109375, -0.54833984375, -0.41851806640625, -0.2886962890625, -0.15887451171875, -0.029052734375, 0.10076904296875, 0.2305908203125, 0.36041259765625, 0.490234375, 0.62005615234375, 0.7498779296875, 0.87969970703125, 1.009521484375, 1.13934326171875, 1.2691650390625, 1.39898681640625, 1.52880859375, 1.65863037109375, 1.7884521484375, 1.91827392578125, 2.048095703125, 2.17791748046875, 2.3077392578125, 2.43756103515625, 2.5673828125, 2.69720458984375, 2.8270263671875, 2.95684814453125, 3.086669921875, 3.21649169921875, 3.3463134765625, 3.47613525390625, 3.60595703125, 3.73577880859375, 3.8656005859375, 3.99542236328125, 4.125244140625, 4.25506591796875, 4.3848876953125, 4.51470947265625, 4.64453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 9.0, 15.0, 22.0, 41.0, 88.0, 99.0, 139.0, 157.0, 133.0, 103.0, 70.0, 54.0, 34.0, 14.0, 5.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.901444435119629, -15.409701347351074, -14.91795825958252, -14.426216125488281, -13.934473037719727, -13.442729949951172, -12.950986862182617, -12.459243774414062, -11.967500686645508, -11.475757598876953, -10.984014511108398, -10.492271423339844, -10.000529289245605, -9.50878620147705, -9.017043113708496, -8.525300025939941, -8.033557891845703, -7.541814804077148, -7.050072193145752, -6.558329105377197, -6.066586494445801, -5.574843406677246, -5.083100318908691, -4.591357231140137, -4.09961462020874, -3.6078717708587646, -3.116128921508789, -2.6243858337402344, -2.132642984390259, -1.6409001350402832, -1.1491570472717285, -0.6574141979217529, -0.16567039489746094, 0.3260725140571594, 0.8178154230117798, 1.309558391571045, 1.8013012409210205, 2.293044090270996, 2.784787178039551, 3.2765300273895264, 3.768272876739502, 4.260015964508057, 4.751758575439453, 5.243501663208008, 5.7352447509765625, 6.226987361907959, 6.718730449676514, 7.21047306060791, 7.702216148376465, 8.19395923614502, 8.685702323913574, 9.177444458007812, 9.669187545776367, 10.160930633544922, 10.652673721313477, 11.144416809082031, 11.636159896850586, 12.12790298461914, 12.619646072387695, 13.11138916015625, 13.603131294250488, 14.094874382019043, 14.586617469787598, 15.078360557556152, 15.57010269165039]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 3.0, 12.0, 12.0, 15.0, 16.0, 16.0, 19.0, 26.0, 41.0, 24.0, 25.0, 36.0, 49.0, 37.0, 35.0, 63.0, 35.0, 39.0, 39.0, 41.0, 42.0, 34.0, 36.0, 24.0, 40.0, 32.0, 31.0, 32.0, 22.0, 19.0, 11.0, 17.0, 17.0, 15.0, 4.0, 9.0, 5.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.623503684997559, -7.3664326667785645, -7.10936164855957, -6.852290630340576, -6.595219612121582, -6.338148593902588, -6.081077575683594, -5.8240065574646, -5.5669355392456055, -5.309864521026611, -5.052793502807617, -4.795722484588623, -4.538651466369629, -4.281580448150635, -4.024509429931641, -3.7674384117126465, -3.5103673934936523, -3.253296375274658, -2.996225357055664, -2.73915433883667, -2.482083320617676, -2.2250123023986816, -1.9679412841796875, -1.7108702659606934, -1.4537992477416992, -1.196728229522705, -0.9396572113037109, -0.6825861930847168, -0.42551517486572266, -0.16844415664672852, 0.08862686157226562, 0.34569787979125977, 0.6027679443359375, 0.8598389625549316, 1.1169099807739258, 1.37398099899292, 1.631052017211914, 1.8881230354309082, 2.1451940536499023, 2.4022650718688965, 2.6593360900878906, 2.9164071083068848, 3.173478126525879, 3.430549144744873, 3.687620162963867, 3.9446911811828613, 4.2017621994018555, 4.45883321762085, 4.715904235839844, 4.972975254058838, 5.230046272277832, 5.487117290496826, 5.74418830871582, 6.0012593269348145, 6.258330345153809, 6.515401363372803, 6.772472381591797, 7.029543399810791, 7.286614418029785, 7.543685436248779, 7.800756454467773, 8.05782699584961, 8.314898490905762, 8.571969985961914, 8.82904052734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 27.0, 23.0, 31.0, 51.0, 71.0, 129.0, 194.0, 315.0, 550.0, 914.0, 1786.0, 3472.0, 7911.0, 18732.0, 48743.0, 143655.0, 388832.0, 281372.0, 93930.0, 32946.0, 13123.0, 5659.0, 2803.0, 1435.0, 754.0, 412.0, 241.0, 132.0, 100.0, 67.0, 47.0, 14.0, 13.0, 14.0, 8.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.87835693359375, -5.6590576171875, -5.43975830078125, -5.220458984375, -5.00115966796875, -4.7818603515625, -4.56256103515625, -4.34326171875, -4.12396240234375, -3.9046630859375, -3.68536376953125, -3.466064453125, -3.24676513671875, -3.0274658203125, -2.80816650390625, -2.5888671875, -2.36956787109375, -2.1502685546875, -1.93096923828125, -1.711669921875, -1.49237060546875, -1.2730712890625, -1.05377197265625, -0.83447265625, -0.61517333984375, -0.3958740234375, -0.17657470703125, 0.042724609375, 0.26202392578125, 0.4813232421875, 0.70062255859375, 0.919921875, 1.13922119140625, 1.3585205078125, 1.57781982421875, 1.797119140625, 2.01641845703125, 2.2357177734375, 2.45501708984375, 2.67431640625, 2.89361572265625, 3.1129150390625, 3.33221435546875, 3.551513671875, 3.77081298828125, 3.9901123046875, 4.20941162109375, 4.4287109375, 4.64801025390625, 4.8673095703125, 5.08660888671875, 5.305908203125, 5.52520751953125, 5.7445068359375, 5.96380615234375, 6.18310546875, 6.40240478515625, 6.6217041015625, 6.84100341796875, 7.060302734375, 7.27960205078125, 7.4989013671875, 7.71820068359375, 7.9375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 11.0, 15.0, 22.0, 16.0, 21.0, 21.0, 37.0, 32.0, 52.0, 59.0, 51.0, 50.0, 54.0, 65.0, 54.0, 49.0, 58.0, 43.0, 49.0, 37.0, 38.0, 33.0, 26.0, 25.0, 15.0, 15.0, 9.0, 10.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.5057373046875, -2.433349609375, -2.3609619140625, -2.28857421875, -2.2161865234375, -2.143798828125, -2.0714111328125, -1.9990234375, -1.9266357421875, -1.854248046875, -1.7818603515625, -1.70947265625, -1.6370849609375, -1.564697265625, -1.4923095703125, -1.419921875, -1.3475341796875, -1.275146484375, -1.2027587890625, -1.13037109375, -1.0579833984375, -0.985595703125, -0.9132080078125, -0.8408203125, -0.7684326171875, -0.696044921875, -0.6236572265625, -0.55126953125, -0.4788818359375, -0.406494140625, -0.3341064453125, -0.26171875, -0.1893310546875, -0.116943359375, -0.0445556640625, 0.02783203125, 0.1002197265625, 0.172607421875, 0.2449951171875, 0.3173828125, 0.3897705078125, 0.462158203125, 0.5345458984375, 0.60693359375, 0.6793212890625, 0.751708984375, 0.8240966796875, 0.896484375, 0.9688720703125, 1.041259765625, 1.1136474609375, 1.18603515625, 1.2584228515625, 1.330810546875, 1.4031982421875, 1.4755859375, 1.5479736328125, 1.620361328125, 1.6927490234375, 1.76513671875, 1.8375244140625, 1.909912109375, 1.9822998046875, 2.0546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 10.0, 5.0, 11.0, 12.0, 11.0, 33.0, 37.0, 63.0, 122.0, 170.0, 319.0, 519.0, 1022.0, 2259.0, 6118.0, 20942.0, 91578.0, 477488.0, 357374.0, 65688.0, 15839.0, 4922.0, 1928.0, 891.0, 458.0, 278.0, 171.0, 106.0, 55.0, 44.0, 27.0, 16.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.046875, -8.79486083984375, -8.5428466796875, -8.29083251953125, -8.038818359375, -7.78680419921875, -7.5347900390625, -7.28277587890625, -7.03076171875, -6.77874755859375, -6.5267333984375, -6.27471923828125, -6.022705078125, -5.77069091796875, -5.5186767578125, -5.26666259765625, -5.0146484375, -4.76263427734375, -4.5106201171875, -4.25860595703125, -4.006591796875, -3.75457763671875, -3.5025634765625, -3.25054931640625, -2.99853515625, -2.74652099609375, -2.4945068359375, -2.24249267578125, -1.990478515625, -1.73846435546875, -1.4864501953125, -1.23443603515625, -0.982421875, -0.73040771484375, -0.4783935546875, -0.22637939453125, 0.025634765625, 0.27764892578125, 0.5296630859375, 0.78167724609375, 1.03369140625, 1.28570556640625, 1.5377197265625, 1.78973388671875, 2.041748046875, 2.29376220703125, 2.5457763671875, 2.79779052734375, 3.0498046875, 3.30181884765625, 3.5538330078125, 3.80584716796875, 4.057861328125, 4.30987548828125, 4.5618896484375, 4.81390380859375, 5.06591796875, 5.31793212890625, 5.5699462890625, 5.82196044921875, 6.073974609375, 6.32598876953125, 6.5780029296875, 6.83001708984375, 7.08203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 14.0, 13.0, 17.0, 31.0, 30.0, 49.0, 33.0, 45.0, 54.0, 63.0, 77.0, 73.0, 71.0, 70.0, 43.0, 64.0, 56.0, 37.0, 24.0, 23.0, 31.0, 12.0, 18.0, 14.0, 5.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6494140625, -11.259765625, -10.8701171875, -10.48046875, -10.0908203125, -9.701171875, -9.3115234375, -8.921875, -8.5322265625, -8.142578125, -7.7529296875, -7.36328125, -6.9736328125, -6.583984375, -6.1943359375, -5.8046875, -5.4150390625, -5.025390625, -4.6357421875, -4.24609375, -3.8564453125, -3.466796875, -3.0771484375, -2.6875, -2.2978515625, -1.908203125, -1.5185546875, -1.12890625, -0.7392578125, -0.349609375, 0.0400390625, 0.4296875, 0.8193359375, 1.208984375, 1.5986328125, 1.98828125, 2.3779296875, 2.767578125, 3.1572265625, 3.546875, 3.9365234375, 4.326171875, 4.7158203125, 5.10546875, 5.4951171875, 5.884765625, 6.2744140625, 6.6640625, 7.0537109375, 7.443359375, 7.8330078125, 8.22265625, 8.6123046875, 9.001953125, 9.3916015625, 9.78125, 10.1708984375, 10.560546875, 10.9501953125, 11.33984375, 11.7294921875, 12.119140625, 12.5087890625, 12.8984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 2.0, 5.0, 4.0, 7.0, 16.0, 26.0, 45.0, 48.0, 76.0, 116.0, 233.0, 431.0, 814.0, 1705.0, 3847.0, 11067.0, 87060.0, 865442.0, 61189.0, 9759.0, 3416.0, 1504.0, 766.0, 401.0, 219.0, 131.0, 77.0, 47.0, 32.0, 18.0, 17.0, 13.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.739990234375, -9.44873046875, -9.157470703125, -8.8662109375, -8.574951171875, -8.28369140625, -7.992431640625, -7.701171875, -7.409912109375, -7.11865234375, -6.827392578125, -6.5361328125, -6.244873046875, -5.95361328125, -5.662353515625, -5.37109375, -5.079833984375, -4.78857421875, -4.497314453125, -4.2060546875, -3.914794921875, -3.62353515625, -3.332275390625, -3.041015625, -2.749755859375, -2.45849609375, -2.167236328125, -1.8759765625, -1.584716796875, -1.29345703125, -1.002197265625, -0.7109375, -0.419677734375, -0.12841796875, 0.162841796875, 0.4541015625, 0.745361328125, 1.03662109375, 1.327880859375, 1.619140625, 1.910400390625, 2.20166015625, 2.492919921875, 2.7841796875, 3.075439453125, 3.36669921875, 3.657958984375, 3.94921875, 4.240478515625, 4.53173828125, 4.822998046875, 5.1142578125, 5.405517578125, 5.69677734375, 5.988037109375, 6.279296875, 6.570556640625, 6.86181640625, 7.153076171875, 7.4443359375, 7.735595703125, 8.02685546875, 8.318115234375, 8.609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 12.0, 20.0, 25.0, 51.0, 52.0, 133.0, 365.0, 144.0, 93.0, 55.0, 25.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011434555053710938, -0.001095101237297058, -0.0010467469692230225, -0.0009983927011489868, -0.0009500384330749512, -0.0009016841650009155, -0.0008533298969268799, -0.0008049756288528442, -0.0007566213607788086, -0.000708267092704773, -0.0006599128246307373, -0.0006115585565567017, -0.000563204288482666, -0.0005148500204086304, -0.0004664957523345947, -0.0004181414842605591, -0.00036978721618652344, -0.0003214329481124878, -0.00027307868003845215, -0.0002247244119644165, -0.00017637014389038086, -0.00012801587581634521, -7.966160774230957e-05, -3.1307339668273926e-05, 1.704692840576172e-05, 6.540119647979736e-05, 0.00011375546455383301, 0.00016210973262786865, 0.0002104640007019043, 0.00025881826877593994, 0.0003071725368499756, 0.00035552680492401123, 0.0004038810729980469, 0.0004522353410720825, 0.0005005896091461182, 0.0005489438772201538, 0.0005972981452941895, 0.0006456524133682251, 0.0006940066814422607, 0.0007423609495162964, 0.000790715217590332, 0.0008390694856643677, 0.0008874237537384033, 0.000935778021812439, 0.0009841322898864746, 0.0010324865579605103, 0.001080840826034546, 0.0011291950941085815, 0.0011775493621826172, 0.0012259036302566528, 0.0012742578983306885, 0.0013226121664047241, 0.0013709664344787598, 0.0014193207025527954, 0.001467674970626831, 0.0015160292387008667, 0.0015643835067749023, 0.001612737774848938, 0.0016610920429229736, 0.0017094463109970093, 0.001757800579071045, 0.0018061548471450806, 0.0018545091152191162, 0.0019028633832931519, 0.0019512176513671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 7.0, 25.0, 27.0, 61.0, 126.0, 322.0, 836.0, 2961.0, 18848.0, 867112.0, 147655.0, 7825.0, 1773.0, 561.0, 195.0, 94.0, 44.0, 32.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.2783203125, -9.806640625, -9.3349609375, -8.86328125, -8.3916015625, -7.919921875, -7.4482421875, -6.9765625, -6.5048828125, -6.033203125, -5.5615234375, -5.08984375, -4.6181640625, -4.146484375, -3.6748046875, -3.203125, -2.7314453125, -2.259765625, -1.7880859375, -1.31640625, -0.8447265625, -0.373046875, 0.0986328125, 0.5703125, 1.0419921875, 1.513671875, 1.9853515625, 2.45703125, 2.9287109375, 3.400390625, 3.8720703125, 4.34375, 4.8154296875, 5.287109375, 5.7587890625, 6.23046875, 6.7021484375, 7.173828125, 7.6455078125, 8.1171875, 8.5888671875, 9.060546875, 9.5322265625, 10.00390625, 10.4755859375, 10.947265625, 11.4189453125, 11.890625, 12.3623046875, 12.833984375, 13.3056640625, 13.77734375, 14.2490234375, 14.720703125, 15.1923828125, 15.6640625, 16.1357421875, 16.607421875, 17.0791015625, 17.55078125, 18.0224609375, 18.494140625, 18.9658203125, 19.4375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 11.0, 32.0, 42.0, 76.0, 180.0, 317.0, 140.0, 77.0, 41.0, 19.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.2879638671875, -8.935302734375, -8.5826416015625, -8.22998046875, -7.8773193359375, -7.524658203125, -7.1719970703125, -6.8193359375, -6.4666748046875, -6.114013671875, -5.7613525390625, -5.40869140625, -5.0560302734375, -4.703369140625, -4.3507080078125, -3.998046875, -3.6453857421875, -3.292724609375, -2.9400634765625, -2.58740234375, -2.2347412109375, -1.882080078125, -1.5294189453125, -1.1767578125, -0.8240966796875, -0.471435546875, -0.1187744140625, 0.23388671875, 0.5865478515625, 0.939208984375, 1.2918701171875, 1.64453125, 1.9971923828125, 2.349853515625, 2.7025146484375, 3.05517578125, 3.4078369140625, 3.760498046875, 4.1131591796875, 4.4658203125, 4.8184814453125, 5.171142578125, 5.5238037109375, 5.87646484375, 6.2291259765625, 6.581787109375, 6.9344482421875, 7.287109375, 7.6397705078125, 7.992431640625, 8.3450927734375, 8.69775390625, 9.0504150390625, 9.403076171875, 9.7557373046875, 10.1083984375, 10.4610595703125, 10.813720703125, 11.1663818359375, 11.51904296875, 11.8717041015625, 12.224365234375, 12.5770263671875, 12.9296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 8.0, 21.0, 34.0, 67.0, 114.0, 193.0, 198.0, 158.0, 94.0, 50.0, 28.0, 18.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.35716247558594, -71.17179870605469, -67.98644256591797, -64.80107879638672, -61.615718841552734, -58.43035888671875, -55.2449951171875, -52.059635162353516, -48.87427520751953, -45.68891525268555, -42.50355529785156, -39.31819152832031, -36.13283157348633, -32.947471618652344, -29.762109756469727, -26.57674789428711, -23.391387939453125, -20.20602798461914, -17.020666122436523, -13.835305213928223, -10.649944305419922, -7.464583396911621, -4.27922248840332, -1.0938606262207031, 2.0914993286132812, 5.276860237121582, 8.462221145629883, 11.647582054138184, 14.832942962646484, 18.01830291748047, 21.203664779663086, 24.389026641845703, 27.574386596679688, 30.759746551513672, 33.945106506347656, 37.130470275878906, 40.31583023071289, 43.501190185546875, 46.686553955078125, 49.87191390991211, 53.057273864746094, 56.24263381958008, 59.42799377441406, 62.61335754394531, 65.79872131347656, 68.98407745361328, 72.16944122314453, 75.35479736328125, 78.5401611328125, 81.72552490234375, 84.91088104248047, 88.09624481201172, 91.28160095214844, 94.46696472167969, 97.65232849121094, 100.83769226074219, 104.0230484008789, 107.20841217041016, 110.39376831054688, 113.57913208007812, 116.76449584960938, 119.9498519897461, 123.13521575927734, 126.32057189941406, 129.5059356689453]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 8.0, 6.0, 5.0, 7.0, 11.0, 15.0, 14.0, 15.0, 15.0, 16.0, 29.0, 20.0, 43.0, 35.0, 54.0, 45.0, 55.0, 40.0, 60.0, 51.0, 42.0, 57.0, 50.0, 48.0, 39.0, 36.0, 26.0, 28.0, 28.0, 24.0, 20.0, 8.0, 15.0, 11.0, 5.0, 7.0, 5.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.42919921875, -52.488861083984375, -50.54852294921875, -48.60818099975586, -46.667842864990234, -44.72750473022461, -42.78716278076172, -40.846824645996094, -38.90648651123047, -36.966148376464844, -35.02581024169922, -33.08546829223633, -31.145130157470703, -29.204792022705078, -27.26445198059082, -25.324111938476562, -23.383773803710938, -21.443435668945312, -19.503095626831055, -17.562755584716797, -15.622417449951172, -13.68207836151123, -11.741739273071289, -9.801400184631348, -7.861061096191406, -5.920722007751465, -3.9803829193115234, -2.040043830871582, -0.09970474243164062, 1.8406343460083008, 3.780973434448242, 5.721312522888184, 7.661651611328125, 9.601990699768066, 11.542329788208008, 13.48266887664795, 15.42300796508789, 17.363346099853516, 19.303686141967773, 21.24402618408203, 23.184364318847656, 25.12470245361328, 27.06504249572754, 29.005382537841797, 30.945720672607422, 32.88605880737305, 34.82640075683594, 36.76673889160156, 38.70707702636719, 40.64741516113281, 42.58775329589844, 44.52809524536133, 46.46843338012695, 48.40877151489258, 50.34911346435547, 52.289451599121094, 54.22978973388672, 56.170127868652344, 58.11046600341797, 60.05080795288086, 61.991146087646484, 63.93148422241211, 65.871826171875, 67.81216430664062, 69.75250244140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 0.0, 8.0, 9.0, 10.0, 18.0, 24.0, 32.0, 46.0, 66.0, 124.0, 186.0, 279.0, 520.0, 1051.0, 2066.0, 5417.0, 15865.0, 72571.0, 3311046.0, 718130.0, 47210.0, 12030.0, 4006.0, 1668.0, 812.0, 436.0, 209.0, 134.0, 95.0, 60.0, 46.0, 30.0, 26.0, 15.0, 8.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.023681640625, -8.68798828125, -8.352294921875, -8.0166015625, -7.680908203125, -7.34521484375, -7.009521484375, -6.673828125, -6.338134765625, -6.00244140625, -5.666748046875, -5.3310546875, -4.995361328125, -4.65966796875, -4.323974609375, -3.98828125, -3.652587890625, -3.31689453125, -2.981201171875, -2.6455078125, -2.309814453125, -1.97412109375, -1.638427734375, -1.302734375, -0.967041015625, -0.63134765625, -0.295654296875, 0.0400390625, 0.375732421875, 0.71142578125, 1.047119140625, 1.3828125, 1.718505859375, 2.05419921875, 2.389892578125, 2.7255859375, 3.061279296875, 3.39697265625, 3.732666015625, 4.068359375, 4.404052734375, 4.73974609375, 5.075439453125, 5.4111328125, 5.746826171875, 6.08251953125, 6.418212890625, 6.75390625, 7.089599609375, 7.42529296875, 7.760986328125, 8.0966796875, 8.432373046875, 8.76806640625, 9.103759765625, 9.439453125, 9.775146484375, 10.11083984375, 10.446533203125, 10.7822265625, 11.117919921875, 11.45361328125, 11.789306640625, 12.125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 12.0, 7.0, 4.0, 15.0, 16.0, 11.0, 20.0, 30.0, 26.0, 32.0, 21.0, 38.0, 46.0, 56.0, 50.0, 51.0, 51.0, 52.0, 59.0, 46.0, 52.0, 48.0, 39.0, 43.0, 26.0, 29.0, 26.0, 20.0, 16.0, 16.0, 11.0, 8.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.435546875, -2.354461669921875, -2.27337646484375, -2.192291259765625, -2.1112060546875, -2.030120849609375, -1.94903564453125, -1.867950439453125, -1.786865234375, -1.705780029296875, -1.62469482421875, -1.543609619140625, -1.4625244140625, -1.381439208984375, -1.30035400390625, -1.219268798828125, -1.13818359375, -1.057098388671875, -0.97601318359375, -0.894927978515625, -0.8138427734375, -0.732757568359375, -0.65167236328125, -0.570587158203125, -0.489501953125, -0.408416748046875, -0.32733154296875, -0.246246337890625, -0.1651611328125, -0.084075927734375, -0.00299072265625, 0.078094482421875, 0.1591796875, 0.240264892578125, 0.32135009765625, 0.402435302734375, 0.4835205078125, 0.564605712890625, 0.64569091796875, 0.726776123046875, 0.807861328125, 0.888946533203125, 0.97003173828125, 1.051116943359375, 1.1322021484375, 1.213287353515625, 1.29437255859375, 1.375457763671875, 1.45654296875, 1.537628173828125, 1.61871337890625, 1.699798583984375, 1.7808837890625, 1.861968994140625, 1.94305419921875, 2.024139404296875, 2.105224609375, 2.186309814453125, 2.26739501953125, 2.348480224609375, 2.4295654296875, 2.510650634765625, 2.59173583984375, 2.672821044921875, 2.75390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 0.0, 8.0, 17.0, 22.0, 32.0, 35.0, 46.0, 88.0, 120.0, 237.0, 409.0, 958.0, 2386.0, 9952.0, 103256.0, 3937501.0, 123785.0, 10727.0, 2685.0, 956.0, 422.0, 233.0, 142.0, 79.0, 56.0, 35.0, 30.0, 18.0, 19.0, 9.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.59375, -15.09912109375, -14.6044921875, -14.10986328125, -13.615234375, -13.12060546875, -12.6259765625, -12.13134765625, -11.63671875, -11.14208984375, -10.6474609375, -10.15283203125, -9.658203125, -9.16357421875, -8.6689453125, -8.17431640625, -7.6796875, -7.18505859375, -6.6904296875, -6.19580078125, -5.701171875, -5.20654296875, -4.7119140625, -4.21728515625, -3.72265625, -3.22802734375, -2.7333984375, -2.23876953125, -1.744140625, -1.24951171875, -0.7548828125, -0.26025390625, 0.234375, 0.72900390625, 1.2236328125, 1.71826171875, 2.212890625, 2.70751953125, 3.2021484375, 3.69677734375, 4.19140625, 4.68603515625, 5.1806640625, 5.67529296875, 6.169921875, 6.66455078125, 7.1591796875, 7.65380859375, 8.1484375, 8.64306640625, 9.1376953125, 9.63232421875, 10.126953125, 10.62158203125, 11.1162109375, 11.61083984375, 12.10546875, 12.60009765625, 13.0947265625, 13.58935546875, 14.083984375, 14.57861328125, 15.0732421875, 15.56787109375, 16.0625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 22.0, 47.0, 82.0, 389.0, 2925.0, 413.0, 103.0, 39.0, 18.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.5421142578125, -8.193603515625, -7.8450927734375, -7.49658203125, -7.1480712890625, -6.799560546875, -6.4510498046875, -6.1025390625, -5.7540283203125, -5.405517578125, -5.0570068359375, -4.70849609375, -4.3599853515625, -4.011474609375, -3.6629638671875, -3.314453125, -2.9659423828125, -2.617431640625, -2.2689208984375, -1.92041015625, -1.5718994140625, -1.223388671875, -0.8748779296875, -0.5263671875, -0.1778564453125, 0.170654296875, 0.5191650390625, 0.86767578125, 1.2161865234375, 1.564697265625, 1.9132080078125, 2.26171875, 2.6102294921875, 2.958740234375, 3.3072509765625, 3.65576171875, 4.0042724609375, 4.352783203125, 4.7012939453125, 5.0498046875, 5.3983154296875, 5.746826171875, 6.0953369140625, 6.44384765625, 6.7923583984375, 7.140869140625, 7.4893798828125, 7.837890625, 8.1864013671875, 8.534912109375, 8.8834228515625, 9.23193359375, 9.5804443359375, 9.928955078125, 10.2774658203125, 10.6259765625, 10.9744873046875, 11.322998046875, 11.6715087890625, 12.02001953125, 12.3685302734375, 12.717041015625, 13.0655517578125, 13.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 13.0, 20.0, 44.0, 39.0, 69.0, 104.0, 118.0, 129.0, 119.0, 93.0, 69.0, 43.0, 39.0, 25.0, 15.0, 7.0, 9.0, 6.0, 6.0, 4.0, 1.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.337881088256836, -12.686314582824707, -12.034748077392578, -11.38318157196045, -10.73161506652832, -10.080049514770508, -9.428483009338379, -8.77691650390625, -8.125349998474121, -7.473783493041992, -6.822216987609863, -6.170650959014893, -5.519084453582764, -4.867517948150635, -4.215951919555664, -3.564385414123535, -2.9128189086914062, -2.2612524032592773, -1.6096861362457275, -0.9581197500228882, -0.30655336380004883, 0.3450131416320801, 0.9965794086456299, 1.6481456756591797, 2.2997121810913086, 2.9512786865234375, 3.6028449535369873, 4.254411220550537, 4.905977725982666, 5.557544231414795, 6.209110260009766, 6.8606767654418945, 7.512243270874023, 8.163809776306152, 8.815376281738281, 9.46694278717041, 10.118509292602539, 10.770074844360352, 11.42164134979248, 12.07320785522461, 12.724774360656738, 13.376340866088867, 14.027907371520996, 14.679473876953125, 15.331039428710938, 15.982606887817383, 16.634172439575195, 17.28573989868164, 17.937305450439453, 18.588871002197266, 19.24043846130371, 19.892004013061523, 20.54357147216797, 21.19513702392578, 21.846704483032227, 22.49827003479004, 23.149837493896484, 23.801403045654297, 24.452970504760742, 25.104536056518555, 25.756103515625, 26.407669067382812, 27.059236526489258, 27.71080207824707, 28.362367630004883]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 10.0, 12.0, 10.0, 19.0, 20.0, 26.0, 22.0, 33.0, 33.0, 35.0, 25.0, 39.0, 29.0, 40.0, 47.0, 42.0, 38.0, 41.0, 49.0, 28.0, 35.0, 29.0, 33.0, 34.0, 35.0, 34.0, 24.0, 21.0, 28.0, 18.0, 16.0, 11.0, 12.0, 10.0, 8.0, 7.0, 9.0, 4.0, 6.0, 0.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-16.175437927246094, -15.715279579162598, -15.255121231079102, -14.794962882995605, -14.33480453491211, -13.874646186828613, -13.414487838745117, -12.954328536987305, -12.494171142578125, -12.034012794494629, -11.573854446411133, -11.113696098327637, -10.65353775024414, -10.193379402160645, -9.733221054077148, -9.273061752319336, -8.81290340423584, -8.352745056152344, -7.892586708068848, -7.432428359985352, -6.9722700119018555, -6.512111663818359, -6.051952838897705, -5.591794490814209, -5.131636142730713, -4.671477794647217, -4.211319446563721, -3.7511608600616455, -3.2910025119781494, -2.8308441638946533, -2.370685577392578, -1.910527229309082, -1.4503679275512695, -0.9902095198631287, -0.5300511121749878, -0.06989264488220215, 0.39026570320129395, 0.85042405128479, 1.3105826377868652, 1.7707409858703613, 2.2308993339538574, 2.6910576820373535, 3.1512160301208496, 3.611374616622925, 4.071533203125, 4.531691551208496, 4.991849899291992, 5.452008247375488, 5.912166595458984, 6.3723249435424805, 6.832483291625977, 7.292641639709473, 7.752799987792969, 8.212958335876465, 8.673116683959961, 9.133275985717773, 9.593433380126953, 10.05359172821045, 10.513750076293945, 10.973908424377441, 11.434066772460938, 11.894225120544434, 12.35438346862793, 12.814542770385742, 13.274701118469238]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 11.0, 10.0, 19.0, 27.0, 40.0, 55.0, 84.0, 139.0, 205.0, 291.0, 504.0, 691.0, 1169.0, 2009.0, 3325.0, 5885.0, 10305.0, 19569.0, 38027.0, 79786.0, 165158.0, 263119.0, 224439.0, 117599.0, 55320.0, 27624.0, 14355.0, 7745.0, 4435.0, 2491.0, 1514.0, 899.0, 607.0, 378.0, 256.0, 143.0, 94.0, 68.0, 59.0, 29.0, 19.0, 20.0, 8.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.97265625, -4.82086181640625, -4.6690673828125, -4.51727294921875, -4.365478515625, -4.21368408203125, -4.0618896484375, -3.91009521484375, -3.75830078125, -3.60650634765625, -3.4547119140625, -3.30291748046875, -3.151123046875, -2.99932861328125, -2.8475341796875, -2.69573974609375, -2.5439453125, -2.39215087890625, -2.2403564453125, -2.08856201171875, -1.936767578125, -1.78497314453125, -1.6331787109375, -1.48138427734375, -1.32958984375, -1.17779541015625, -1.0260009765625, -0.87420654296875, -0.722412109375, -0.57061767578125, -0.4188232421875, -0.26702880859375, -0.115234375, 0.03656005859375, 0.1883544921875, 0.34014892578125, 0.491943359375, 0.64373779296875, 0.7955322265625, 0.94732666015625, 1.09912109375, 1.25091552734375, 1.4027099609375, 1.55450439453125, 1.706298828125, 1.85809326171875, 2.0098876953125, 2.16168212890625, 2.3134765625, 2.46527099609375, 2.6170654296875, 2.76885986328125, 2.920654296875, 3.07244873046875, 3.2242431640625, 3.37603759765625, 3.52783203125, 3.67962646484375, 3.8314208984375, 3.98321533203125, 4.135009765625, 4.28680419921875, 4.4385986328125, 4.59039306640625, 4.7421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 7.0, 10.0, 18.0, 15.0, 15.0, 21.0, 30.0, 30.0, 30.0, 33.0, 45.0, 42.0, 49.0, 54.0, 40.0, 52.0, 53.0, 52.0, 53.0, 46.0, 38.0, 38.0, 41.0, 25.0, 21.0, 25.0, 19.0, 17.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.521453857421875, -2.44134521484375, -2.361236572265625, -2.2811279296875, -2.201019287109375, -2.12091064453125, -2.040802001953125, -1.960693359375, -1.880584716796875, -1.80047607421875, -1.720367431640625, -1.6402587890625, -1.560150146484375, -1.48004150390625, -1.399932861328125, -1.31982421875, -1.239715576171875, -1.15960693359375, -1.079498291015625, -0.9993896484375, -0.919281005859375, -0.83917236328125, -0.759063720703125, -0.678955078125, -0.598846435546875, -0.51873779296875, -0.438629150390625, -0.3585205078125, -0.278411865234375, -0.19830322265625, -0.118194580078125, -0.0380859375, 0.042022705078125, 0.12213134765625, 0.202239990234375, 0.2823486328125, 0.362457275390625, 0.44256591796875, 0.522674560546875, 0.602783203125, 0.682891845703125, 0.76300048828125, 0.843109130859375, 0.9232177734375, 1.003326416015625, 1.08343505859375, 1.163543701171875, 1.24365234375, 1.323760986328125, 1.40386962890625, 1.483978271484375, 1.5640869140625, 1.644195556640625, 1.72430419921875, 1.804412841796875, 1.884521484375, 1.964630126953125, 2.04473876953125, 2.124847412109375, 2.2049560546875, 2.285064697265625, 2.36517333984375, 2.445281982421875, 2.525390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 10.0, 12.0, 15.0, 18.0, 24.0, 28.0, 53.0, 84.0, 116.0, 205.0, 334.0, 734.0, 1496.0, 3593.0, 9453.0, 29647.0, 111071.0, 417815.0, 349195.0, 86831.0, 24032.0, 7968.0, 3036.0, 1338.0, 580.0, 329.0, 160.0, 105.0, 78.0, 46.0, 42.0, 28.0, 19.0, 18.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.573974609375, -7.31201171875, -7.050048828125, -6.7880859375, -6.526123046875, -6.26416015625, -6.002197265625, -5.740234375, -5.478271484375, -5.21630859375, -4.954345703125, -4.6923828125, -4.430419921875, -4.16845703125, -3.906494140625, -3.64453125, -3.382568359375, -3.12060546875, -2.858642578125, -2.5966796875, -2.334716796875, -2.07275390625, -1.810791015625, -1.548828125, -1.286865234375, -1.02490234375, -0.762939453125, -0.5009765625, -0.239013671875, 0.02294921875, 0.284912109375, 0.546875, 0.808837890625, 1.07080078125, 1.332763671875, 1.5947265625, 1.856689453125, 2.11865234375, 2.380615234375, 2.642578125, 2.904541015625, 3.16650390625, 3.428466796875, 3.6904296875, 3.952392578125, 4.21435546875, 4.476318359375, 4.73828125, 5.000244140625, 5.26220703125, 5.524169921875, 5.7861328125, 6.048095703125, 6.31005859375, 6.572021484375, 6.833984375, 7.095947265625, 7.35791015625, 7.619873046875, 7.8818359375, 8.143798828125, 8.40576171875, 8.667724609375, 8.9296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 10.0, 14.0, 12.0, 18.0, 15.0, 23.0, 27.0, 22.0, 36.0, 47.0, 40.0, 42.0, 55.0, 42.0, 50.0, 54.0, 56.0, 48.0, 48.0, 59.0, 36.0, 41.0, 30.0, 29.0, 28.0, 21.0, 17.0, 18.0, 16.0, 3.0, 12.0, 11.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2890625, -14.8214111328125, -14.353759765625, -13.8861083984375, -13.41845703125, -12.9508056640625, -12.483154296875, -12.0155029296875, -11.5478515625, -11.0802001953125, -10.612548828125, -10.1448974609375, -9.67724609375, -9.2095947265625, -8.741943359375, -8.2742919921875, -7.806640625, -7.3389892578125, -6.871337890625, -6.4036865234375, -5.93603515625, -5.4683837890625, -5.000732421875, -4.5330810546875, -4.0654296875, -3.5977783203125, -3.130126953125, -2.6624755859375, -2.19482421875, -1.7271728515625, -1.259521484375, -0.7918701171875, -0.32421875, 0.1434326171875, 0.611083984375, 1.0787353515625, 1.54638671875, 2.0140380859375, 2.481689453125, 2.9493408203125, 3.4169921875, 3.8846435546875, 4.352294921875, 4.8199462890625, 5.28759765625, 5.7552490234375, 6.222900390625, 6.6905517578125, 7.158203125, 7.6258544921875, 8.093505859375, 8.5611572265625, 9.02880859375, 9.4964599609375, 9.964111328125, 10.4317626953125, 10.8994140625, 11.3670654296875, 11.834716796875, 12.3023681640625, 12.77001953125, 13.2376708984375, 13.705322265625, 14.1729736328125, 14.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 7.0, 4.0, 17.0, 13.0, 14.0, 42.0, 29.0, 61.0, 87.0, 122.0, 180.0, 282.0, 502.0, 937.0, 2255.0, 6155.0, 22095.0, 106468.0, 451488.0, 357360.0, 75123.0, 16424.0, 4856.0, 1848.0, 905.0, 425.0, 272.0, 172.0, 116.0, 84.0, 45.0, 34.0, 39.0, 18.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.751953125, -3.622100830078125, -3.49224853515625, -3.362396240234375, -3.2325439453125, -3.102691650390625, -2.97283935546875, -2.842987060546875, -2.713134765625, -2.583282470703125, -2.45343017578125, -2.323577880859375, -2.1937255859375, -2.063873291015625, -1.93402099609375, -1.804168701171875, -1.67431640625, -1.544464111328125, -1.41461181640625, -1.284759521484375, -1.1549072265625, -1.025054931640625, -0.89520263671875, -0.765350341796875, -0.635498046875, -0.505645751953125, -0.37579345703125, -0.245941162109375, -0.1160888671875, 0.013763427734375, 0.14361572265625, 0.273468017578125, 0.4033203125, 0.533172607421875, 0.66302490234375, 0.792877197265625, 0.9227294921875, 1.052581787109375, 1.18243408203125, 1.312286376953125, 1.442138671875, 1.571990966796875, 1.70184326171875, 1.831695556640625, 1.9615478515625, 2.091400146484375, 2.22125244140625, 2.351104736328125, 2.48095703125, 2.610809326171875, 2.74066162109375, 2.870513916015625, 3.0003662109375, 3.130218505859375, 3.26007080078125, 3.389923095703125, 3.519775390625, 3.649627685546875, 3.77947998046875, 3.909332275390625, 4.0391845703125, 4.169036865234375, 4.29888916015625, 4.428741455078125, 4.55859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 20.0, 25.0, 18.0, 40.0, 39.0, 55.0, 75.0, 63.0, 85.0, 82.0, 84.0, 78.0, 65.0, 61.0, 39.0, 43.0, 26.0, 24.0, 17.0, 8.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0008087158203125, -0.0007883831858634949, -0.0007680505514144897, -0.0007477179169654846, -0.0007273852825164795, -0.0007070526480674744, -0.0006867200136184692, -0.0006663873791694641, -0.000646054744720459, -0.0006257221102714539, -0.0006053894758224487, -0.0005850568413734436, -0.0005647242069244385, -0.0005443915724754333, -0.0005240589380264282, -0.0005037263035774231, -0.00048339366912841797, -0.00046306103467941284, -0.0004427284002304077, -0.0004223957657814026, -0.00040206313133239746, -0.00038173049688339233, -0.0003613978624343872, -0.0003410652279853821, -0.00032073259353637695, -0.0003003999590873718, -0.0002800673246383667, -0.00025973469018936157, -0.00023940205574035645, -0.00021906942129135132, -0.0001987367868423462, -0.00017840415239334106, -0.00015807151794433594, -0.0001377388834953308, -0.00011740624904632568, -9.707361459732056e-05, -7.674098014831543e-05, -5.64083456993103e-05, -3.6075711250305176e-05, -1.574307680130005e-05, 4.589557647705078e-06, 2.4922192096710205e-05, 4.525482654571533e-05, 6.558746099472046e-05, 8.592009544372559e-05, 0.00010625272989273071, 0.00012658536434173584, 0.00014691799879074097, 0.0001672506332397461, 0.00018758326768875122, 0.00020791590213775635, 0.00022824853658676147, 0.0002485811710357666, 0.00026891380548477173, 0.00028924643993377686, 0.000309579074382782, 0.0003299117088317871, 0.00035024434328079224, 0.00037057697772979736, 0.0003909096121788025, 0.0004112422466278076, 0.00043157488107681274, 0.00045190751552581787, 0.000472240149974823, 0.0004925727844238281]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 15.0, 12.0, 18.0, 29.0, 34.0, 58.0, 73.0, 136.0, 265.0, 376.0, 659.0, 1315.0, 3048.0, 7853.0, 25831.0, 97221.0, 331244.0, 398133.0, 130851.0, 33977.0, 10110.0, 3658.0, 1645.0, 819.0, 421.0, 283.0, 141.0, 109.0, 62.0, 40.0, 33.0, 18.0, 13.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.939605712890625, -3.82061767578125, -3.701629638671875, -3.5826416015625, -3.463653564453125, -3.34466552734375, -3.225677490234375, -3.106689453125, -2.987701416015625, -2.86871337890625, -2.749725341796875, -2.6307373046875, -2.511749267578125, -2.39276123046875, -2.273773193359375, -2.15478515625, -2.035797119140625, -1.91680908203125, -1.797821044921875, -1.6788330078125, -1.559844970703125, -1.44085693359375, -1.321868896484375, -1.202880859375, -1.083892822265625, -0.96490478515625, -0.845916748046875, -0.7269287109375, -0.607940673828125, -0.48895263671875, -0.369964599609375, -0.2509765625, -0.131988525390625, -0.01300048828125, 0.105987548828125, 0.2249755859375, 0.343963623046875, 0.46295166015625, 0.581939697265625, 0.700927734375, 0.819915771484375, 0.93890380859375, 1.057891845703125, 1.1768798828125, 1.295867919921875, 1.41485595703125, 1.533843994140625, 1.65283203125, 1.771820068359375, 1.89080810546875, 2.009796142578125, 2.1287841796875, 2.247772216796875, 2.36676025390625, 2.485748291015625, 2.604736328125, 2.723724365234375, 2.84271240234375, 2.961700439453125, 3.0806884765625, 3.199676513671875, 3.31866455078125, 3.437652587890625, 3.556640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 7.0, 10.0, 16.0, 31.0, 36.0, 42.0, 61.0, 66.0, 83.0, 96.0, 105.0, 102.0, 84.0, 55.0, 52.0, 46.0, 32.0, 14.0, 18.0, 6.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.26031494140625, -4.0675048828125, -3.87469482421875, -3.681884765625, -3.48907470703125, -3.2962646484375, -3.10345458984375, -2.91064453125, -2.71783447265625, -2.5250244140625, -2.33221435546875, -2.139404296875, -1.94659423828125, -1.7537841796875, -1.56097412109375, -1.3681640625, -1.17535400390625, -0.9825439453125, -0.78973388671875, -0.596923828125, -0.40411376953125, -0.2113037109375, -0.01849365234375, 0.17431640625, 0.36712646484375, 0.5599365234375, 0.75274658203125, 0.945556640625, 1.13836669921875, 1.3311767578125, 1.52398681640625, 1.716796875, 1.90960693359375, 2.1024169921875, 2.29522705078125, 2.488037109375, 2.68084716796875, 2.8736572265625, 3.06646728515625, 3.25927734375, 3.45208740234375, 3.6448974609375, 3.83770751953125, 4.030517578125, 4.22332763671875, 4.4161376953125, 4.60894775390625, 4.8017578125, 4.99456787109375, 5.1873779296875, 5.38018798828125, 5.572998046875, 5.76580810546875, 5.9586181640625, 6.15142822265625, 6.34423828125, 6.53704833984375, 6.7298583984375, 6.92266845703125, 7.115478515625, 7.30828857421875, 7.5010986328125, 7.69390869140625, 7.88671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 6.0, 12.0, 13.0, 38.0, 107.0, 130.0, 214.0, 201.0, 107.0, 80.0, 37.0, 29.0, 12.0, 9.0, 4.0, 4.0, 2.0], "bins": [-167.0768585205078, -163.9799041748047, -160.88294982910156, -157.78599548339844, -154.6890411376953, -151.59207153320312, -148.4951171875, -145.39816284179688, -142.30120849609375, -139.20425415039062, -136.1072998046875, -133.01034545898438, -129.91339111328125, -126.8164291381836, -123.71947479248047, -120.62251281738281, -117.52555847167969, -114.42860412597656, -111.33164978027344, -108.23468780517578, -105.13773345947266, -102.04077911376953, -98.9438247680664, -95.84686279296875, -92.74991607666016, -89.65296173095703, -86.5560073852539, -83.45904541015625, -80.36209106445312, -77.26513671875, -74.16818237304688, -71.07122802734375, -67.9742660522461, -64.87731170654297, -61.78035354614258, -58.68339920043945, -55.58644104003906, -52.48948669433594, -49.39253234863281, -46.29557418823242, -43.1986198425293, -40.10166549682617, -37.00470733642578, -33.907752990722656, -30.810794830322266, -27.71384048461914, -24.616884231567383, -21.519927978515625, -18.422971725463867, -15.32601547241211, -12.229059219360352, -9.13210391998291, -6.035147666931152, -2.9381914138793945, 0.15876388549804688, 3.2557201385498047, 6.3526763916015625, 9.44963264465332, 12.546588897705078, 15.64354419708252, 18.740501403808594, 21.83745574951172, 24.934412002563477, 28.031368255615234, 31.128324508666992]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 10.0, 9.0, 16.0, 10.0, 12.0, 18.0, 21.0, 18.0, 31.0, 34.0, 39.0, 33.0, 36.0, 55.0, 50.0, 53.0, 58.0, 48.0, 37.0, 51.0, 43.0, 46.0, 32.0, 37.0, 35.0, 30.0, 25.0, 21.0, 17.0, 10.0, 8.0, 8.0, 19.0, 5.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.867942810058594, -60.53141784667969, -58.19489288330078, -55.858367919921875, -53.52184295654297, -51.18531799316406, -48.84879684448242, -46.512271881103516, -44.17574691772461, -41.8392219543457, -39.5026969909668, -37.16617202758789, -34.82965087890625, -32.493125915527344, -30.156600952148438, -27.82007598876953, -25.483551025390625, -23.14702606201172, -20.810501098632812, -18.47397804260254, -16.137453079223633, -13.800928115844727, -11.464404106140137, -9.127880096435547, -6.791355133056641, -4.454830646514893, -2.1183061599731445, 0.21821832656860352, 2.5547428131103516, 4.891267776489258, 7.227791786193848, 9.564315795898438, 11.900848388671875, 14.237373352050781, 16.573898315429688, 18.91042137145996, 21.246946334838867, 23.583471298217773, 25.919994354248047, 28.256519317626953, 30.59304428100586, 32.929569244384766, 35.26609420776367, 37.60261917114258, 39.93914031982422, 42.275665283203125, 44.61219024658203, 46.94871520996094, 49.285240173339844, 51.62176513671875, 53.958290100097656, 56.29481506347656, 58.63134002685547, 60.967864990234375, 63.304386138916016, 65.64091491699219, 67.97743225097656, 70.31395721435547, 72.65048217773438, 74.98700714111328, 77.32353210449219, 79.6600570678711, 81.99658203125, 84.33309936523438, 86.66963195800781]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 8.0, 4.0, 6.0, 4.0, 9.0, 16.0, 27.0, 45.0, 42.0, 77.0, 97.0, 132.0, 231.0, 330.0, 585.0, 994.0, 1932.0, 4167.0, 9585.0, 31188.0, 259536.0, 3791520.0, 66310.0, 15477.0, 5885.0, 2685.0, 1414.0, 759.0, 440.0, 248.0, 156.0, 104.0, 87.0, 62.0, 40.0, 20.0, 18.0, 17.0, 10.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.80859375, -6.55853271484375, -6.3084716796875, -6.05841064453125, -5.808349609375, -5.55828857421875, -5.3082275390625, -5.05816650390625, -4.80810546875, -4.55804443359375, -4.3079833984375, -4.05792236328125, -3.807861328125, -3.55780029296875, -3.3077392578125, -3.05767822265625, -2.8076171875, -2.55755615234375, -2.3074951171875, -2.05743408203125, -1.807373046875, -1.55731201171875, -1.3072509765625, -1.05718994140625, -0.80712890625, -0.55706787109375, -0.3070068359375, -0.05694580078125, 0.193115234375, 0.44317626953125, 0.6932373046875, 0.94329833984375, 1.193359375, 1.44342041015625, 1.6934814453125, 1.94354248046875, 2.193603515625, 2.44366455078125, 2.6937255859375, 2.94378662109375, 3.19384765625, 3.44390869140625, 3.6939697265625, 3.94403076171875, 4.194091796875, 4.44415283203125, 4.6942138671875, 4.94427490234375, 5.1943359375, 5.44439697265625, 5.6944580078125, 5.94451904296875, 6.194580078125, 6.44464111328125, 6.6947021484375, 6.94476318359375, 7.19482421875, 7.44488525390625, 7.6949462890625, 7.94500732421875, 8.195068359375, 8.44512939453125, 8.6951904296875, 8.94525146484375, 9.1953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 6.0, 5.0, 10.0, 9.0, 12.0, 13.0, 21.0, 29.0, 23.0, 28.0, 33.0, 37.0, 30.0, 46.0, 35.0, 52.0, 44.0, 58.0, 54.0, 44.0, 52.0, 40.0, 44.0, 44.0, 47.0, 28.0, 25.0, 26.0, 15.0, 18.0, 15.0, 12.0, 7.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8828125, -2.7855224609375, -2.688232421875, -2.5909423828125, -2.49365234375, -2.3963623046875, -2.299072265625, -2.2017822265625, -2.1044921875, -2.0072021484375, -1.909912109375, -1.8126220703125, -1.71533203125, -1.6180419921875, -1.520751953125, -1.4234619140625, -1.326171875, -1.2288818359375, -1.131591796875, -1.0343017578125, -0.93701171875, -0.8397216796875, -0.742431640625, -0.6451416015625, -0.5478515625, -0.4505615234375, -0.353271484375, -0.2559814453125, -0.15869140625, -0.0614013671875, 0.035888671875, 0.1331787109375, 0.23046875, 0.3277587890625, 0.425048828125, 0.5223388671875, 0.61962890625, 0.7169189453125, 0.814208984375, 0.9114990234375, 1.0087890625, 1.1060791015625, 1.203369140625, 1.3006591796875, 1.39794921875, 1.4952392578125, 1.592529296875, 1.6898193359375, 1.787109375, 1.8843994140625, 1.981689453125, 2.0789794921875, 2.17626953125, 2.2735595703125, 2.370849609375, 2.4681396484375, 2.5654296875, 2.6627197265625, 2.760009765625, 2.8572998046875, 2.95458984375, 3.0518798828125, 3.149169921875, 3.2464599609375, 3.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 20.0, 20.0, 26.0, 27.0, 22.0, 33.0, 45.0, 57.0, 65.0, 121.0, 167.0, 256.0, 417.0, 720.0, 1442.0, 3083.0, 9955.0, 71493.0, 3935592.0, 147868.0, 14586.0, 4128.0, 1702.0, 910.0, 521.0, 303.0, 173.0, 129.0, 84.0, 54.0, 51.0, 29.0, 42.0, 31.0, 18.0, 18.0, 13.0, 12.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.31787109375, -10.9482421875, -10.57861328125, -10.208984375, -9.83935546875, -9.4697265625, -9.10009765625, -8.73046875, -8.36083984375, -7.9912109375, -7.62158203125, -7.251953125, -6.88232421875, -6.5126953125, -6.14306640625, -5.7734375, -5.40380859375, -5.0341796875, -4.66455078125, -4.294921875, -3.92529296875, -3.5556640625, -3.18603515625, -2.81640625, -2.44677734375, -2.0771484375, -1.70751953125, -1.337890625, -0.96826171875, -0.5986328125, -0.22900390625, 0.140625, 0.51025390625, 0.8798828125, 1.24951171875, 1.619140625, 1.98876953125, 2.3583984375, 2.72802734375, 3.09765625, 3.46728515625, 3.8369140625, 4.20654296875, 4.576171875, 4.94580078125, 5.3154296875, 5.68505859375, 6.0546875, 6.42431640625, 6.7939453125, 7.16357421875, 7.533203125, 7.90283203125, 8.2724609375, 8.64208984375, 9.01171875, 9.38134765625, 9.7509765625, 10.12060546875, 10.490234375, 10.85986328125, 11.2294921875, 11.59912109375, 11.96875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 13.0, 39.0, 144.0, 2664.0, 975.0, 123.0, 46.0, 22.0, 15.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.320831298828125, -2.21002197265625, -2.099212646484375, -1.9884033203125, -1.877593994140625, -1.76678466796875, -1.655975341796875, -1.545166015625, -1.434356689453125, -1.32354736328125, -1.212738037109375, -1.1019287109375, -0.991119384765625, -0.88031005859375, -0.769500732421875, -0.65869140625, -0.547882080078125, -0.43707275390625, -0.326263427734375, -0.2154541015625, -0.104644775390625, 0.00616455078125, 0.116973876953125, 0.227783203125, 0.338592529296875, 0.44940185546875, 0.560211181640625, 0.6710205078125, 0.781829833984375, 0.89263916015625, 1.003448486328125, 1.1142578125, 1.225067138671875, 1.33587646484375, 1.446685791015625, 1.5574951171875, 1.668304443359375, 1.77911376953125, 1.889923095703125, 2.000732421875, 2.111541748046875, 2.22235107421875, 2.333160400390625, 2.4439697265625, 2.554779052734375, 2.66558837890625, 2.776397705078125, 2.88720703125, 2.998016357421875, 3.10882568359375, 3.219635009765625, 3.3304443359375, 3.441253662109375, 3.55206298828125, 3.662872314453125, 3.773681640625, 3.884490966796875, 3.99530029296875, 4.106109619140625, 4.2169189453125, 4.327728271484375, 4.43853759765625, 4.549346923828125, 4.66015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 21.0, 21.0, 44.0, 81.0, 174.0, 173.0, 161.0, 127.0, 80.0, 52.0, 29.0, 12.0, 9.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.312112808227539, -9.902215957641602, -9.49232006072998, -9.08242416381836, -8.672527313232422, -8.262630462646484, -7.852734565734863, -7.442838191986084, -7.032941818237305, -6.623045444488525, -6.213149070739746, -5.803252696990967, -5.3933563232421875, -4.983459949493408, -4.573563575744629, -4.16366720199585, -3.7537708282470703, -3.343874454498291, -2.9339780807495117, -2.5240817070007324, -2.114185333251953, -1.7042889595031738, -1.2943925857543945, -0.8844962120056152, -0.47459983825683594, -0.06470346450805664, 0.34519290924072266, 0.755089282989502, 1.1649856567382812, 1.5748820304870605, 1.9847784042358398, 2.394674777984619, 2.8045711517333984, 3.2144675254821777, 3.624363899230957, 4.034260272979736, 4.444156646728516, 4.854053020477295, 5.263949394226074, 5.6738457679748535, 6.083742141723633, 6.493638515472412, 6.903534889221191, 7.313431262969971, 7.72332763671875, 8.133224487304688, 8.543120384216309, 8.95301628112793, 9.362913131713867, 9.772809982299805, 10.182705879211426, 10.592601776123047, 11.002498626708984, 11.412395477294922, 11.822291374206543, 12.232187271118164, 12.642084121704102, 13.051980972290039, 13.46187686920166, 13.871772766113281, 14.281669616699219, 14.691566467285156, 15.101462364196777, 15.511358261108398, 15.921255111694336]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 12.0, 13.0, 24.0, 27.0, 15.0, 26.0, 17.0, 29.0, 31.0, 34.0, 32.0, 37.0, 43.0, 36.0, 32.0, 51.0, 30.0, 42.0, 25.0, 37.0, 33.0, 42.0, 23.0, 34.0, 30.0, 20.0, 18.0, 24.0, 21.0, 21.0, 22.0, 22.0, 18.0, 11.0, 6.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-5.945357322692871, -5.77437686920166, -5.603396415710449, -5.432415962219238, -5.2614359855651855, -5.090455532073975, -4.919475078582764, -4.748494625091553, -4.577514171600342, -4.406533718109131, -4.23555326461792, -4.064573287963867, -3.893592596054077, -3.7226123809814453, -3.5516319274902344, -3.3806514739990234, -3.2096712589263916, -3.0386908054351807, -2.867710590362549, -2.696730136871338, -2.525749683380127, -2.354769229888916, -2.183789014816284, -2.0128085613250732, -1.8418282270431519, -1.6708478927612305, -1.4998674392700195, -1.3288871049880981, -1.1579067707061768, -0.9869263172149658, -0.8159459829330444, -0.6449655294418335, -0.4739851951599121, -0.30300480127334595, -0.13202443718910217, 0.0389559268951416, 0.20993632078170776, 0.3809167146682739, 0.5518970489501953, 0.7228775024414062, 0.8938578367233276, 1.064838171005249, 1.23581862449646, 1.4067989587783813, 1.5777792930603027, 1.7487597465515137, 1.919740080833435, 2.0907206535339355, 2.2617008686065674, 2.4326813220977783, 2.60366153717041, 2.774641990661621, 2.945622444152832, 3.116602897644043, 3.287583112716675, 3.4585635662078857, 3.6295437812805176, 3.8005242347717285, 3.9715044498443604, 4.142484664916992, 4.313465118408203, 4.484445571899414, 4.655426025390625, 4.826406478881836, 4.997386932373047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 10.0, 2.0, 9.0, 9.0, 22.0, 27.0, 37.0, 45.0, 108.0, 133.0, 238.0, 387.0, 664.0, 1150.0, 2130.0, 4049.0, 8232.0, 17663.0, 41965.0, 106652.0, 255163.0, 325444.0, 168052.0, 65371.0, 26838.0, 11931.0, 5561.0, 2955.0, 1580.0, 823.0, 464.0, 310.0, 176.0, 105.0, 80.0, 49.0, 43.0, 21.0, 23.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.7734375, -6.556640625, -6.33984375, -6.123046875, -5.90625, -5.689453125, -5.47265625, -5.255859375, -5.0390625, -4.822265625, -4.60546875, -4.388671875, -4.171875, -3.955078125, -3.73828125, -3.521484375, -3.3046875, -3.087890625, -2.87109375, -2.654296875, -2.4375, -2.220703125, -2.00390625, -1.787109375, -1.5703125, -1.353515625, -1.13671875, -0.919921875, -0.703125, -0.486328125, -0.26953125, -0.052734375, 0.1640625, 0.380859375, 0.59765625, 0.814453125, 1.03125, 1.248046875, 1.46484375, 1.681640625, 1.8984375, 2.115234375, 2.33203125, 2.548828125, 2.765625, 2.982421875, 3.19921875, 3.416015625, 3.6328125, 3.849609375, 4.06640625, 4.283203125, 4.5, 4.716796875, 4.93359375, 5.150390625, 5.3671875, 5.583984375, 5.80078125, 6.017578125, 6.234375, 6.451171875, 6.66796875, 6.884765625, 7.1015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 7.0, 4.0, 8.0, 15.0, 6.0, 10.0, 12.0, 24.0, 29.0, 23.0, 25.0, 37.0, 44.0, 36.0, 57.0, 43.0, 43.0, 43.0, 46.0, 51.0, 44.0, 51.0, 40.0, 38.0, 42.0, 36.0, 33.0, 27.0, 18.0, 22.0, 15.0, 19.0, 10.0, 12.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.097747802734375, -2.99237060546875, -2.886993408203125, -2.7816162109375, -2.676239013671875, -2.57086181640625, -2.465484619140625, -2.360107421875, -2.254730224609375, -2.14935302734375, -2.043975830078125, -1.9385986328125, -1.833221435546875, -1.72784423828125, -1.622467041015625, -1.51708984375, -1.411712646484375, -1.30633544921875, -1.200958251953125, -1.0955810546875, -0.990203857421875, -0.88482666015625, -0.779449462890625, -0.674072265625, -0.568695068359375, -0.46331787109375, -0.357940673828125, -0.2525634765625, -0.147186279296875, -0.04180908203125, 0.063568115234375, 0.1689453125, 0.274322509765625, 0.37969970703125, 0.485076904296875, 0.5904541015625, 0.695831298828125, 0.80120849609375, 0.906585693359375, 1.011962890625, 1.117340087890625, 1.22271728515625, 1.328094482421875, 1.4334716796875, 1.538848876953125, 1.64422607421875, 1.749603271484375, 1.85498046875, 1.960357666015625, 2.06573486328125, 2.171112060546875, 2.2764892578125, 2.381866455078125, 2.48724365234375, 2.592620849609375, 2.697998046875, 2.803375244140625, 2.90875244140625, 3.014129638671875, 3.1195068359375, 3.224884033203125, 3.33026123046875, 3.435638427734375, 3.541015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 17.0, 17.0, 18.0, 30.0, 59.0, 89.0, 134.0, 246.0, 565.0, 1174.0, 3001.0, 8845.0, 36185.0, 227739.0, 620178.0, 118496.0, 21795.0, 5994.0, 2041.0, 915.0, 430.0, 215.0, 121.0, 72.0, 51.0, 35.0, 21.0, 21.0, 12.0, 7.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.328125, -12.950927734375, -12.57373046875, -12.196533203125, -11.8193359375, -11.442138671875, -11.06494140625, -10.687744140625, -10.310546875, -9.933349609375, -9.55615234375, -9.178955078125, -8.8017578125, -8.424560546875, -8.04736328125, -7.670166015625, -7.29296875, -6.915771484375, -6.53857421875, -6.161376953125, -5.7841796875, -5.406982421875, -5.02978515625, -4.652587890625, -4.275390625, -3.898193359375, -3.52099609375, -3.143798828125, -2.7666015625, -2.389404296875, -2.01220703125, -1.635009765625, -1.2578125, -0.880615234375, -0.50341796875, -0.126220703125, 0.2509765625, 0.628173828125, 1.00537109375, 1.382568359375, 1.759765625, 2.136962890625, 2.51416015625, 2.891357421875, 3.2685546875, 3.645751953125, 4.02294921875, 4.400146484375, 4.77734375, 5.154541015625, 5.53173828125, 5.908935546875, 6.2861328125, 6.663330078125, 7.04052734375, 7.417724609375, 7.794921875, 8.172119140625, 8.54931640625, 8.926513671875, 9.3037109375, 9.680908203125, 10.05810546875, 10.435302734375, 10.8125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 16.0, 16.0, 27.0, 30.0, 24.0, 46.0, 57.0, 50.0, 63.0, 50.0, 70.0, 73.0, 62.0, 61.0, 53.0, 43.0, 42.0, 35.0, 33.0, 30.0, 17.0, 26.0, 16.0, 12.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.65625, -21.95166015625, -21.2470703125, -20.54248046875, -19.837890625, -19.13330078125, -18.4287109375, -17.72412109375, -17.01953125, -16.31494140625, -15.6103515625, -14.90576171875, -14.201171875, -13.49658203125, -12.7919921875, -12.08740234375, -11.3828125, -10.67822265625, -9.9736328125, -9.26904296875, -8.564453125, -7.85986328125, -7.1552734375, -6.45068359375, -5.74609375, -5.04150390625, -4.3369140625, -3.63232421875, -2.927734375, -2.22314453125, -1.5185546875, -0.81396484375, -0.109375, 0.59521484375, 1.2998046875, 2.00439453125, 2.708984375, 3.41357421875, 4.1181640625, 4.82275390625, 5.52734375, 6.23193359375, 6.9365234375, 7.64111328125, 8.345703125, 9.05029296875, 9.7548828125, 10.45947265625, 11.1640625, 11.86865234375, 12.5732421875, 13.27783203125, 13.982421875, 14.68701171875, 15.3916015625, 16.09619140625, 16.80078125, 17.50537109375, 18.2099609375, 18.91455078125, 19.619140625, 20.32373046875, 21.0283203125, 21.73291015625, 22.4375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 21.0, 15.0, 20.0, 43.0, 92.0, 262.0, 615.0, 1886.0, 7830.0, 71183.0, 817659.0, 133838.0, 11324.0, 2461.0, 789.0, 268.0, 122.0, 56.0, 24.0, 15.0, 5.0, 11.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.98968505859375, -8.7371826171875, -8.48468017578125, -8.232177734375, -7.97967529296875, -7.7271728515625, -7.47467041015625, -7.22216796875, -6.96966552734375, -6.7171630859375, -6.46466064453125, -6.212158203125, -5.95965576171875, -5.7071533203125, -5.45465087890625, -5.2021484375, -4.94964599609375, -4.6971435546875, -4.44464111328125, -4.192138671875, -3.93963623046875, -3.6871337890625, -3.43463134765625, -3.18212890625, -2.92962646484375, -2.6771240234375, -2.42462158203125, -2.172119140625, -1.91961669921875, -1.6671142578125, -1.41461181640625, -1.162109375, -0.90960693359375, -0.6571044921875, -0.40460205078125, -0.152099609375, 0.10040283203125, 0.3529052734375, 0.60540771484375, 0.85791015625, 1.11041259765625, 1.3629150390625, 1.61541748046875, 1.867919921875, 2.12042236328125, 2.3729248046875, 2.62542724609375, 2.8779296875, 3.13043212890625, 3.3829345703125, 3.63543701171875, 3.887939453125, 4.14044189453125, 4.3929443359375, 4.64544677734375, 4.89794921875, 5.15045166015625, 5.4029541015625, 5.65545654296875, 5.907958984375, 6.16046142578125, 6.4129638671875, 6.66546630859375, 6.91796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 17.0, 21.0, 34.0, 46.0, 47.0, 64.0, 109.0, 98.0, 111.0, 90.0, 78.0, 52.0, 70.0, 32.0, 37.0, 20.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009016990661621094, -0.0008774474263191223, -0.0008531957864761353, -0.0008289441466331482, -0.0008046925067901611, -0.0007804408669471741, -0.000756189227104187, -0.0007319375872612, -0.0007076859474182129, -0.0006834343075752258, -0.0006591826677322388, -0.0006349310278892517, -0.0006106793880462646, -0.0005864277482032776, -0.0005621761083602905, -0.0005379244685173035, -0.0005136728286743164, -0.0004894211888313293, -0.0004651695489883423, -0.0004409179091453552, -0.00041666626930236816, -0.0003924146294593811, -0.00036816298961639404, -0.000343911349773407, -0.0003196597099304199, -0.00029540807008743286, -0.0002711564302444458, -0.00024690479040145874, -0.00022265315055847168, -0.00019840151071548462, -0.00017414987087249756, -0.0001498982310295105, -0.00012564659118652344, -0.00010139495134353638, -7.714331150054932e-05, -5.2891671657562256e-05, -2.8640031814575195e-05, -4.388391971588135e-06, 1.9863247871398926e-05, 4.4114887714385986e-05, 6.836652755737305e-05, 9.261816740036011e-05, 0.00011686980724334717, 0.00014112144708633423, 0.0001653730869293213, 0.00018962472677230835, 0.0002138763666152954, 0.00023812800645828247, 0.00026237964630126953, 0.0002866312861442566, 0.00031088292598724365, 0.0003351345658302307, 0.0003593862056732178, 0.00038363784551620483, 0.0004078894853591919, 0.00043214112520217896, 0.000456392765045166, 0.0004806444048881531, 0.0005048960447311401, 0.0005291476845741272, 0.0005533993244171143, 0.0005776509642601013, 0.0006019026041030884, 0.0006261542439460754, 0.0006504058837890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 4.0, 8.0, 22.0, 27.0, 34.0, 68.0, 92.0, 177.0, 324.0, 739.0, 1816.0, 6002.0, 28581.0, 270752.0, 650153.0, 73065.0, 11454.0, 3101.0, 1070.0, 479.0, 239.0, 113.0, 66.0, 43.0, 39.0, 18.0, 17.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.83984375, -7.634765625, -7.4296875, -7.224609375, -7.01953125, -6.814453125, -6.609375, -6.404296875, -6.19921875, -5.994140625, -5.7890625, -5.583984375, -5.37890625, -5.173828125, -4.96875, -4.763671875, -4.55859375, -4.353515625, -4.1484375, -3.943359375, -3.73828125, -3.533203125, -3.328125, -3.123046875, -2.91796875, -2.712890625, -2.5078125, -2.302734375, -2.09765625, -1.892578125, -1.6875, -1.482421875, -1.27734375, -1.072265625, -0.8671875, -0.662109375, -0.45703125, -0.251953125, -0.046875, 0.158203125, 0.36328125, 0.568359375, 0.7734375, 0.978515625, 1.18359375, 1.388671875, 1.59375, 1.798828125, 2.00390625, 2.208984375, 2.4140625, 2.619140625, 2.82421875, 3.029296875, 3.234375, 3.439453125, 3.64453125, 3.849609375, 4.0546875, 4.259765625, 4.46484375, 4.669921875, 4.875, 5.080078125, 5.28515625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 11.0, 11.0, 20.0, 22.0, 25.0, 39.0, 64.0, 88.0, 123.0, 119.0, 132.0, 111.0, 75.0, 51.0, 31.0, 24.0, 18.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.2314453125, -6.970703125, -6.7099609375, -6.44921875, -6.1884765625, -5.927734375, -5.6669921875, -5.40625, -5.1455078125, -4.884765625, -4.6240234375, -4.36328125, -4.1025390625, -3.841796875, -3.5810546875, -3.3203125, -3.0595703125, -2.798828125, -2.5380859375, -2.27734375, -2.0166015625, -1.755859375, -1.4951171875, -1.234375, -0.9736328125, -0.712890625, -0.4521484375, -0.19140625, 0.0693359375, 0.330078125, 0.5908203125, 0.8515625, 1.1123046875, 1.373046875, 1.6337890625, 1.89453125, 2.1552734375, 2.416015625, 2.6767578125, 2.9375, 3.1982421875, 3.458984375, 3.7197265625, 3.98046875, 4.2412109375, 4.501953125, 4.7626953125, 5.0234375, 5.2841796875, 5.544921875, 5.8056640625, 6.06640625, 6.3271484375, 6.587890625, 6.8486328125, 7.109375, 7.3701171875, 7.630859375, 7.8916015625, 8.15234375, 8.4130859375, 8.673828125, 8.9345703125, 9.1953125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 17.0, 31.0, 83.0, 198.0, 297.0, 206.0, 101.0, 37.0, 22.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-240.6915740966797, -235.83929443359375, -230.9870147705078, -226.13473510742188, -221.28245544433594, -216.43017578125, -211.57789611816406, -206.72561645507812, -201.87335205078125, -197.0210723876953, -192.16879272460938, -187.31651306152344, -182.4642333984375, -177.61195373535156, -172.75967407226562, -167.90740966796875, -163.05511474609375, -158.2028350830078, -153.35055541992188, -148.49827575683594, -143.64599609375, -138.79371643066406, -133.94143676757812, -129.08917236328125, -124.23688507080078, -119.38460540771484, -114.5323257446289, -109.68004608154297, -104.82777404785156, -99.97549438476562, -95.12321472167969, -90.27093505859375, -85.41864013671875, -80.56636047363281, -75.71408081054688, -70.86180114746094, -66.009521484375, -61.15724563598633, -56.304969787597656, -51.45269012451172, -46.60041046142578, -41.748130798339844, -36.895851135253906, -32.043575286865234, -27.191295623779297, -22.33901596069336, -17.486738204956055, -12.63446044921875, -7.7821807861328125, -2.9299020767211914, 1.9223766326904297, 6.774655342102051, 11.626934051513672, 16.47921371459961, 21.331491470336914, 26.18376922607422, 31.036048889160156, 35.888328552246094, 40.74060821533203, 45.5928840637207, 50.44516372680664, 55.29744338989258, 60.14971923828125, 65.00199890136719, 69.85427856445312]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 9.0, 6.0, 9.0, 14.0, 10.0, 21.0, 18.0, 14.0, 20.0, 23.0, 26.0, 34.0, 30.0, 37.0, 26.0, 39.0, 41.0, 49.0, 42.0, 34.0, 37.0, 37.0, 43.0, 33.0, 31.0, 42.0, 27.0, 31.0, 35.0, 19.0, 21.0, 13.0, 21.0, 11.0, 7.0, 12.0, 6.0, 4.0, 7.0, 6.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-64.01964569091797, -61.981971740722656, -59.94430160522461, -57.9066276550293, -55.86895751953125, -53.83128356933594, -51.793609619140625, -49.75593566894531, -47.718265533447266, -45.68059158325195, -43.642921447753906, -41.605247497558594, -39.56757354736328, -37.529903411865234, -35.49222946166992, -33.454559326171875, -31.416885375976562, -29.379213333129883, -27.341541290283203, -25.30386734008789, -23.26619529724121, -21.22852325439453, -19.19084930419922, -17.15317726135254, -15.11550521850586, -13.07783317565918, -11.040160179138184, -9.002487182617188, -6.964815139770508, -4.927143096923828, -2.889470100402832, -0.8517971038818359, 1.185882568359375, 3.223555088043213, 5.261227607727051, 7.298900127410889, 9.336572647094727, 11.374244689941406, 13.411917686462402, 15.449590682983398, 17.487262725830078, 19.524934768676758, 21.562606811523438, 23.60028076171875, 25.63795280456543, 27.67562484741211, 29.713298797607422, 31.7509708404541, 33.78864288330078, 35.826316833496094, 37.86398696899414, 39.90166091918945, 41.9393310546875, 43.97700500488281, 46.014678955078125, 48.05235290527344, 50.090023040771484, 52.1276969909668, 54.165367126464844, 56.203041076660156, 58.24071502685547, 60.278385162353516, 62.31605911254883, 64.35372924804688, 66.39140319824219]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 7.0, 7.0, 21.0, 18.0, 36.0, 35.0, 52.0, 77.0, 85.0, 146.0, 229.0, 277.0, 418.0, 590.0, 909.0, 1482.0, 2370.0, 4693.0, 11607.0, 41480.0, 603666.0, 3447923.0, 52018.0, 13571.0, 5262.0, 2728.0, 1544.0, 954.0, 577.0, 401.0, 300.0, 198.0, 160.0, 106.0, 93.0, 52.0, 44.0, 32.0, 24.0, 15.0, 14.0, 16.0, 6.0, 8.0, 6.0, 2.0, 4.0, 0.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.65234375, -6.438232421875, -6.22412109375, -6.010009765625, -5.7958984375, -5.581787109375, -5.36767578125, -5.153564453125, -4.939453125, -4.725341796875, -4.51123046875, -4.297119140625, -4.0830078125, -3.868896484375, -3.65478515625, -3.440673828125, -3.2265625, -3.012451171875, -2.79833984375, -2.584228515625, -2.3701171875, -2.156005859375, -1.94189453125, -1.727783203125, -1.513671875, -1.299560546875, -1.08544921875, -0.871337890625, -0.6572265625, -0.443115234375, -0.22900390625, -0.014892578125, 0.19921875, 0.413330078125, 0.62744140625, 0.841552734375, 1.0556640625, 1.269775390625, 1.48388671875, 1.697998046875, 1.912109375, 2.126220703125, 2.34033203125, 2.554443359375, 2.7685546875, 2.982666015625, 3.19677734375, 3.410888671875, 3.625, 3.839111328125, 4.05322265625, 4.267333984375, 4.4814453125, 4.695556640625, 4.90966796875, 5.123779296875, 5.337890625, 5.552001953125, 5.76611328125, 5.980224609375, 6.1943359375, 6.408447265625, 6.62255859375, 6.836669921875, 7.05078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 2.0, 4.0, 11.0, 12.0, 8.0, 5.0, 7.0, 11.0, 20.0, 30.0, 21.0, 30.0, 34.0, 31.0, 32.0, 38.0, 41.0, 33.0, 53.0, 44.0, 61.0, 45.0, 48.0, 50.0, 35.0, 35.0, 35.0, 36.0, 30.0, 27.0, 23.0, 15.0, 16.0, 17.0, 7.0, 4.0, 15.0, 4.0, 5.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.283203125, -3.183319091796875, -3.08343505859375, -2.983551025390625, -2.8836669921875, -2.783782958984375, -2.68389892578125, -2.584014892578125, -2.484130859375, -2.384246826171875, -2.28436279296875, -2.184478759765625, -2.0845947265625, -1.984710693359375, -1.88482666015625, -1.784942626953125, -1.68505859375, -1.585174560546875, -1.48529052734375, -1.385406494140625, -1.2855224609375, -1.185638427734375, -1.08575439453125, -0.985870361328125, -0.885986328125, -0.786102294921875, -0.68621826171875, -0.586334228515625, -0.4864501953125, -0.386566162109375, -0.28668212890625, -0.186798095703125, -0.0869140625, 0.012969970703125, 0.11285400390625, 0.212738037109375, 0.3126220703125, 0.412506103515625, 0.51239013671875, 0.612274169921875, 0.712158203125, 0.812042236328125, 0.91192626953125, 1.011810302734375, 1.1116943359375, 1.211578369140625, 1.31146240234375, 1.411346435546875, 1.51123046875, 1.611114501953125, 1.71099853515625, 1.810882568359375, 1.9107666015625, 2.010650634765625, 2.11053466796875, 2.210418701171875, 2.310302734375, 2.410186767578125, 2.51007080078125, 2.609954833984375, 2.7098388671875, 2.809722900390625, 2.90960693359375, 3.009490966796875, 3.109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 12.0, 18.0, 15.0, 13.0, 16.0, 22.0, 36.0, 41.0, 61.0, 84.0, 127.0, 218.0, 284.0, 482.0, 807.0, 1361.0, 2512.0, 5563.0, 16459.0, 82563.0, 3531409.0, 490055.0, 42314.0, 10746.0, 4085.0, 1968.0, 1114.0, 597.0, 412.0, 260.0, 178.0, 122.0, 83.0, 55.0, 52.0, 30.0, 21.0, 26.0, 15.0, 13.0, 8.0, 5.0, 2.0, 9.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.58203125, -7.35101318359375, -7.1199951171875, -6.88897705078125, -6.657958984375, -6.42694091796875, -6.1959228515625, -5.96490478515625, -5.73388671875, -5.50286865234375, -5.2718505859375, -5.04083251953125, -4.809814453125, -4.57879638671875, -4.3477783203125, -4.11676025390625, -3.8857421875, -3.65472412109375, -3.4237060546875, -3.19268798828125, -2.961669921875, -2.73065185546875, -2.4996337890625, -2.26861572265625, -2.03759765625, -1.80657958984375, -1.5755615234375, -1.34454345703125, -1.113525390625, -0.88250732421875, -0.6514892578125, -0.42047119140625, -0.189453125, 0.04156494140625, 0.2725830078125, 0.50360107421875, 0.734619140625, 0.96563720703125, 1.1966552734375, 1.42767333984375, 1.65869140625, 1.88970947265625, 2.1207275390625, 2.35174560546875, 2.582763671875, 2.81378173828125, 3.0447998046875, 3.27581787109375, 3.5068359375, 3.73785400390625, 3.9688720703125, 4.19989013671875, 4.430908203125, 4.66192626953125, 4.8929443359375, 5.12396240234375, 5.35498046875, 5.58599853515625, 5.8170166015625, 6.04803466796875, 6.279052734375, 6.51007080078125, 6.7410888671875, 6.97210693359375, 7.203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 17.0, 25.0, 57.0, 135.0, 460.0, 2854.0, 313.0, 95.0, 41.0, 25.0, 9.0, 13.0, 4.0, 7.0, 6.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.453125, -3.36077880859375, -3.2684326171875, -3.17608642578125, -3.083740234375, -2.99139404296875, -2.8990478515625, -2.80670166015625, -2.71435546875, -2.62200927734375, -2.5296630859375, -2.43731689453125, -2.344970703125, -2.25262451171875, -2.1602783203125, -2.06793212890625, -1.9755859375, -1.88323974609375, -1.7908935546875, -1.69854736328125, -1.606201171875, -1.51385498046875, -1.4215087890625, -1.32916259765625, -1.23681640625, -1.14447021484375, -1.0521240234375, -0.95977783203125, -0.867431640625, -0.77508544921875, -0.6827392578125, -0.59039306640625, -0.498046875, -0.40570068359375, -0.3133544921875, -0.22100830078125, -0.128662109375, -0.03631591796875, 0.0560302734375, 0.14837646484375, 0.24072265625, 0.33306884765625, 0.4254150390625, 0.51776123046875, 0.610107421875, 0.70245361328125, 0.7947998046875, 0.88714599609375, 0.9794921875, 1.07183837890625, 1.1641845703125, 1.25653076171875, 1.348876953125, 1.44122314453125, 1.5335693359375, 1.62591552734375, 1.71826171875, 1.81060791015625, 1.9029541015625, 1.99530029296875, 2.087646484375, 2.17999267578125, 2.2723388671875, 2.36468505859375, 2.45703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 7.0, 15.0, 22.0, 28.0, 40.0, 55.0, 71.0, 92.0, 105.0, 94.0, 95.0, 90.0, 82.0, 71.0, 40.0, 25.0, 20.0, 13.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.574042320251465, -4.330786228179932, -4.087530136108398, -3.8442745208740234, -3.6010184288024902, -3.357762336730957, -3.114506483078003, -2.871250629425049, -2.6279945373535156, -2.3847384452819824, -2.1414825916290283, -1.8982266187667847, -1.654970645904541, -1.4117146730422974, -1.1684587001800537, -0.9252027273178101, -0.6819467544555664, -0.43869078159332275, -0.1954348087310791, 0.04782116413116455, 0.2910771369934082, 0.5343331098556519, 0.7775890827178955, 1.0208450555801392, 1.2641010284423828, 1.5073570013046265, 1.7506129741668701, 1.9938689470291138, 2.2371249198913574, 2.4803810119628906, 2.7236368656158447, 2.966892719268799, 3.210148811340332, 3.4534049034118652, 3.6966607570648193, 3.9399166107177734, 4.183172702789307, 4.42642879486084, 4.669684410095215, 4.912940502166748, 5.156196594238281, 5.3994526863098145, 5.642708778381348, 5.885964393615723, 6.129220485687256, 6.372476577758789, 6.615732192993164, 6.858988285064697, 7.1022443771362305, 7.345500469207764, 7.588756561279297, 7.832012176513672, 8.075267791748047, 8.318524360656738, 8.561779975891113, 8.805036544799805, 9.04829216003418, 9.291547775268555, 9.534804344177246, 9.778059959411621, 10.021316528320312, 10.264572143554688, 10.507827758789062, 10.751084327697754, 10.994339942932129]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 8.0, 10.0, 14.0, 14.0, 22.0, 21.0, 31.0, 42.0, 40.0, 57.0, 55.0, 57.0, 67.0, 66.0, 69.0, 51.0, 64.0, 48.0, 33.0, 45.0, 40.0, 36.0, 25.0, 16.0, 15.0, 18.0, 5.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.925815582275391, -4.720465660095215, -4.515115261077881, -4.309764862060547, -4.104414939880371, -3.899064779281616, -3.6937146186828613, -3.4883644580841064, -3.2830142974853516, -3.0776641368865967, -2.872313976287842, -2.666963815689087, -2.461613655090332, -2.256263494491577, -2.0509133338928223, -1.8455631732940674, -1.6402130126953125, -1.4348628520965576, -1.2295126914978027, -1.0241625308990479, -0.818812370300293, -0.6134622097015381, -0.4081120491027832, -0.20276188850402832, 0.0025882720947265625, 0.20793843269348145, 0.41328859329223633, 0.6186387538909912, 0.8239889144897461, 1.029339075088501, 1.2346892356872559, 1.4400393962860107, 1.6453895568847656, 1.8507397174835205, 2.0560898780822754, 2.2614400386810303, 2.466790199279785, 2.67214035987854, 2.877490520477295, 3.08284068107605, 3.2881908416748047, 3.4935410022735596, 3.6988911628723145, 3.9042413234710693, 4.109591484069824, 4.31494140625, 4.520291805267334, 4.725642204284668, 4.930992126464844, 5.1363420486450195, 5.3416924476623535, 5.5470428466796875, 5.752392768859863, 5.957742691040039, 6.163093090057373, 6.368443489074707, 6.573793411254883, 6.779143333435059, 6.984493732452393, 7.189844131469727, 7.395194053649902, 7.600543975830078, 7.805894374847412, 8.011244773864746, 8.216594696044922]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 13.0, 18.0, 24.0, 22.0, 50.0, 84.0, 133.0, 228.0, 392.0, 818.0, 1587.0, 3387.0, 7156.0, 17225.0, 44810.0, 130876.0, 322917.0, 317203.0, 127521.0, 44034.0, 16481.0, 6896.0, 3274.0, 1515.0, 787.0, 400.0, 249.0, 156.0, 99.0, 65.0, 45.0, 30.0, 20.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.8853759765625, -4.704345703125, -4.5233154296875, -4.34228515625, -4.1612548828125, -3.980224609375, -3.7991943359375, -3.6181640625, -3.4371337890625, -3.256103515625, -3.0750732421875, -2.89404296875, -2.7130126953125, -2.531982421875, -2.3509521484375, -2.169921875, -1.9888916015625, -1.807861328125, -1.6268310546875, -1.44580078125, -1.2647705078125, -1.083740234375, -0.9027099609375, -0.7216796875, -0.5406494140625, -0.359619140625, -0.1785888671875, 0.00244140625, 0.1834716796875, 0.364501953125, 0.5455322265625, 0.7265625, 0.9075927734375, 1.088623046875, 1.2696533203125, 1.45068359375, 1.6317138671875, 1.812744140625, 1.9937744140625, 2.1748046875, 2.3558349609375, 2.536865234375, 2.7178955078125, 2.89892578125, 3.0799560546875, 3.260986328125, 3.4420166015625, 3.623046875, 3.8040771484375, 3.985107421875, 4.1661376953125, 4.34716796875, 4.5281982421875, 4.709228515625, 4.8902587890625, 5.0712890625, 5.2523193359375, 5.433349609375, 5.6143798828125, 5.79541015625, 5.9764404296875, 6.157470703125, 6.3385009765625, 6.51953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 10.0, 5.0, 8.0, 8.0, 10.0, 8.0, 7.0, 8.0, 19.0, 17.0, 30.0, 26.0, 29.0, 43.0, 41.0, 41.0, 41.0, 49.0, 43.0, 48.0, 57.0, 48.0, 40.0, 56.0, 42.0, 43.0, 42.0, 25.0, 30.0, 24.0, 22.0, 14.0, 12.0, 10.0, 9.0, 10.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.372039794921875, -3.26556396484375, -3.159088134765625, -3.0526123046875, -2.946136474609375, -2.83966064453125, -2.733184814453125, -2.626708984375, -2.520233154296875, -2.41375732421875, -2.307281494140625, -2.2008056640625, -2.094329833984375, -1.98785400390625, -1.881378173828125, -1.77490234375, -1.668426513671875, -1.56195068359375, -1.455474853515625, -1.3489990234375, -1.242523193359375, -1.13604736328125, -1.029571533203125, -0.923095703125, -0.816619873046875, -0.71014404296875, -0.603668212890625, -0.4971923828125, -0.390716552734375, -0.28424072265625, -0.177764892578125, -0.0712890625, 0.035186767578125, 0.14166259765625, 0.248138427734375, 0.3546142578125, 0.461090087890625, 0.56756591796875, 0.674041748046875, 0.780517578125, 0.886993408203125, 0.99346923828125, 1.099945068359375, 1.2064208984375, 1.312896728515625, 1.41937255859375, 1.525848388671875, 1.63232421875, 1.738800048828125, 1.84527587890625, 1.951751708984375, 2.0582275390625, 2.164703369140625, 2.27117919921875, 2.377655029296875, 2.484130859375, 2.590606689453125, 2.69708251953125, 2.803558349609375, 2.9100341796875, 3.016510009765625, 3.12298583984375, 3.229461669921875, 3.3359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 11.0, 17.0, 17.0, 24.0, 37.0, 67.0, 77.0, 137.0, 211.0, 361.0, 679.0, 1465.0, 3388.0, 10617.0, 44545.0, 258283.0, 575801.0, 118022.0, 23417.0, 6652.0, 2372.0, 1014.0, 487.0, 289.0, 180.0, 97.0, 73.0, 59.0, 44.0, 24.0, 21.0, 9.0, 11.0, 5.0, 10.0, 7.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6171875, -8.35833740234375, -8.0994873046875, -7.84063720703125, -7.581787109375, -7.32293701171875, -7.0640869140625, -6.80523681640625, -6.54638671875, -6.28753662109375, -6.0286865234375, -5.76983642578125, -5.510986328125, -5.25213623046875, -4.9932861328125, -4.73443603515625, -4.4755859375, -4.21673583984375, -3.9578857421875, -3.69903564453125, -3.440185546875, -3.18133544921875, -2.9224853515625, -2.66363525390625, -2.40478515625, -2.14593505859375, -1.8870849609375, -1.62823486328125, -1.369384765625, -1.11053466796875, -0.8516845703125, -0.59283447265625, -0.333984375, -0.07513427734375, 0.1837158203125, 0.44256591796875, 0.701416015625, 0.96026611328125, 1.2191162109375, 1.47796630859375, 1.73681640625, 1.99566650390625, 2.2545166015625, 2.51336669921875, 2.772216796875, 3.03106689453125, 3.2899169921875, 3.54876708984375, 3.8076171875, 4.06646728515625, 4.3253173828125, 4.58416748046875, 4.843017578125, 5.10186767578125, 5.3607177734375, 5.61956787109375, 5.87841796875, 6.13726806640625, 6.3961181640625, 6.65496826171875, 6.913818359375, 7.17266845703125, 7.4315185546875, 7.69036865234375, 7.94921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 24.0, 14.0, 17.0, 20.0, 33.0, 35.0, 35.0, 40.0, 41.0, 38.0, 53.0, 57.0, 54.0, 46.0, 60.0, 55.0, 53.0, 48.0, 36.0, 38.0, 34.0, 40.0, 22.0, 22.0, 23.0, 6.0, 11.0, 11.0, 9.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.3125, -18.7830810546875, -18.253662109375, -17.7242431640625, -17.19482421875, -16.6654052734375, -16.135986328125, -15.6065673828125, -15.0771484375, -14.5477294921875, -14.018310546875, -13.4888916015625, -12.95947265625, -12.4300537109375, -11.900634765625, -11.3712158203125, -10.841796875, -10.3123779296875, -9.782958984375, -9.2535400390625, -8.72412109375, -8.1947021484375, -7.665283203125, -7.1358642578125, -6.6064453125, -6.0770263671875, -5.547607421875, -5.0181884765625, -4.48876953125, -3.9593505859375, -3.429931640625, -2.9005126953125, -2.37109375, -1.8416748046875, -1.312255859375, -0.7828369140625, -0.25341796875, 0.2760009765625, 0.805419921875, 1.3348388671875, 1.8642578125, 2.3936767578125, 2.923095703125, 3.4525146484375, 3.98193359375, 4.5113525390625, 5.040771484375, 5.5701904296875, 6.099609375, 6.6290283203125, 7.158447265625, 7.6878662109375, 8.21728515625, 8.7467041015625, 9.276123046875, 9.8055419921875, 10.3349609375, 10.8643798828125, 11.393798828125, 11.9232177734375, 12.45263671875, 12.9820556640625, 13.511474609375, 14.0408935546875, 14.5703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 9.0, 10.0, 12.0, 37.0, 45.0, 71.0, 133.0, 291.0, 748.0, 2441.0, 13711.0, 179887.0, 775958.0, 65463.0, 7134.0, 1525.0, 542.0, 234.0, 111.0, 60.0, 42.0, 20.0, 24.0, 16.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.85809326171875, -6.6693115234375, -6.48052978515625, -6.291748046875, -6.10296630859375, -5.9141845703125, -5.72540283203125, -5.53662109375, -5.34783935546875, -5.1590576171875, -4.97027587890625, -4.781494140625, -4.59271240234375, -4.4039306640625, -4.21514892578125, -4.0263671875, -3.83758544921875, -3.6488037109375, -3.46002197265625, -3.271240234375, -3.08245849609375, -2.8936767578125, -2.70489501953125, -2.51611328125, -2.32733154296875, -2.1385498046875, -1.94976806640625, -1.760986328125, -1.57220458984375, -1.3834228515625, -1.19464111328125, -1.005859375, -0.81707763671875, -0.6282958984375, -0.43951416015625, -0.250732421875, -0.06195068359375, 0.1268310546875, 0.31561279296875, 0.50439453125, 0.69317626953125, 0.8819580078125, 1.07073974609375, 1.259521484375, 1.44830322265625, 1.6370849609375, 1.82586669921875, 2.0146484375, 2.20343017578125, 2.3922119140625, 2.58099365234375, 2.769775390625, 2.95855712890625, 3.1473388671875, 3.33612060546875, 3.52490234375, 3.71368408203125, 3.9024658203125, 4.09124755859375, 4.280029296875, 4.46881103515625, 4.6575927734375, 4.84637451171875, 5.03515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 8.0, 11.0, 6.0, 17.0, 17.0, 34.0, 38.0, 40.0, 60.0, 57.0, 67.0, 79.0, 80.0, 77.0, 77.0, 65.0, 51.0, 51.0, 34.0, 21.0, 19.0, 12.0, 20.0, 8.0, 9.0, 10.0, 1.0, 3.0, 9.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005440711975097656, -0.0005255565047264099, -0.0005070418119430542, -0.0004885271191596985, -0.0004700124263763428, -0.00045149773359298706, -0.00043298304080963135, -0.00041446834802627563, -0.0003959536552429199, -0.0003774389624595642, -0.0003589242696762085, -0.0003404095768928528, -0.00032189488410949707, -0.00030338019132614136, -0.00028486549854278564, -0.00026635080575942993, -0.0002478361129760742, -0.0002293214201927185, -0.0002108067274093628, -0.00019229203462600708, -0.00017377734184265137, -0.00015526264905929565, -0.00013674795627593994, -0.00011823326349258423, -9.971857070922852e-05, -8.12038779258728e-05, -6.268918514251709e-05, -4.417449235916138e-05, -2.5659799575805664e-05, -7.145106792449951e-06, 1.1369585990905762e-05, 2.9884278774261475e-05, 4.839897155761719e-05, 6.69136643409729e-05, 8.542835712432861e-05, 0.00010394304990768433, 0.00012245774269104004, 0.00014097243547439575, 0.00015948712825775146, 0.00017800182104110718, 0.0001965165138244629, 0.0002150312066078186, 0.00023354589939117432, 0.00025206059217453003, 0.00027057528495788574, 0.00028908997774124146, 0.00030760467052459717, 0.0003261193633079529, 0.0003446340560913086, 0.0003631487488746643, 0.00038166344165802, 0.00040017813444137573, 0.00041869282722473145, 0.00043720752000808716, 0.00045572221279144287, 0.0004742369055747986, 0.0004927515983581543, 0.00051126629114151, 0.0005297809839248657, 0.0005482956767082214, 0.0005668103694915771, 0.0005853250622749329, 0.0006038397550582886, 0.0006223544478416443, 0.000640869140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 11.0, 15.0, 22.0, 40.0, 90.0, 150.0, 361.0, 890.0, 3306.0, 28685.0, 744361.0, 256178.0, 11360.0, 2012.0, 575.0, 243.0, 106.0, 57.0, 26.0, 18.0, 13.0, 9.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4078369140625, -8.151611328125, -7.8953857421875, -7.63916015625, -7.3829345703125, -7.126708984375, -6.8704833984375, -6.6142578125, -6.3580322265625, -6.101806640625, -5.8455810546875, -5.58935546875, -5.3331298828125, -5.076904296875, -4.8206787109375, -4.564453125, -4.3082275390625, -4.052001953125, -3.7957763671875, -3.53955078125, -3.2833251953125, -3.027099609375, -2.7708740234375, -2.5146484375, -2.2584228515625, -2.002197265625, -1.7459716796875, -1.48974609375, -1.2335205078125, -0.977294921875, -0.7210693359375, -0.46484375, -0.2086181640625, 0.047607421875, 0.3038330078125, 0.56005859375, 0.8162841796875, 1.072509765625, 1.3287353515625, 1.5849609375, 1.8411865234375, 2.097412109375, 2.3536376953125, 2.60986328125, 2.8660888671875, 3.122314453125, 3.3785400390625, 3.634765625, 3.8909912109375, 4.147216796875, 4.4034423828125, 4.65966796875, 4.9158935546875, 5.172119140625, 5.4283447265625, 5.6845703125, 5.9407958984375, 6.197021484375, 6.4532470703125, 6.70947265625, 6.9656982421875, 7.221923828125, 7.4781494140625, 7.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 15.0, 16.0, 31.0, 32.0, 69.0, 85.0, 83.0, 124.0, 118.0, 109.0, 92.0, 66.0, 50.0, 35.0, 26.0, 19.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.1964111328125, -7.013916015625, -6.8314208984375, -6.64892578125, -6.4664306640625, -6.283935546875, -6.1014404296875, -5.9189453125, -5.7364501953125, -5.553955078125, -5.3714599609375, -5.18896484375, -5.0064697265625, -4.823974609375, -4.6414794921875, -4.458984375, -4.2764892578125, -4.093994140625, -3.9114990234375, -3.72900390625, -3.5465087890625, -3.364013671875, -3.1815185546875, -2.9990234375, -2.8165283203125, -2.634033203125, -2.4515380859375, -2.26904296875, -2.0865478515625, -1.904052734375, -1.7215576171875, -1.5390625, -1.3565673828125, -1.174072265625, -0.9915771484375, -0.80908203125, -0.6265869140625, -0.444091796875, -0.2615966796875, -0.0791015625, 0.1033935546875, 0.285888671875, 0.4683837890625, 0.65087890625, 0.8333740234375, 1.015869140625, 1.1983642578125, 1.380859375, 1.5633544921875, 1.745849609375, 1.9283447265625, 2.11083984375, 2.2933349609375, 2.475830078125, 2.6583251953125, 2.8408203125, 3.0233154296875, 3.205810546875, 3.3883056640625, 3.57080078125, 3.7532958984375, 3.935791015625, 4.1182861328125, 4.30078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 9.0, 15.0, 22.0, 54.0, 69.0, 110.0, 162.0, 156.0, 149.0, 113.0, 60.0, 35.0, 20.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.90678405761719, -68.56118774414062, -66.2155990600586, -63.87000274658203, -61.524410247802734, -59.17881774902344, -56.83322525024414, -54.487632751464844, -52.14203643798828, -49.796443939208984, -47.45085144042969, -45.105255126953125, -42.75966262817383, -40.41407012939453, -38.068477630615234, -35.72288513183594, -33.37729263305664, -31.031700134277344, -28.686105728149414, -26.340513229370117, -23.994918823242188, -21.64932632446289, -19.303733825683594, -16.958139419555664, -14.612546920776367, -12.266953468322754, -9.92136001586914, -7.575767517089844, -5.2301740646362305, -2.884580612182617, -0.5389881134033203, 1.8066062927246094, 4.152198791503906, 6.4977922439575195, 8.843385696411133, 11.18897819519043, 13.534571647644043, 15.880165100097656, 18.225757598876953, 20.571352005004883, 22.91694450378418, 25.262537002563477, 27.608131408691406, 29.953723907470703, 32.29931640625, 34.64491271972656, 36.990501403808594, 39.336097717285156, 41.68169021606445, 44.02728271484375, 46.37287521362305, 48.718467712402344, 51.064064025878906, 53.4096565246582, 55.7552490234375, 58.10084533691406, 60.446434020996094, 62.79202651977539, 65.13761901855469, 67.48321533203125, 69.82880401611328, 72.17440032958984, 74.51998901367188, 76.86558532714844, 79.211181640625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 4.0, 15.0, 13.0, 14.0, 18.0, 26.0, 29.0, 47.0, 40.0, 41.0, 60.0, 45.0, 56.0, 59.0, 60.0, 46.0, 47.0, 56.0, 39.0, 50.0, 41.0, 27.0, 30.0, 31.0, 16.0, 17.0, 17.0, 11.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.93276977539062, -75.59931945800781, -73.265869140625, -70.93241882324219, -68.59896850585938, -66.2655258178711, -63.93207550048828, -61.59862518310547, -59.265174865722656, -56.931724548339844, -54.59827423095703, -52.264827728271484, -49.93137741088867, -47.59792709350586, -45.26448059082031, -42.9310302734375, -40.59757995605469, -38.264129638671875, -35.93067932128906, -33.597232818603516, -31.263782501220703, -28.93033218383789, -26.59688377380371, -24.26343536376953, -21.92998504638672, -19.596534729003906, -17.263086318969727, -14.92963695526123, -12.596187591552734, -10.262738227844238, -7.929288864135742, -5.5958404541015625, -3.2623825073242188, -0.9289331436157227, 1.4045162200927734, 3.7379655838012695, 6.071414947509766, 8.404864311218262, 10.738313674926758, 13.071762084960938, 15.40521240234375, 17.738662719726562, 20.072111129760742, 22.405559539794922, 24.739009857177734, 27.072460174560547, 29.405908584594727, 31.739356994628906, 34.07280731201172, 36.40625762939453, 38.739707946777344, 41.07315444946289, 43.4066047668457, 45.740055084228516, 48.07350158691406, 50.406951904296875, 52.74040222167969, 55.0738525390625, 57.40730285644531, 59.74074935913086, 62.07419967651367, 64.40764617919922, 66.74109649658203, 69.07454681396484, 71.40799713134766]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 7.0, 16.0, 27.0, 37.0, 66.0, 81.0, 131.0, 230.0, 334.0, 606.0, 995.0, 2020.0, 4223.0, 10167.0, 32604.0, 223946.0, 3829912.0, 60974.0, 15821.0, 6012.0, 2722.0, 1316.0, 715.0, 417.0, 270.0, 200.0, 115.0, 99.0, 56.0, 32.0, 36.0, 23.0, 14.0, 13.0, 6.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9375, -5.753173828125, -5.56884765625, -5.384521484375, -5.2001953125, -5.015869140625, -4.83154296875, -4.647216796875, -4.462890625, -4.278564453125, -4.09423828125, -3.909912109375, -3.7255859375, -3.541259765625, -3.35693359375, -3.172607421875, -2.98828125, -2.803955078125, -2.61962890625, -2.435302734375, -2.2509765625, -2.066650390625, -1.88232421875, -1.697998046875, -1.513671875, -1.329345703125, -1.14501953125, -0.960693359375, -0.7763671875, -0.592041015625, -0.40771484375, -0.223388671875, -0.0390625, 0.145263671875, 0.32958984375, 0.513916015625, 0.6982421875, 0.882568359375, 1.06689453125, 1.251220703125, 1.435546875, 1.619873046875, 1.80419921875, 1.988525390625, 2.1728515625, 2.357177734375, 2.54150390625, 2.725830078125, 2.91015625, 3.094482421875, 3.27880859375, 3.463134765625, 3.6474609375, 3.831787109375, 4.01611328125, 4.200439453125, 4.384765625, 4.569091796875, 4.75341796875, 4.937744140625, 5.1220703125, 5.306396484375, 5.49072265625, 5.675048828125, 5.859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 5.0, 4.0, 12.0, 9.0, 14.0, 21.0, 11.0, 20.0, 23.0, 27.0, 49.0, 26.0, 32.0, 43.0, 50.0, 51.0, 44.0, 65.0, 45.0, 56.0, 42.0, 58.0, 44.0, 38.0, 31.0, 33.0, 28.0, 17.0, 20.0, 19.0, 11.0, 15.0, 10.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.669921875, -3.560516357421875, -3.45111083984375, -3.341705322265625, -3.2322998046875, -3.122894287109375, -3.01348876953125, -2.904083251953125, -2.794677734375, -2.685272216796875, -2.57586669921875, -2.466461181640625, -2.3570556640625, -2.247650146484375, -2.13824462890625, -2.028839111328125, -1.91943359375, -1.810028076171875, -1.70062255859375, -1.591217041015625, -1.4818115234375, -1.372406005859375, -1.26300048828125, -1.153594970703125, -1.044189453125, -0.934783935546875, -0.82537841796875, -0.715972900390625, -0.6065673828125, -0.497161865234375, -0.38775634765625, -0.278350830078125, -0.1689453125, -0.059539794921875, 0.04986572265625, 0.159271240234375, 0.2686767578125, 0.378082275390625, 0.48748779296875, 0.596893310546875, 0.706298828125, 0.815704345703125, 0.92510986328125, 1.034515380859375, 1.1439208984375, 1.253326416015625, 1.36273193359375, 1.472137451171875, 1.58154296875, 1.690948486328125, 1.80035400390625, 1.909759521484375, 2.0191650390625, 2.128570556640625, 2.23797607421875, 2.347381591796875, 2.456787109375, 2.566192626953125, 2.67559814453125, 2.785003662109375, 2.8944091796875, 3.003814697265625, 3.11322021484375, 3.222625732421875, 3.33203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 11.0, 12.0, 11.0, 12.0, 9.0, 22.0, 21.0, 30.0, 40.0, 44.0, 78.0, 108.0, 194.0, 325.0, 610.0, 1491.0, 5479.0, 51603.0, 4044142.0, 79762.0, 6912.0, 1632.0, 673.0, 361.0, 211.0, 125.0, 73.0, 65.0, 41.0, 37.0, 23.0, 26.0, 19.0, 9.0, 9.0, 11.0, 5.0, 10.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-13.625, -13.2308349609375, -12.836669921875, -12.4425048828125, -12.04833984375, -11.6541748046875, -11.260009765625, -10.8658447265625, -10.4716796875, -10.0775146484375, -9.683349609375, -9.2891845703125, -8.89501953125, -8.5008544921875, -8.106689453125, -7.7125244140625, -7.318359375, -6.9241943359375, -6.530029296875, -6.1358642578125, -5.74169921875, -5.3475341796875, -4.953369140625, -4.5592041015625, -4.1650390625, -3.7708740234375, -3.376708984375, -2.9825439453125, -2.58837890625, -2.1942138671875, -1.800048828125, -1.4058837890625, -1.01171875, -0.6175537109375, -0.223388671875, 0.1707763671875, 0.56494140625, 0.9591064453125, 1.353271484375, 1.7474365234375, 2.1416015625, 2.5357666015625, 2.929931640625, 3.3240966796875, 3.71826171875, 4.1124267578125, 4.506591796875, 4.9007568359375, 5.294921875, 5.6890869140625, 6.083251953125, 6.4774169921875, 6.87158203125, 7.2657470703125, 7.659912109375, 8.0540771484375, 8.4482421875, 8.8424072265625, 9.236572265625, 9.6307373046875, 10.02490234375, 10.4190673828125, 10.813232421875, 11.2073974609375, 11.6015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 16.0, 28.0, 58.0, 184.0, 3205.0, 403.0, 91.0, 37.0, 19.0, 13.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.8143768310546875, -1.717620849609375, -1.6208648681640625, -1.52410888671875, -1.4273529052734375, -1.330596923828125, -1.2338409423828125, -1.1370849609375, -1.0403289794921875, -0.943572998046875, -0.8468170166015625, -0.75006103515625, -0.6533050537109375, -0.556549072265625, -0.4597930908203125, -0.363037109375, -0.2662811279296875, -0.169525146484375, -0.0727691650390625, 0.02398681640625, 0.1207427978515625, 0.217498779296875, 0.3142547607421875, 0.4110107421875, 0.5077667236328125, 0.604522705078125, 0.7012786865234375, 0.79803466796875, 0.8947906494140625, 0.991546630859375, 1.0883026123046875, 1.18505859375, 1.2818145751953125, 1.378570556640625, 1.4753265380859375, 1.57208251953125, 1.6688385009765625, 1.765594482421875, 1.8623504638671875, 1.9591064453125, 2.0558624267578125, 2.152618408203125, 2.2493743896484375, 2.34613037109375, 2.4428863525390625, 2.539642333984375, 2.6363983154296875, 2.733154296875, 2.8299102783203125, 2.926666259765625, 3.0234222412109375, 3.12017822265625, 3.2169342041015625, 3.313690185546875, 3.4104461669921875, 3.5072021484375, 3.6039581298828125, 3.700714111328125, 3.7974700927734375, 3.89422607421875, 3.9909820556640625, 4.087738037109375, 4.1844940185546875, 4.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 19.0, 44.0, 81.0, 152.0, 178.0, 204.0, 139.0, 87.0, 40.0, 26.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.838037967681885, -5.4201812744140625, -5.00232458114624, -4.584467887878418, -4.166611194610596, -3.7487547397613525, -3.3308980464935303, -2.913041353225708, -2.4951846599578857, -2.0773279666900635, -1.6594712734222412, -1.2416146993637085, -0.8237580060958862, -0.4059014320373535, 0.01195526123046875, 0.429811954498291, 0.8476686477661133, 1.2655253410339355, 1.6833820343017578, 2.10123872756958, 2.5190954208374023, 2.9369518756866455, 3.3548085689544678, 3.77266526222229, 4.190522193908691, 4.608378887176514, 5.026235580444336, 5.444092273712158, 5.8619489669799805, 6.2798051834106445, 6.697662353515625, 7.115518569946289, 7.5333757400512695, 7.951232433319092, 8.369089126586914, 8.786945343017578, 9.204802513122559, 9.622658729553223, 10.040515899658203, 10.458372116088867, 10.876229286193848, 11.294085502624512, 11.711942672729492, 12.129798889160156, 12.547656059265137, 12.9655122756958, 13.383369445800781, 13.801225662231445, 14.21908187866211, 14.636938095092773, 15.054795265197754, 15.472651481628418, 15.890508651733398, 16.308364868164062, 16.726221084594727, 17.144079208374023, 17.561935424804688, 17.97979164123535, 18.397647857666016, 18.815505981445312, 19.233362197875977, 19.65121841430664, 20.069074630737305, 20.4869327545166, 20.904788970947266]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 7.0, 7.0, 11.0, 15.0, 17.0, 16.0, 21.0, 24.0, 26.0, 36.0, 33.0, 37.0, 31.0, 52.0, 41.0, 56.0, 49.0, 48.0, 70.0, 47.0, 45.0, 39.0, 39.0, 31.0, 33.0, 19.0, 20.0, 20.0, 20.0, 19.0, 12.0, 10.0, 9.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.284671306610107, -4.147883415222168, -4.0110955238342285, -3.87430739402771, -3.7375192642211914, -3.600731372833252, -3.4639434814453125, -3.327155590057373, -3.1903674602508545, -3.053579568862915, -2.9167914390563965, -2.780003547668457, -2.6432156562805176, -2.506427526473999, -2.3696396350860596, -2.232851505279541, -2.0960636138916016, -1.9592756032943726, -1.8224875926971436, -1.685699701309204, -1.548911690711975, -1.412123680114746, -1.2753357887268066, -1.1385477781295776, -1.0017597675323486, -0.8649717569351196, -0.7281838059425354, -0.5913958549499512, -0.45460784435272217, -0.31781983375549316, -0.18103188276290894, -0.04424393177032471, 0.0925440788269043, 0.2293320596218109, 0.36612004041671753, 0.5029079914093018, 0.6396960020065308, 0.7764840126037598, 0.913271963596344, 1.0500599145889282, 1.1868479251861572, 1.3236359357833862, 1.4604239463806152, 1.5972118377685547, 1.7339998483657837, 1.8707878589630127, 2.007575750350952, 2.1443638801574707, 2.28115177154541, 2.4179396629333496, 2.554727792739868, 2.6915156841278076, 2.828303813934326, 2.9650917053222656, 3.101879596710205, 3.2386674880981445, 3.375455617904663, 3.5122435092926025, 3.649031639099121, 3.7858195304870605, 3.922607421875, 4.059395790100098, 4.196183681488037, 4.332971572875977, 4.469759464263916]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 11.0, 24.0, 24.0, 40.0, 61.0, 102.0, 119.0, 176.0, 274.0, 419.0, 695.0, 1224.0, 1999.0, 3743.0, 7313.0, 14705.0, 30954.0, 69330.0, 157568.0, 290093.0, 248831.0, 119707.0, 52248.0, 23829.0, 11642.0, 5871.0, 3015.0, 1718.0, 1052.0, 620.0, 369.0, 224.0, 155.0, 116.0, 70.0, 59.0, 37.0, 25.0, 14.0, 14.0, 12.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.65234375, -3.53387451171875, -3.4154052734375, -3.29693603515625, -3.178466796875, -3.05999755859375, -2.9415283203125, -2.82305908203125, -2.70458984375, -2.58612060546875, -2.4676513671875, -2.34918212890625, -2.230712890625, -2.11224365234375, -1.9937744140625, -1.87530517578125, -1.7568359375, -1.63836669921875, -1.5198974609375, -1.40142822265625, -1.282958984375, -1.16448974609375, -1.0460205078125, -0.92755126953125, -0.80908203125, -0.69061279296875, -0.5721435546875, -0.45367431640625, -0.335205078125, -0.21673583984375, -0.0982666015625, 0.02020263671875, 0.138671875, 0.25714111328125, 0.3756103515625, 0.49407958984375, 0.612548828125, 0.73101806640625, 0.8494873046875, 0.96795654296875, 1.08642578125, 1.20489501953125, 1.3233642578125, 1.44183349609375, 1.560302734375, 1.67877197265625, 1.7972412109375, 1.91571044921875, 2.0341796875, 2.15264892578125, 2.2711181640625, 2.38958740234375, 2.508056640625, 2.62652587890625, 2.7449951171875, 2.86346435546875, 2.98193359375, 3.10040283203125, 3.2188720703125, 3.33734130859375, 3.455810546875, 3.57427978515625, 3.6927490234375, 3.81121826171875, 3.9296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 12.0, 9.0, 11.0, 14.0, 19.0, 26.0, 25.0, 28.0, 31.0, 36.0, 29.0, 21.0, 47.0, 48.0, 50.0, 62.0, 54.0, 45.0, 43.0, 41.0, 54.0, 47.0, 38.0, 29.0, 36.0, 21.0, 27.0, 22.0, 21.0, 12.0, 5.0, 9.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.34765625, -4.23382568359375, -4.1199951171875, -4.00616455078125, -3.892333984375, -3.77850341796875, -3.6646728515625, -3.55084228515625, -3.43701171875, -3.32318115234375, -3.2093505859375, -3.09552001953125, -2.981689453125, -2.86785888671875, -2.7540283203125, -2.64019775390625, -2.5263671875, -2.41253662109375, -2.2987060546875, -2.18487548828125, -2.071044921875, -1.95721435546875, -1.8433837890625, -1.72955322265625, -1.61572265625, -1.50189208984375, -1.3880615234375, -1.27423095703125, -1.160400390625, -1.04656982421875, -0.9327392578125, -0.81890869140625, -0.705078125, -0.59124755859375, -0.4774169921875, -0.36358642578125, -0.249755859375, -0.13592529296875, -0.0220947265625, 0.09173583984375, 0.20556640625, 0.31939697265625, 0.4332275390625, 0.54705810546875, 0.660888671875, 0.77471923828125, 0.8885498046875, 1.00238037109375, 1.1162109375, 1.23004150390625, 1.3438720703125, 1.45770263671875, 1.571533203125, 1.68536376953125, 1.7991943359375, 1.91302490234375, 2.02685546875, 2.14068603515625, 2.2545166015625, 2.36834716796875, 2.482177734375, 2.59600830078125, 2.7098388671875, 2.82366943359375, 2.9375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 14.0, 9.0, 18.0, 28.0, 49.0, 69.0, 116.0, 235.0, 467.0, 949.0, 2657.0, 9853.0, 64623.0, 705347.0, 232531.0, 23803.0, 4905.0, 1494.0, 620.0, 309.0, 182.0, 99.0, 56.0, 36.0, 17.0, 15.0, 10.0, 8.0, 5.0, 9.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.458984375, -12.08984375, -11.720703125, -11.3515625, -10.982421875, -10.61328125, -10.244140625, -9.875, -9.505859375, -9.13671875, -8.767578125, -8.3984375, -8.029296875, -7.66015625, -7.291015625, -6.921875, -6.552734375, -6.18359375, -5.814453125, -5.4453125, -5.076171875, -4.70703125, -4.337890625, -3.96875, -3.599609375, -3.23046875, -2.861328125, -2.4921875, -2.123046875, -1.75390625, -1.384765625, -1.015625, -0.646484375, -0.27734375, 0.091796875, 0.4609375, 0.830078125, 1.19921875, 1.568359375, 1.9375, 2.306640625, 2.67578125, 3.044921875, 3.4140625, 3.783203125, 4.15234375, 4.521484375, 4.890625, 5.259765625, 5.62890625, 5.998046875, 6.3671875, 6.736328125, 7.10546875, 7.474609375, 7.84375, 8.212890625, 8.58203125, 8.951171875, 9.3203125, 9.689453125, 10.05859375, 10.427734375, 10.796875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 6.0, 10.0, 9.0, 22.0, 21.0, 21.0, 22.0, 25.0, 34.0, 37.0, 46.0, 46.0, 55.0, 57.0, 61.0, 57.0, 49.0, 57.0, 55.0, 38.0, 43.0, 35.0, 34.0, 30.0, 24.0, 20.0, 23.0, 13.0, 13.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.5, -17.885498046875, -17.27099609375, -16.656494140625, -16.0419921875, -15.427490234375, -14.81298828125, -14.198486328125, -13.583984375, -12.969482421875, -12.35498046875, -11.740478515625, -11.1259765625, -10.511474609375, -9.89697265625, -9.282470703125, -8.66796875, -8.053466796875, -7.43896484375, -6.824462890625, -6.2099609375, -5.595458984375, -4.98095703125, -4.366455078125, -3.751953125, -3.137451171875, -2.52294921875, -1.908447265625, -1.2939453125, -0.679443359375, -0.06494140625, 0.549560546875, 1.1640625, 1.778564453125, 2.39306640625, 3.007568359375, 3.6220703125, 4.236572265625, 4.85107421875, 5.465576171875, 6.080078125, 6.694580078125, 7.30908203125, 7.923583984375, 8.5380859375, 9.152587890625, 9.76708984375, 10.381591796875, 10.99609375, 11.610595703125, 12.22509765625, 12.839599609375, 13.4541015625, 14.068603515625, 14.68310546875, 15.297607421875, 15.912109375, 16.526611328125, 17.14111328125, 17.755615234375, 18.3701171875, 18.984619140625, 19.59912109375, 20.213623046875, 20.828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 7.0, 1.0, 13.0, 14.0, 12.0, 24.0, 41.0, 57.0, 113.0, 221.0, 640.0, 2942.0, 68549.0, 952867.0, 20394.0, 1733.0, 488.0, 179.0, 96.0, 60.0, 37.0, 19.0, 13.0, 10.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.760498046875, -8.48974609375, -8.218994140625, -7.9482421875, -7.677490234375, -7.40673828125, -7.135986328125, -6.865234375, -6.594482421875, -6.32373046875, -6.052978515625, -5.7822265625, -5.511474609375, -5.24072265625, -4.969970703125, -4.69921875, -4.428466796875, -4.15771484375, -3.886962890625, -3.6162109375, -3.345458984375, -3.07470703125, -2.803955078125, -2.533203125, -2.262451171875, -1.99169921875, -1.720947265625, -1.4501953125, -1.179443359375, -0.90869140625, -0.637939453125, -0.3671875, -0.096435546875, 0.17431640625, 0.445068359375, 0.7158203125, 0.986572265625, 1.25732421875, 1.528076171875, 1.798828125, 2.069580078125, 2.34033203125, 2.611083984375, 2.8818359375, 3.152587890625, 3.42333984375, 3.694091796875, 3.96484375, 4.235595703125, 4.50634765625, 4.777099609375, 5.0478515625, 5.318603515625, 5.58935546875, 5.860107421875, 6.130859375, 6.401611328125, 6.67236328125, 6.943115234375, 7.2138671875, 7.484619140625, 7.75537109375, 8.026123046875, 8.296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 10.0, 10.0, 12.0, 21.0, 23.0, 38.0, 33.0, 47.0, 81.0, 95.0, 114.0, 109.0, 98.0, 67.0, 52.0, 44.0, 27.0, 23.0, 25.0, 17.0, 13.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000530242919921875, -0.0005120262503623962, -0.0004938095808029175, -0.0004755929112434387, -0.00045737624168395996, -0.0004391595721244812, -0.00042094290256500244, -0.0004027262330055237, -0.0003845095634460449, -0.00036629289388656616, -0.0003480762243270874, -0.00032985955476760864, -0.0003116428852081299, -0.0002934262156486511, -0.00027520954608917236, -0.0002569928765296936, -0.00023877620697021484, -0.00022055953741073608, -0.00020234286785125732, -0.00018412619829177856, -0.0001659095287322998, -0.00014769285917282104, -0.00012947618961334229, -0.00011125952005386353, -9.304285049438477e-05, -7.4826180934906e-05, -5.6609511375427246e-05, -3.8392841815948486e-05, -2.0176172256469727e-05, -1.959502696990967e-06, 1.6257166862487793e-05, 3.447383642196655e-05, 5.269050598144531e-05, 7.090717554092407e-05, 8.912384510040283e-05, 0.00010734051465988159, 0.00012555718421936035, 0.0001437738537788391, 0.00016199052333831787, 0.00018020719289779663, 0.0001984238624572754, 0.00021664053201675415, 0.0002348572015762329, 0.00025307387113571167, 0.00027129054069519043, 0.0002895072102546692, 0.00030772387981414795, 0.0003259405493736267, 0.00034415721893310547, 0.00036237388849258423, 0.000380590558052063, 0.00039880722761154175, 0.0004170238971710205, 0.00043524056673049927, 0.00045345723628997803, 0.0004716739058494568, 0.0004898905754089355, 0.0005081072449684143, 0.0005263239145278931, 0.0005445405840873718, 0.0005627572536468506, 0.0005809739232063293, 0.0005991905927658081, 0.0006174072623252869, 0.0006356239318847656]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 26.0, 31.0, 38.0, 97.0, 131.0, 281.0, 591.0, 1550.0, 5183.0, 31623.0, 548247.0, 426237.0, 27127.0, 4769.0, 1417.0, 578.0, 252.0, 135.0, 84.0, 55.0, 25.0, 26.0, 11.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.34942626953125, -5.1871337890625, -5.02484130859375, -4.862548828125, -4.70025634765625, -4.5379638671875, -4.37567138671875, -4.21337890625, -4.05108642578125, -3.8887939453125, -3.72650146484375, -3.564208984375, -3.40191650390625, -3.2396240234375, -3.07733154296875, -2.9150390625, -2.75274658203125, -2.5904541015625, -2.42816162109375, -2.265869140625, -2.10357666015625, -1.9412841796875, -1.77899169921875, -1.61669921875, -1.45440673828125, -1.2921142578125, -1.12982177734375, -0.967529296875, -0.80523681640625, -0.6429443359375, -0.48065185546875, -0.318359375, -0.15606689453125, 0.0062255859375, 0.16851806640625, 0.330810546875, 0.49310302734375, 0.6553955078125, 0.81768798828125, 0.97998046875, 1.14227294921875, 1.3045654296875, 1.46685791015625, 1.629150390625, 1.79144287109375, 1.9537353515625, 2.11602783203125, 2.2783203125, 2.44061279296875, 2.6029052734375, 2.76519775390625, 2.927490234375, 3.08978271484375, 3.2520751953125, 3.41436767578125, 3.57666015625, 3.73895263671875, 3.9012451171875, 4.06353759765625, 4.225830078125, 4.38812255859375, 4.5504150390625, 4.71270751953125, 4.875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 14.0, 18.0, 22.0, 33.0, 50.0, 75.0, 117.0, 151.0, 137.0, 91.0, 97.0, 51.0, 40.0, 21.0, 16.0, 16.0, 6.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.12213134765625, -5.9473876953125, -5.77264404296875, -5.597900390625, -5.42315673828125, -5.2484130859375, -5.07366943359375, -4.89892578125, -4.72418212890625, -4.5494384765625, -4.37469482421875, -4.199951171875, -4.02520751953125, -3.8504638671875, -3.67572021484375, -3.5009765625, -3.32623291015625, -3.1514892578125, -2.97674560546875, -2.802001953125, -2.62725830078125, -2.4525146484375, -2.27777099609375, -2.10302734375, -1.92828369140625, -1.7535400390625, -1.57879638671875, -1.404052734375, -1.22930908203125, -1.0545654296875, -0.87982177734375, -0.705078125, -0.53033447265625, -0.3555908203125, -0.18084716796875, -0.006103515625, 0.16864013671875, 0.3433837890625, 0.51812744140625, 0.69287109375, 0.86761474609375, 1.0423583984375, 1.21710205078125, 1.391845703125, 1.56658935546875, 1.7413330078125, 1.91607666015625, 2.0908203125, 2.26556396484375, 2.4403076171875, 2.61505126953125, 2.789794921875, 2.96453857421875, 3.1392822265625, 3.31402587890625, 3.48876953125, 3.66351318359375, 3.8382568359375, 4.01300048828125, 4.187744140625, 4.36248779296875, 4.5372314453125, 4.71197509765625, 4.88671875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 19.0, 62.0, 259.0, 418.0, 188.0, 35.0, 14.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-291.00189208984375, -285.3441162109375, -279.6863098144531, -274.0285339355469, -268.3707580566406, -262.7129821777344, -257.05517578125, -251.39739990234375, -245.7396240234375, -240.0818328857422, -234.42405700683594, -228.76626586914062, -223.10848999023438, -217.45069885253906, -211.79290771484375, -206.1351318359375, -200.4773406982422, -194.81954956054688, -189.16177368164062, -183.5039825439453, -177.84620666503906, -172.18841552734375, -166.5306396484375, -160.8728485107422, -155.21505737304688, -149.55726623535156, -143.8994903564453, -138.24169921875, -132.58392333984375, -126.92613220214844, -121.26834869384766, -115.61056518554688, -109.95279693603516, -104.29501342773438, -98.6372299194336, -92.97944641113281, -87.3216552734375, -81.66387939453125, -76.00608825683594, -70.34830474853516, -64.69052124023438, -59.032737731933594, -53.37495422363281, -47.717166900634766, -42.059383392333984, -36.4015998840332, -30.743812561035156, -25.086029052734375, -19.428245544433594, -13.770461082458496, -8.112676620483398, -2.4548912048339844, 3.202892303466797, 8.860675811767578, 14.518463134765625, 20.176246643066406, 25.834030151367188, 31.49181365966797, 37.14959716796875, 42.8073844909668, 48.46516799926758, 54.12295150756836, 59.780738830566406, 65.43852233886719, 71.09630584716797]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 7.0, 12.0, 13.0, 7.0, 8.0, 14.0, 16.0, 23.0, 14.0, 34.0, 34.0, 25.0, 30.0, 44.0, 49.0, 40.0, 39.0, 42.0, 59.0, 42.0, 53.0, 48.0, 33.0, 40.0, 40.0, 29.0, 26.0, 37.0, 19.0, 18.0, 16.0, 17.0, 7.0, 8.0, 15.0, 8.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.720909118652344, -59.628684997558594, -57.536460876464844, -55.444236755371094, -53.352012634277344, -51.259788513183594, -49.167564392089844, -47.075340270996094, -44.983116149902344, -42.890892028808594, -40.798667907714844, -38.706443786621094, -36.614219665527344, -34.521995544433594, -32.429771423339844, -30.337547302246094, -28.245323181152344, -26.153099060058594, -24.060874938964844, -21.968650817871094, -19.876426696777344, -17.784202575683594, -15.691978454589844, -13.599754333496094, -11.507530212402344, -9.415306091308594, -7.323081970214844, -5.230857849121094, -3.1386337280273438, -1.0464096069335938, 1.0458145141601562, 3.1380386352539062, 5.2302703857421875, 7.3224945068359375, 9.414718627929688, 11.506942749023438, 13.599166870117188, 15.691390991210938, 17.783615112304688, 19.875839233398438, 21.968063354492188, 24.060287475585938, 26.152511596679688, 28.244735717773438, 30.336959838867188, 32.42918395996094, 34.52140808105469, 36.61363220214844, 38.70585632324219, 40.79808044433594, 42.89030456542969, 44.98252868652344, 47.07475280761719, 49.16697692871094, 51.25920104980469, 53.35142517089844, 55.44364929199219, 57.53587341308594, 59.62809753417969, 61.72032165527344, 63.81254577636719, 65.90476989746094, 67.99699401855469, 70.08921813964844, 72.18144226074219]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 9.0, 14.0, 30.0, 33.0, 44.0, 83.0, 143.0, 264.0, 408.0, 816.0, 1714.0, 4488.0, 13435.0, 62386.0, 3610556.0, 446585.0, 37046.0, 9624.0, 3412.0, 1538.0, 691.0, 387.0, 217.0, 118.0, 78.0, 45.0, 31.0, 20.0, 16.0, 14.0, 3.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.19140625, -6.008544921875, -5.82568359375, -5.642822265625, -5.4599609375, -5.277099609375, -5.09423828125, -4.911376953125, -4.728515625, -4.545654296875, -4.36279296875, -4.179931640625, -3.9970703125, -3.814208984375, -3.63134765625, -3.448486328125, -3.265625, -3.082763671875, -2.89990234375, -2.717041015625, -2.5341796875, -2.351318359375, -2.16845703125, -1.985595703125, -1.802734375, -1.619873046875, -1.43701171875, -1.254150390625, -1.0712890625, -0.888427734375, -0.70556640625, -0.522705078125, -0.33984375, -0.156982421875, 0.02587890625, 0.208740234375, 0.3916015625, 0.574462890625, 0.75732421875, 0.940185546875, 1.123046875, 1.305908203125, 1.48876953125, 1.671630859375, 1.8544921875, 2.037353515625, 2.22021484375, 2.403076171875, 2.5859375, 2.768798828125, 2.95166015625, 3.134521484375, 3.3173828125, 3.500244140625, 3.68310546875, 3.865966796875, 4.048828125, 4.231689453125, 4.41455078125, 4.597412109375, 4.7802734375, 4.963134765625, 5.14599609375, 5.328857421875, 5.51171875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 3.0, 2.0, 6.0, 9.0, 9.0, 8.0, 19.0, 24.0, 21.0, 26.0, 39.0, 45.0, 41.0, 51.0, 52.0, 53.0, 57.0, 63.0, 67.0, 55.0, 58.0, 37.0, 48.0, 37.0, 37.0, 31.0, 17.0, 18.0, 18.0, 11.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.294891357421875, -3.17376708984375, -3.052642822265625, -2.9315185546875, -2.810394287109375, -2.68927001953125, -2.568145751953125, -2.447021484375, -2.325897216796875, -2.20477294921875, -2.083648681640625, -1.9625244140625, -1.841400146484375, -1.72027587890625, -1.599151611328125, -1.47802734375, -1.356903076171875, -1.23577880859375, -1.114654541015625, -0.9935302734375, -0.872406005859375, -0.75128173828125, -0.630157470703125, -0.509033203125, -0.387908935546875, -0.26678466796875, -0.145660400390625, -0.0245361328125, 0.096588134765625, 0.21771240234375, 0.338836669921875, 0.4599609375, 0.581085205078125, 0.70220947265625, 0.823333740234375, 0.9444580078125, 1.065582275390625, 1.18670654296875, 1.307830810546875, 1.428955078125, 1.550079345703125, 1.67120361328125, 1.792327880859375, 1.9134521484375, 2.034576416015625, 2.15570068359375, 2.276824951171875, 2.39794921875, 2.519073486328125, 2.64019775390625, 2.761322021484375, 2.8824462890625, 3.003570556640625, 3.12469482421875, 3.245819091796875, 3.366943359375, 3.488067626953125, 3.60919189453125, 3.730316162109375, 3.8514404296875, 3.972564697265625, 4.09368896484375, 4.214813232421875, 4.3359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 7.0, 17.0, 17.0, 24.0, 25.0, 33.0, 47.0, 72.0, 80.0, 129.0, 161.0, 246.0, 307.0, 433.0, 696.0, 956.0, 1640.0, 3155.0, 7401.0, 25116.0, 180308.0, 3779136.0, 155940.0, 23301.0, 7097.0, 3005.0, 1621.0, 1001.0, 666.0, 469.0, 285.0, 250.0, 175.0, 126.0, 95.0, 65.0, 52.0, 35.0, 16.0, 26.0, 15.0, 5.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.00531005859375, -4.8231201171875, -4.64093017578125, -4.458740234375, -4.27655029296875, -4.0943603515625, -3.91217041015625, -3.72998046875, -3.54779052734375, -3.3656005859375, -3.18341064453125, -3.001220703125, -2.81903076171875, -2.6368408203125, -2.45465087890625, -2.2724609375, -2.09027099609375, -1.9080810546875, -1.72589111328125, -1.543701171875, -1.36151123046875, -1.1793212890625, -0.99713134765625, -0.81494140625, -0.63275146484375, -0.4505615234375, -0.26837158203125, -0.086181640625, 0.09600830078125, 0.2781982421875, 0.46038818359375, 0.642578125, 0.82476806640625, 1.0069580078125, 1.18914794921875, 1.371337890625, 1.55352783203125, 1.7357177734375, 1.91790771484375, 2.10009765625, 2.28228759765625, 2.4644775390625, 2.64666748046875, 2.828857421875, 3.01104736328125, 3.1932373046875, 3.37542724609375, 3.5576171875, 3.73980712890625, 3.9219970703125, 4.10418701171875, 4.286376953125, 4.46856689453125, 4.6507568359375, 4.83294677734375, 5.01513671875, 5.19732666015625, 5.3795166015625, 5.56170654296875, 5.743896484375, 5.92608642578125, 6.1082763671875, 6.29046630859375, 6.47265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 13.0, 22.0, 37.0, 111.0, 419.0, 2888.0, 364.0, 104.0, 38.0, 26.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.2471923828125, -4.107666015625, -3.9681396484375, -3.82861328125, -3.6890869140625, -3.549560546875, -3.4100341796875, -3.2705078125, -3.1309814453125, -2.991455078125, -2.8519287109375, -2.71240234375, -2.5728759765625, -2.433349609375, -2.2938232421875, -2.154296875, -2.0147705078125, -1.875244140625, -1.7357177734375, -1.59619140625, -1.4566650390625, -1.317138671875, -1.1776123046875, -1.0380859375, -0.8985595703125, -0.759033203125, -0.6195068359375, -0.47998046875, -0.3404541015625, -0.200927734375, -0.0614013671875, 0.078125, 0.2176513671875, 0.357177734375, 0.4967041015625, 0.63623046875, 0.7757568359375, 0.915283203125, 1.0548095703125, 1.1943359375, 1.3338623046875, 1.473388671875, 1.6129150390625, 1.75244140625, 1.8919677734375, 2.031494140625, 2.1710205078125, 2.310546875, 2.4500732421875, 2.589599609375, 2.7291259765625, 2.86865234375, 3.0081787109375, 3.147705078125, 3.2872314453125, 3.4267578125, 3.5662841796875, 3.705810546875, 3.8453369140625, 3.98486328125, 4.1243896484375, 4.263916015625, 4.4034423828125, 4.54296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 19.0, 23.0, 73.0, 97.0, 141.0, 183.0, 152.0, 108.0, 63.0, 56.0, 30.0, 16.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.977409362792969, -11.444223403930664, -10.91103744506836, -10.377851486206055, -9.84466552734375, -9.311479568481445, -8.778292655944824, -8.24510669708252, -7.711920738220215, -7.17873477935791, -6.6455488204956055, -6.112362384796143, -5.579176425933838, -5.045990467071533, -4.51280403137207, -3.9796180725097656, -3.446432113647461, -2.9132461547851562, -2.3800599575042725, -1.8468738794326782, -1.313687801361084, -0.7805018424987793, -0.2473156452178955, 0.2858705520629883, 0.819056510925293, 1.3522425889968872, 1.8854286670684814, 2.4186148643493652, 2.95180082321167, 3.4849867820739746, 4.0181732177734375, 4.551359176635742, 5.084545135498047, 5.617731094360352, 6.150917053222656, 6.684103488922119, 7.217289447784424, 7.7504754066467285, 8.283661842346191, 8.816847801208496, 9.3500337600708, 9.883219718933105, 10.41640567779541, 10.949591636657715, 11.482778549194336, 12.01596450805664, 12.549150466918945, 13.08233642578125, 13.615522384643555, 14.14870834350586, 14.681894302368164, 15.215080261230469, 15.748266220092773, 16.281452178955078, 16.814638137817383, 17.347824096679688, 17.881011962890625, 18.41419792175293, 18.947383880615234, 19.48056983947754, 20.013755798339844, 20.54694175720215, 21.080127716064453, 21.61331558227539, 22.146499633789062]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 3.0, 8.0, 3.0, 11.0, 13.0, 10.0, 23.0, 23.0, 33.0, 31.0, 29.0, 41.0, 37.0, 52.0, 37.0, 41.0, 53.0, 50.0, 49.0, 53.0, 36.0, 48.0, 46.0, 52.0, 22.0, 30.0, 25.0, 31.0, 19.0, 17.0, 12.0, 11.0, 14.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.870329856872559, -6.616978645324707, -6.3636274337768555, -6.110276222229004, -5.856925010681152, -5.603573799133301, -5.350222587585449, -5.096871376037598, -4.843520164489746, -4.5901689529418945, -4.336817741394043, -4.083466529846191, -3.83011531829834, -3.5767641067504883, -3.3234126567840576, -3.070061445236206, -2.8167099952697754, -2.563358783721924, -2.3100075721740723, -2.0566563606262207, -1.8033050298690796, -1.549953818321228, -1.296602487564087, -1.0432512760162354, -0.7899000644683838, -0.5365488529205322, -0.2831975817680359, -0.02984631061553955, 0.223504900932312, 0.4768561124801636, 0.7302074432373047, 0.9835586547851562, 1.2369098663330078, 1.4902610778808594, 1.743612289428711, 1.996963620185852, 2.250314712524414, 2.5036659240722656, 2.7570173740386963, 3.010368585586548, 3.2637197971343994, 3.517071008682251, 3.7704222202301025, 4.023773670196533, 4.277124881744385, 4.530476093292236, 4.783827304840088, 5.0371785163879395, 5.290529727935791, 5.543880939483643, 5.797232151031494, 6.050583362579346, 6.303934574127197, 6.557285785675049, 6.810637474060059, 7.06398868560791, 7.317339897155762, 7.570691108703613, 7.824042320251465, 8.077393531799316, 8.330744743347168, 8.58409595489502, 8.837447166442871, 9.090798377990723, 9.344149589538574]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 17.0, 16.0, 25.0, 35.0, 56.0, 79.0, 136.0, 253.0, 383.0, 654.0, 1242.0, 2582.0, 6131.0, 15447.0, 44591.0, 142836.0, 376354.0, 303956.0, 100641.0, 32075.0, 11675.0, 4720.0, 2162.0, 998.0, 556.0, 336.0, 187.0, 117.0, 80.0, 58.0, 33.0, 26.0, 15.0, 21.0, 9.0, 5.0, 11.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.5390625, -5.380126953125, -5.22119140625, -5.062255859375, -4.9033203125, -4.744384765625, -4.58544921875, -4.426513671875, -4.267578125, -4.108642578125, -3.94970703125, -3.790771484375, -3.6318359375, -3.472900390625, -3.31396484375, -3.155029296875, -2.99609375, -2.837158203125, -2.67822265625, -2.519287109375, -2.3603515625, -2.201416015625, -2.04248046875, -1.883544921875, -1.724609375, -1.565673828125, -1.40673828125, -1.247802734375, -1.0888671875, -0.929931640625, -0.77099609375, -0.612060546875, -0.453125, -0.294189453125, -0.13525390625, 0.023681640625, 0.1826171875, 0.341552734375, 0.50048828125, 0.659423828125, 0.818359375, 0.977294921875, 1.13623046875, 1.295166015625, 1.4541015625, 1.613037109375, 1.77197265625, 1.930908203125, 2.08984375, 2.248779296875, 2.40771484375, 2.566650390625, 2.7255859375, 2.884521484375, 3.04345703125, 3.202392578125, 3.361328125, 3.520263671875, 3.67919921875, 3.838134765625, 3.9970703125, 4.156005859375, 4.31494140625, 4.473876953125, 4.6328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 9.0, 8.0, 18.0, 12.0, 30.0, 30.0, 28.0, 32.0, 38.0, 36.0, 63.0, 55.0, 44.0, 54.0, 41.0, 58.0, 55.0, 48.0, 49.0, 42.0, 29.0, 40.0, 37.0, 18.0, 21.0, 10.0, 12.0, 15.0, 10.0, 8.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.111328125, -2.997039794921875, -2.88275146484375, -2.768463134765625, -2.6541748046875, -2.539886474609375, -2.42559814453125, -2.311309814453125, -2.197021484375, -2.082733154296875, -1.96844482421875, -1.854156494140625, -1.7398681640625, -1.625579833984375, -1.51129150390625, -1.397003173828125, -1.28271484375, -1.168426513671875, -1.05413818359375, -0.939849853515625, -0.8255615234375, -0.711273193359375, -0.59698486328125, -0.482696533203125, -0.368408203125, -0.254119873046875, -0.13983154296875, -0.025543212890625, 0.0887451171875, 0.203033447265625, 0.31732177734375, 0.431610107421875, 0.5458984375, 0.660186767578125, 0.77447509765625, 0.888763427734375, 1.0030517578125, 1.117340087890625, 1.23162841796875, 1.345916748046875, 1.460205078125, 1.574493408203125, 1.68878173828125, 1.803070068359375, 1.9173583984375, 2.031646728515625, 2.14593505859375, 2.260223388671875, 2.37451171875, 2.488800048828125, 2.60308837890625, 2.717376708984375, 2.8316650390625, 2.945953369140625, 3.06024169921875, 3.174530029296875, 3.288818359375, 3.403106689453125, 3.51739501953125, 3.631683349609375, 3.7459716796875, 3.860260009765625, 3.97454833984375, 4.088836669921875, 4.203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 21.0, 25.0, 43.0, 50.0, 88.0, 167.0, 347.0, 888.0, 3133.0, 25317.0, 730585.0, 272563.0, 12043.0, 1991.0, 646.0, 272.0, 123.0, 70.0, 42.0, 35.0, 26.0, 18.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.1641845703125, -15.672119140625, -15.1800537109375, -14.68798828125, -14.1959228515625, -13.703857421875, -13.2117919921875, -12.7197265625, -12.2276611328125, -11.735595703125, -11.2435302734375, -10.75146484375, -10.2593994140625, -9.767333984375, -9.2752685546875, -8.783203125, -8.2911376953125, -7.799072265625, -7.3070068359375, -6.81494140625, -6.3228759765625, -5.830810546875, -5.3387451171875, -4.8466796875, -4.3546142578125, -3.862548828125, -3.3704833984375, -2.87841796875, -2.3863525390625, -1.894287109375, -1.4022216796875, -0.91015625, -0.4180908203125, 0.073974609375, 0.5660400390625, 1.05810546875, 1.5501708984375, 2.042236328125, 2.5343017578125, 3.0263671875, 3.5184326171875, 4.010498046875, 4.5025634765625, 4.99462890625, 5.4866943359375, 5.978759765625, 6.4708251953125, 6.962890625, 7.4549560546875, 7.947021484375, 8.4390869140625, 8.93115234375, 9.4232177734375, 9.915283203125, 10.4073486328125, 10.8994140625, 11.3914794921875, 11.883544921875, 12.3756103515625, 12.86767578125, 13.3597412109375, 13.851806640625, 14.3438720703125, 14.8359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 11.0, 8.0, 14.0, 13.0, 17.0, 17.0, 25.0, 25.0, 33.0, 40.0, 35.0, 48.0, 51.0, 49.0, 64.0, 47.0, 56.0, 55.0, 57.0, 51.0, 48.0, 40.0, 26.0, 42.0, 16.0, 17.0, 16.0, 20.0, 11.0, 13.0, 9.0, 5.0, 7.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.9102783203125, -17.398681640625, -16.8870849609375, -16.37548828125, -15.8638916015625, -15.352294921875, -14.8406982421875, -14.3291015625, -13.8175048828125, -13.305908203125, -12.7943115234375, -12.28271484375, -11.7711181640625, -11.259521484375, -10.7479248046875, -10.236328125, -9.7247314453125, -9.213134765625, -8.7015380859375, -8.18994140625, -7.6783447265625, -7.166748046875, -6.6551513671875, -6.1435546875, -5.6319580078125, -5.120361328125, -4.6087646484375, -4.09716796875, -3.5855712890625, -3.073974609375, -2.5623779296875, -2.05078125, -1.5391845703125, -1.027587890625, -0.5159912109375, -0.00439453125, 0.5072021484375, 1.018798828125, 1.5303955078125, 2.0419921875, 2.5535888671875, 3.065185546875, 3.5767822265625, 4.08837890625, 4.5999755859375, 5.111572265625, 5.6231689453125, 6.134765625, 6.6463623046875, 7.157958984375, 7.6695556640625, 8.18115234375, 8.6927490234375, 9.204345703125, 9.7159423828125, 10.2275390625, 10.7391357421875, 11.250732421875, 11.7623291015625, 12.27392578125, 12.7855224609375, 13.297119140625, 13.8087158203125, 14.3203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 5.0, 16.0, 21.0, 30.0, 51.0, 54.0, 93.0, 163.0, 338.0, 716.0, 2377.0, 12778.0, 186004.0, 786365.0, 51611.0, 5515.0, 1312.0, 473.0, 251.0, 145.0, 71.0, 48.0, 35.0, 21.0, 18.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.921875, -5.78814697265625, -5.6544189453125, -5.52069091796875, -5.386962890625, -5.25323486328125, -5.1195068359375, -4.98577880859375, -4.85205078125, -4.71832275390625, -4.5845947265625, -4.45086669921875, -4.317138671875, -4.18341064453125, -4.0496826171875, -3.91595458984375, -3.7822265625, -3.64849853515625, -3.5147705078125, -3.38104248046875, -3.247314453125, -3.11358642578125, -2.9798583984375, -2.84613037109375, -2.71240234375, -2.57867431640625, -2.4449462890625, -2.31121826171875, -2.177490234375, -2.04376220703125, -1.9100341796875, -1.77630615234375, -1.642578125, -1.50885009765625, -1.3751220703125, -1.24139404296875, -1.107666015625, -0.97393798828125, -0.8402099609375, -0.70648193359375, -0.57275390625, -0.43902587890625, -0.3052978515625, -0.17156982421875, -0.037841796875, 0.09588623046875, 0.2296142578125, 0.36334228515625, 0.4970703125, 0.63079833984375, 0.7645263671875, 0.89825439453125, 1.031982421875, 1.16571044921875, 1.2994384765625, 1.43316650390625, 1.56689453125, 1.70062255859375, 1.8343505859375, 1.96807861328125, 2.101806640625, 2.23553466796875, 2.3692626953125, 2.50299072265625, 2.63671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 6.0, 15.0, 19.0, 12.0, 22.0, 21.0, 31.0, 50.0, 53.0, 83.0, 120.0, 157.0, 100.0, 47.0, 42.0, 34.0, 37.0, 30.0, 20.0, 24.0, 12.0, 7.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007152557373046875, -0.0006960704922676086, -0.0006768852472305298, -0.0006577000021934509, -0.0006385147571563721, -0.0006193295121192932, -0.0006001442670822144, -0.0005809590220451355, -0.0005617737770080566, -0.0005425885319709778, -0.0005234032869338989, -0.0005042180418968201, -0.0004850327968597412, -0.00046584755182266235, -0.0004466623067855835, -0.00042747706174850464, -0.0004082918167114258, -0.0003891065716743469, -0.00036992132663726807, -0.0003507360816001892, -0.00033155083656311035, -0.0003123655915260315, -0.00029318034648895264, -0.0002739951014518738, -0.0002548098564147949, -0.00023562461137771606, -0.0002164393663406372, -0.00019725412130355835, -0.0001780688762664795, -0.00015888363122940063, -0.00013969838619232178, -0.00012051314115524292, -0.00010132789611816406, -8.21426510810852e-05, -6.295740604400635e-05, -4.377216100692749e-05, -2.4586915969848633e-05, -5.401670932769775e-06, 1.3783574104309082e-05, 3.296881914138794e-05, 5.21540641784668e-05, 7.133930921554565e-05, 9.052455425262451e-05, 0.00010970979928970337, 0.00012889504432678223, 0.00014808028936386108, 0.00016726553440093994, 0.0001864507794380188, 0.00020563602447509766, 0.00022482126951217651, 0.00024400651454925537, 0.00026319175958633423, 0.0002823770046234131, 0.00030156224966049194, 0.0003207474946975708, 0.00033993273973464966, 0.0003591179847717285, 0.0003783032298088074, 0.00039748847484588623, 0.0004166737198829651, 0.00043585896492004395, 0.0004550442099571228, 0.00047422945499420166, 0.0004934147000312805, 0.0005125999450683594]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 9.0, 9.0, 21.0, 16.0, 46.0, 81.0, 132.0, 243.0, 586.0, 1489.0, 4739.0, 25433.0, 446387.0, 533415.0, 28146.0, 5077.0, 1531.0, 600.0, 254.0, 118.0, 68.0, 40.0, 22.0, 18.0, 12.0, 7.0, 6.0, 11.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.38671875, -5.218505859375, -5.05029296875, -4.882080078125, -4.7138671875, -4.545654296875, -4.37744140625, -4.209228515625, -4.041015625, -3.872802734375, -3.70458984375, -3.536376953125, -3.3681640625, -3.199951171875, -3.03173828125, -2.863525390625, -2.6953125, -2.527099609375, -2.35888671875, -2.190673828125, -2.0224609375, -1.854248046875, -1.68603515625, -1.517822265625, -1.349609375, -1.181396484375, -1.01318359375, -0.844970703125, -0.6767578125, -0.508544921875, -0.34033203125, -0.172119140625, -0.00390625, 0.164306640625, 0.33251953125, 0.500732421875, 0.6689453125, 0.837158203125, 1.00537109375, 1.173583984375, 1.341796875, 1.510009765625, 1.67822265625, 1.846435546875, 2.0146484375, 2.182861328125, 2.35107421875, 2.519287109375, 2.6875, 2.855712890625, 3.02392578125, 3.192138671875, 3.3603515625, 3.528564453125, 3.69677734375, 3.864990234375, 4.033203125, 4.201416015625, 4.36962890625, 4.537841796875, 4.7060546875, 4.874267578125, 5.04248046875, 5.210693359375, 5.37890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 1.0, 9.0, 7.0, 7.0, 11.0, 16.0, 16.0, 24.0, 29.0, 60.0, 47.0, 51.0, 76.0, 83.0, 115.0, 111.0, 68.0, 70.0, 35.0, 38.0, 30.0, 20.0, 17.0, 14.0, 10.0, 5.0, 5.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.253173828125, -3.14306640625, -3.032958984375, -2.9228515625, -2.812744140625, -2.70263671875, -2.592529296875, -2.482421875, -2.372314453125, -2.26220703125, -2.152099609375, -2.0419921875, -1.931884765625, -1.82177734375, -1.711669921875, -1.6015625, -1.491455078125, -1.38134765625, -1.271240234375, -1.1611328125, -1.051025390625, -0.94091796875, -0.830810546875, -0.720703125, -0.610595703125, -0.50048828125, -0.390380859375, -0.2802734375, -0.170166015625, -0.06005859375, 0.050048828125, 0.16015625, 0.270263671875, 0.38037109375, 0.490478515625, 0.6005859375, 0.710693359375, 0.82080078125, 0.930908203125, 1.041015625, 1.151123046875, 1.26123046875, 1.371337890625, 1.4814453125, 1.591552734375, 1.70166015625, 1.811767578125, 1.921875, 2.031982421875, 2.14208984375, 2.252197265625, 2.3623046875, 2.472412109375, 2.58251953125, 2.692626953125, 2.802734375, 2.912841796875, 3.02294921875, 3.133056640625, 3.2431640625, 3.353271484375, 3.46337890625, 3.573486328125, 3.68359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 8.0, 10.0, 32.0, 87.0, 283.0, 332.0, 181.0, 44.0, 16.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.99026489257812, -136.7591552734375, -132.52804565429688, -128.29693603515625, -124.0658187866211, -119.83470916748047, -115.60359191894531, -111.37248229980469, -107.14137268066406, -102.91026306152344, -98.67915344238281, -94.44803619384766, -90.21692657470703, -85.9858169555664, -81.75469970703125, -77.52359008789062, -73.29248046875, -69.06137084960938, -64.83026123046875, -60.599143981933594, -56.36803436279297, -52.136924743652344, -47.90581130981445, -43.67469787597656, -39.44358825683594, -35.21247863769531, -30.981365203857422, -26.750253677368164, -22.519142150878906, -18.28803062438965, -14.05691909790039, -9.825807571411133, -5.594696044921875, -1.3635845184326172, 2.8675270080566406, 7.098638534545898, 11.329750061035156, 15.560861587524414, 19.791973114013672, 24.02308464050293, 28.254196166992188, 32.48530578613281, 36.7164192199707, 40.947532653808594, 45.17864227294922, 49.409751892089844, 53.640865325927734, 57.871978759765625, 62.10308837890625, 66.33419799804688, 70.5653076171875, 74.79642486572266, 79.02753448486328, 83.2586441040039, 87.48976135253906, 91.72087097167969, 95.95198059082031, 100.18309020996094, 104.41419982910156, 108.64531707763672, 112.87642669677734, 117.10753631591797, 121.33865356445312, 125.56976318359375, 129.80087280273438]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 5.0, 8.0, 10.0, 19.0, 11.0, 18.0, 19.0, 19.0, 19.0, 31.0, 26.0, 32.0, 47.0, 33.0, 46.0, 39.0, 51.0, 51.0, 43.0, 58.0, 32.0, 39.0, 26.0, 46.0, 32.0, 42.0, 23.0, 22.0, 23.0, 14.0, 19.0, 18.0, 10.0, 7.0, 6.0, 5.0, 5.0, 4.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-56.064056396484375, -54.36747741699219, -52.670902252197266, -50.97432327270508, -49.27774429321289, -47.58116912841797, -45.88459014892578, -44.188011169433594, -42.491432189941406, -40.79485321044922, -39.0982780456543, -37.40169906616211, -35.70512008666992, -34.008544921875, -32.31196594238281, -30.615386962890625, -28.91880989074707, -27.222232818603516, -25.525653839111328, -23.829076766967773, -22.132497787475586, -20.43592071533203, -18.739341735839844, -17.04276466369629, -15.346186637878418, -13.649608612060547, -11.953030586242676, -10.256452560424805, -8.55987548828125, -6.863297462463379, -5.166719436645508, -3.4701414108276367, -1.7735633850097656, -0.07698547840118408, 1.6195924282073975, 3.3161702156066895, 5.0127482414245605, 6.709325790405273, 8.405903816223145, 10.102481842041016, 11.799059867858887, 13.495637893676758, 15.192215919494629, 16.8887939453125, 18.585371017456055, 20.28194808959961, 21.978527069091797, 23.675106048583984, 25.37168312072754, 27.068260192871094, 28.76483917236328, 30.461416244506836, 32.15799331665039, 33.85457229614258, 35.551151275634766, 37.24772644042969, 38.944305419921875, 40.64088439941406, 42.337459564208984, 44.03403854370117, 45.73061752319336, 47.42719268798828, 49.12377166748047, 50.820350646972656, 52.516929626464844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 11.0, 10.0, 19.0, 32.0, 69.0, 141.0, 273.0, 587.0, 1229.0, 2921.0, 8644.0, 40727.0, 1043783.0, 2995361.0, 81271.0, 12385.0, 4010.0, 1460.0, 646.0, 338.0, 169.0, 83.0, 44.0, 22.0, 17.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.59375, -8.3848876953125, -8.176025390625, -7.9671630859375, -7.75830078125, -7.5494384765625, -7.340576171875, -7.1317138671875, -6.9228515625, -6.7139892578125, -6.505126953125, -6.2962646484375, -6.08740234375, -5.8785400390625, -5.669677734375, -5.4608154296875, -5.251953125, -5.0430908203125, -4.834228515625, -4.6253662109375, -4.41650390625, -4.2076416015625, -3.998779296875, -3.7899169921875, -3.5810546875, -3.3721923828125, -3.163330078125, -2.9544677734375, -2.74560546875, -2.5367431640625, -2.327880859375, -2.1190185546875, -1.91015625, -1.7012939453125, -1.492431640625, -1.2835693359375, -1.07470703125, -0.8658447265625, -0.656982421875, -0.4481201171875, -0.2392578125, -0.0303955078125, 0.178466796875, 0.3873291015625, 0.59619140625, 0.8050537109375, 1.013916015625, 1.2227783203125, 1.431640625, 1.6405029296875, 1.849365234375, 2.0582275390625, 2.26708984375, 2.4759521484375, 2.684814453125, 2.8936767578125, 3.1025390625, 3.3114013671875, 3.520263671875, 3.7291259765625, 3.93798828125, 4.1468505859375, 4.355712890625, 4.5645751953125, 4.7734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 6.0, 9.0, 12.0, 11.0, 11.0, 22.0, 28.0, 28.0, 18.0, 49.0, 53.0, 57.0, 44.0, 64.0, 59.0, 57.0, 57.0, 67.0, 40.0, 66.0, 29.0, 32.0, 44.0, 20.0, 26.0, 25.0, 14.0, 11.0, 4.0, 4.0, 5.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.899139404296875, -2.78851318359375, -2.677886962890625, -2.5672607421875, -2.456634521484375, -2.34600830078125, -2.235382080078125, -2.124755859375, -2.014129638671875, -1.90350341796875, -1.792877197265625, -1.6822509765625, -1.571624755859375, -1.46099853515625, -1.350372314453125, -1.23974609375, -1.129119873046875, -1.01849365234375, -0.907867431640625, -0.7972412109375, -0.686614990234375, -0.57598876953125, -0.465362548828125, -0.354736328125, -0.244110107421875, -0.13348388671875, -0.022857666015625, 0.0877685546875, 0.198394775390625, 0.30902099609375, 0.419647216796875, 0.5302734375, 0.640899658203125, 0.75152587890625, 0.862152099609375, 0.9727783203125, 1.083404541015625, 1.19403076171875, 1.304656982421875, 1.415283203125, 1.525909423828125, 1.63653564453125, 1.747161865234375, 1.8577880859375, 1.968414306640625, 2.07904052734375, 2.189666748046875, 2.30029296875, 2.410919189453125, 2.52154541015625, 2.632171630859375, 2.7427978515625, 2.853424072265625, 2.96405029296875, 3.074676513671875, 3.185302734375, 3.295928955078125, 3.40655517578125, 3.517181396484375, 3.6278076171875, 3.738433837890625, 3.84906005859375, 3.959686279296875, 4.0703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 14.0, 18.0, 43.0, 62.0, 121.0, 311.0, 834.0, 2931.0, 12059.0, 114034.0, 3912780.0, 132727.0, 13267.0, 3300.0, 1028.0, 385.0, 151.0, 59.0, 42.0, 18.0, 16.0, 10.0, 10.0, 4.0, 6.0, 7.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1895751953125, -9.855712890625, -9.5218505859375, -9.18798828125, -8.8541259765625, -8.520263671875, -8.1864013671875, -7.8525390625, -7.5186767578125, -7.184814453125, -6.8509521484375, -6.51708984375, -6.1832275390625, -5.849365234375, -5.5155029296875, -5.181640625, -4.8477783203125, -4.513916015625, -4.1800537109375, -3.84619140625, -3.5123291015625, -3.178466796875, -2.8446044921875, -2.5107421875, -2.1768798828125, -1.843017578125, -1.5091552734375, -1.17529296875, -0.8414306640625, -0.507568359375, -0.1737060546875, 0.16015625, 0.4940185546875, 0.827880859375, 1.1617431640625, 1.49560546875, 1.8294677734375, 2.163330078125, 2.4971923828125, 2.8310546875, 3.1649169921875, 3.498779296875, 3.8326416015625, 4.16650390625, 4.5003662109375, 4.834228515625, 5.1680908203125, 5.501953125, 5.8358154296875, 6.169677734375, 6.5035400390625, 6.83740234375, 7.1712646484375, 7.505126953125, 7.8389892578125, 8.1728515625, 8.5067138671875, 8.840576171875, 9.1744384765625, 9.50830078125, 9.8421630859375, 10.176025390625, 10.5098876953125, 10.84375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 5.0, 8.0, 8.0, 15.0, 27.0, 20.0, 64.0, 93.0, 188.0, 372.0, 935.0, 1139.0, 625.0, 242.0, 131.0, 57.0, 37.0, 22.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98828125, -5.75042724609375, -5.5125732421875, -5.27471923828125, -5.036865234375, -4.79901123046875, -4.5611572265625, -4.32330322265625, -4.08544921875, -3.84759521484375, -3.6097412109375, -3.37188720703125, -3.134033203125, -2.89617919921875, -2.6583251953125, -2.42047119140625, -2.1826171875, -1.94476318359375, -1.7069091796875, -1.46905517578125, -1.231201171875, -0.99334716796875, -0.7554931640625, -0.51763916015625, -0.27978515625, -0.04193115234375, 0.1959228515625, 0.43377685546875, 0.671630859375, 0.90948486328125, 1.1473388671875, 1.38519287109375, 1.623046875, 1.86090087890625, 2.0987548828125, 2.33660888671875, 2.574462890625, 2.81231689453125, 3.0501708984375, 3.28802490234375, 3.52587890625, 3.76373291015625, 4.0015869140625, 4.23944091796875, 4.477294921875, 4.71514892578125, 4.9530029296875, 5.19085693359375, 5.4287109375, 5.66656494140625, 5.9044189453125, 6.14227294921875, 6.380126953125, 6.61798095703125, 6.8558349609375, 7.09368896484375, 7.33154296875, 7.56939697265625, 7.8072509765625, 8.04510498046875, 8.282958984375, 8.52081298828125, 8.7586669921875, 8.99652099609375, 9.234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 12.0, 20.0, 44.0, 114.0, 164.0, 223.0, 181.0, 112.0, 68.0, 18.0, 13.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.09721374511719, -70.97959899902344, -68.86198425292969, -66.7443618774414, -64.62674713134766, -62.509132385253906, -60.391517639160156, -58.27389907836914, -56.156280517578125, -54.038665771484375, -51.92104721069336, -49.80343246459961, -47.685813903808594, -45.568199157714844, -43.450584411621094, -41.33296585083008, -39.21535110473633, -37.09773635864258, -34.98011779785156, -32.86250305175781, -30.744884490966797, -28.627269744873047, -26.509653091430664, -24.39203643798828, -22.2744197845459, -20.156803131103516, -18.039186477661133, -15.921570777893066, -13.803954124450684, -11.6863374710083, -9.568721771240234, -7.451105117797852, -5.333484649658203, -3.2158682346343994, -1.0982518196105957, 1.019364356994629, 3.1369810104370117, 5.2545976638793945, 7.372213363647461, 9.489830017089844, 11.607446670532227, 13.72506332397461, 15.842679977416992, 17.960296630859375, 20.077911376953125, 22.19552993774414, 24.31314468383789, 26.430761337280273, 28.548377990722656, 30.66599464416504, 32.78361129760742, 34.90122604370117, 37.01884460449219, 39.13645935058594, 41.25407409667969, 43.3716926574707, 45.48931121826172, 47.60692596435547, 49.724544525146484, 51.842159271240234, 53.95977783203125, 56.077392578125, 58.19500732421875, 60.312625885009766, 62.430240631103516]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 9.0, 5.0, 15.0, 17.0, 17.0, 13.0, 17.0, 16.0, 27.0, 41.0, 35.0, 30.0, 43.0, 43.0, 48.0, 44.0, 36.0, 32.0, 49.0, 44.0, 38.0, 39.0, 42.0, 47.0, 33.0, 31.0, 39.0, 21.0, 27.0, 19.0, 12.0, 10.0, 13.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.870325088500977, -29.03856658935547, -28.206806182861328, -27.375045776367188, -26.54328727722168, -25.711528778076172, -24.87976837158203, -24.04800796508789, -23.216249465942383, -22.384490966796875, -21.552730560302734, -20.720970153808594, -19.889211654663086, -19.057453155517578, -18.225692749023438, -17.393932342529297, -16.56217384338379, -15.730414390563965, -14.89865493774414, -14.066895484924316, -13.235136032104492, -12.403376579284668, -11.571617126464844, -10.73985767364502, -9.908098220825195, -9.076338768005371, -8.244579315185547, -7.412819862365723, -6.581060409545898, -5.749300956726074, -4.91754150390625, -4.085782051086426, -3.2540225982666016, -2.4222631454467773, -1.5905036926269531, -0.7587442398071289, 0.07301521301269531, 0.9047746658325195, 1.7365341186523438, 2.568293571472168, 3.400053024291992, 4.231812477111816, 5.063571929931641, 5.895331382751465, 6.727090835571289, 7.558850288391113, 8.390609741210938, 9.222369194030762, 10.054128646850586, 10.88588809967041, 11.717647552490234, 12.549407005310059, 13.381166458129883, 14.212925910949707, 15.044685363769531, 15.876444816589355, 16.70820426940918, 17.539962768554688, 18.371723175048828, 19.20348358154297, 20.035242080688477, 20.867000579833984, 21.698760986328125, 22.530521392822266, 23.362279891967773]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 9.0, 14.0, 13.0, 20.0, 17.0, 63.0, 54.0, 102.0, 106.0, 182.0, 332.0, 482.0, 820.0, 1345.0, 2442.0, 4574.0, 8901.0, 17916.0, 39022.0, 87098.0, 195251.0, 317756.0, 202176.0, 90606.0, 40510.0, 18806.0, 9192.0, 4620.0, 2467.0, 1377.0, 857.0, 472.0, 307.0, 203.0, 126.0, 96.0, 62.0, 39.0, 21.0, 27.0, 21.0, 14.0, 4.0, 11.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.400390625, -3.29583740234375, -3.1912841796875, -3.08673095703125, -2.982177734375, -2.87762451171875, -2.7730712890625, -2.66851806640625, -2.56396484375, -2.45941162109375, -2.3548583984375, -2.25030517578125, -2.145751953125, -2.04119873046875, -1.9366455078125, -1.83209228515625, -1.7275390625, -1.62298583984375, -1.5184326171875, -1.41387939453125, -1.309326171875, -1.20477294921875, -1.1002197265625, -0.99566650390625, -0.89111328125, -0.78656005859375, -0.6820068359375, -0.57745361328125, -0.472900390625, -0.36834716796875, -0.2637939453125, -0.15924072265625, -0.0546875, 0.04986572265625, 0.1544189453125, 0.25897216796875, 0.363525390625, 0.46807861328125, 0.5726318359375, 0.67718505859375, 0.78173828125, 0.88629150390625, 0.9908447265625, 1.09539794921875, 1.199951171875, 1.30450439453125, 1.4090576171875, 1.51361083984375, 1.6181640625, 1.72271728515625, 1.8272705078125, 1.93182373046875, 2.036376953125, 2.14093017578125, 2.2454833984375, 2.35003662109375, 2.45458984375, 2.55914306640625, 2.6636962890625, 2.76824951171875, 2.872802734375, 2.97735595703125, 3.0819091796875, 3.18646240234375, 3.291015625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 8.0, 17.0, 12.0, 13.0, 12.0, 22.0, 36.0, 31.0, 39.0, 30.0, 43.0, 58.0, 51.0, 43.0, 54.0, 61.0, 48.0, 54.0, 52.0, 31.0, 40.0, 36.0, 34.0, 26.0, 31.0, 15.0, 10.0, 16.0, 14.0, 15.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.1585693359375, -3.065185546875, -2.9718017578125, -2.87841796875, -2.7850341796875, -2.691650390625, -2.5982666015625, -2.5048828125, -2.4114990234375, -2.318115234375, -2.2247314453125, -2.13134765625, -2.0379638671875, -1.944580078125, -1.8511962890625, -1.7578125, -1.6644287109375, -1.571044921875, -1.4776611328125, -1.38427734375, -1.2908935546875, -1.197509765625, -1.1041259765625, -1.0107421875, -0.9173583984375, -0.823974609375, -0.7305908203125, -0.63720703125, -0.5438232421875, -0.450439453125, -0.3570556640625, -0.263671875, -0.1702880859375, -0.076904296875, 0.0164794921875, 0.10986328125, 0.2032470703125, 0.296630859375, 0.3900146484375, 0.4833984375, 0.5767822265625, 0.670166015625, 0.7635498046875, 0.85693359375, 0.9503173828125, 1.043701171875, 1.1370849609375, 1.23046875, 1.3238525390625, 1.417236328125, 1.5106201171875, 1.60400390625, 1.6973876953125, 1.790771484375, 1.8841552734375, 1.9775390625, 2.0709228515625, 2.164306640625, 2.2576904296875, 2.35107421875, 2.4444580078125, 2.537841796875, 2.6312255859375, 2.724609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 16.0, 18.0, 47.0, 53.0, 129.0, 173.0, 312.0, 785.0, 2416.0, 14965.0, 670621.0, 345060.0, 10637.0, 1907.0, 725.0, 294.0, 141.0, 94.0, 47.0, 40.0, 16.0, 9.0, 9.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1256103515625, -14.602783203125, -14.0799560546875, -13.55712890625, -13.0343017578125, -12.511474609375, -11.9886474609375, -11.4658203125, -10.9429931640625, -10.420166015625, -9.8973388671875, -9.37451171875, -8.8516845703125, -8.328857421875, -7.8060302734375, -7.283203125, -6.7603759765625, -6.237548828125, -5.7147216796875, -5.19189453125, -4.6690673828125, -4.146240234375, -3.6234130859375, -3.1005859375, -2.5777587890625, -2.054931640625, -1.5321044921875, -1.00927734375, -0.4864501953125, 0.036376953125, 0.5592041015625, 1.08203125, 1.6048583984375, 2.127685546875, 2.6505126953125, 3.17333984375, 3.6961669921875, 4.218994140625, 4.7418212890625, 5.2646484375, 5.7874755859375, 6.310302734375, 6.8331298828125, 7.35595703125, 7.8787841796875, 8.401611328125, 8.9244384765625, 9.447265625, 9.9700927734375, 10.492919921875, 11.0157470703125, 11.53857421875, 12.0614013671875, 12.584228515625, 13.1070556640625, 13.6298828125, 14.1527099609375, 14.675537109375, 15.1983642578125, 15.72119140625, 16.2440185546875, 16.766845703125, 17.2896728515625, 17.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 16.0, 9.0, 18.0, 14.0, 19.0, 27.0, 32.0, 32.0, 47.0, 54.0, 44.0, 74.0, 67.0, 67.0, 66.0, 56.0, 73.0, 46.0, 45.0, 27.0, 28.0, 21.0, 22.0, 21.0, 13.0, 11.0, 6.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.1937255859375, -16.715576171875, -16.2374267578125, -15.75927734375, -15.2811279296875, -14.802978515625, -14.3248291015625, -13.8466796875, -13.3685302734375, -12.890380859375, -12.4122314453125, -11.93408203125, -11.4559326171875, -10.977783203125, -10.4996337890625, -10.021484375, -9.5433349609375, -9.065185546875, -8.5870361328125, -8.10888671875, -7.6307373046875, -7.152587890625, -6.6744384765625, -6.1962890625, -5.7181396484375, -5.239990234375, -4.7618408203125, -4.28369140625, -3.8055419921875, -3.327392578125, -2.8492431640625, -2.37109375, -1.8929443359375, -1.414794921875, -0.9366455078125, -0.45849609375, 0.0196533203125, 0.497802734375, 0.9759521484375, 1.4541015625, 1.9322509765625, 2.410400390625, 2.8885498046875, 3.36669921875, 3.8448486328125, 4.322998046875, 4.8011474609375, 5.279296875, 5.7574462890625, 6.235595703125, 6.7137451171875, 7.19189453125, 7.6700439453125, 8.148193359375, 8.6263427734375, 9.1044921875, 9.5826416015625, 10.060791015625, 10.5389404296875, 11.01708984375, 11.4952392578125, 11.973388671875, 12.4515380859375, 12.9296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 0.0, 4.0, 6.0, 10.0, 11.0, 20.0, 20.0, 52.0, 116.0, 422.0, 10522.0, 1034660.0, 2275.0, 241.0, 80.0, 50.0, 19.0, 15.0, 8.0, 3.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.40625, -32.534912109375, -31.66357421875, -30.792236328125, -29.9208984375, -29.049560546875, -28.17822265625, -27.306884765625, -26.435546875, -25.564208984375, -24.69287109375, -23.821533203125, -22.9501953125, -22.078857421875, -21.20751953125, -20.336181640625, -19.46484375, -18.593505859375, -17.72216796875, -16.850830078125, -15.9794921875, -15.108154296875, -14.23681640625, -13.365478515625, -12.494140625, -11.622802734375, -10.75146484375, -9.880126953125, -9.0087890625, -8.137451171875, -7.26611328125, -6.394775390625, -5.5234375, -4.652099609375, -3.78076171875, -2.909423828125, -2.0380859375, -1.166748046875, -0.29541015625, 0.575927734375, 1.447265625, 2.318603515625, 3.18994140625, 4.061279296875, 4.9326171875, 5.803955078125, 6.67529296875, 7.546630859375, 8.41796875, 9.289306640625, 10.16064453125, 11.031982421875, 11.9033203125, 12.774658203125, 13.64599609375, 14.517333984375, 15.388671875, 16.260009765625, 17.13134765625, 18.002685546875, 18.8740234375, 19.745361328125, 20.61669921875, 21.488037109375, 22.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 5.0, 16.0, 17.0, 17.0, 19.0, 31.0, 57.0, 98.0, 198.0, 225.0, 98.0, 65.0, 31.0, 35.0, 24.0, 15.0, 6.0, 11.0, 7.0, 3.0, 2.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009441375732421875, -0.0009063631296157837, -0.0008685886859893799, -0.0008308142423629761, -0.0007930397987365723, -0.0007552653551101685, -0.0007174909114837646, -0.0006797164678573608, -0.000641942024230957, -0.0006041675806045532, -0.0005663931369781494, -0.0005286186933517456, -0.0004908442497253418, -0.000453069806098938, -0.0004152953624725342, -0.00037752091884613037, -0.00033974647521972656, -0.00030197203159332275, -0.00026419758796691895, -0.00022642314434051514, -0.00018864870071411133, -0.00015087425708770752, -0.00011309981346130371, -7.53253698348999e-05, -3.7550926208496094e-05, 2.2351741790771484e-07, 3.7997961044311523e-05, 7.577240467071533e-05, 0.00011354684829711914, 0.00015132129192352295, 0.00018909573554992676, 0.00022687017917633057, 0.0002646446228027344, 0.0003024190664291382, 0.000340193510055542, 0.0003779679536819458, 0.0004157423973083496, 0.0004535168409347534, 0.0004912912845611572, 0.000529065728187561, 0.0005668401718139648, 0.0006046146154403687, 0.0006423890590667725, 0.0006801635026931763, 0.0007179379463195801, 0.0007557123899459839, 0.0007934868335723877, 0.0008312612771987915, 0.0008690357208251953, 0.0009068101644515991, 0.0009445846080780029, 0.0009823590517044067, 0.0010201334953308105, 0.0010579079389572144, 0.0010956823825836182, 0.001133456826210022, 0.0011712312698364258, 0.0012090057134628296, 0.0012467801570892334, 0.0012845546007156372, 0.001322329044342041, 0.0013601034879684448, 0.0013978779315948486, 0.0014356523752212524, 0.0014734268188476562]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 14.0, 16.0, 24.0, 35.0, 43.0, 80.0, 171.0, 318.0, 773.0, 1927.0, 6716.0, 434678.0, 593383.0, 6833.0, 1945.0, 737.0, 374.0, 168.0, 88.0, 56.0, 40.0, 21.0, 12.0, 21.0, 9.0, 9.0, 7.0, 6.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0, -23.314453125, -22.62890625, -21.943359375, -21.2578125, -20.572265625, -19.88671875, -19.201171875, -18.515625, -17.830078125, -17.14453125, -16.458984375, -15.7734375, -15.087890625, -14.40234375, -13.716796875, -13.03125, -12.345703125, -11.66015625, -10.974609375, -10.2890625, -9.603515625, -8.91796875, -8.232421875, -7.546875, -6.861328125, -6.17578125, -5.490234375, -4.8046875, -4.119140625, -3.43359375, -2.748046875, -2.0625, -1.376953125, -0.69140625, -0.005859375, 0.6796875, 1.365234375, 2.05078125, 2.736328125, 3.421875, 4.107421875, 4.79296875, 5.478515625, 6.1640625, 6.849609375, 7.53515625, 8.220703125, 8.90625, 9.591796875, 10.27734375, 10.962890625, 11.6484375, 12.333984375, 13.01953125, 13.705078125, 14.390625, 15.076171875, 15.76171875, 16.447265625, 17.1328125, 17.818359375, 18.50390625, 19.189453125, 19.875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 7.0, 10.0, 19.0, 34.0, 61.0, 154.0, 323.0, 216.0, 82.0, 26.0, 12.0, 12.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.78173828125, -10.3916015625, -10.00146484375, -9.611328125, -9.22119140625, -8.8310546875, -8.44091796875, -8.05078125, -7.66064453125, -7.2705078125, -6.88037109375, -6.490234375, -6.10009765625, -5.7099609375, -5.31982421875, -4.9296875, -4.53955078125, -4.1494140625, -3.75927734375, -3.369140625, -2.97900390625, -2.5888671875, -2.19873046875, -1.80859375, -1.41845703125, -1.0283203125, -0.63818359375, -0.248046875, 0.14208984375, 0.5322265625, 0.92236328125, 1.3125, 1.70263671875, 2.0927734375, 2.48291015625, 2.873046875, 3.26318359375, 3.6533203125, 4.04345703125, 4.43359375, 4.82373046875, 5.2138671875, 5.60400390625, 5.994140625, 6.38427734375, 6.7744140625, 7.16455078125, 7.5546875, 7.94482421875, 8.3349609375, 8.72509765625, 9.115234375, 9.50537109375, 9.8955078125, 10.28564453125, 10.67578125, 11.06591796875, 11.4560546875, 11.84619140625, 12.236328125, 12.62646484375, 13.0166015625, 13.40673828125, 13.796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 25.0, 93.0, 341.0, 371.0, 112.0, 35.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-250.1065673828125, -244.0308380126953, -237.95510864257812, -231.87937927246094, -225.80364990234375, -219.72792053222656, -213.65219116210938, -207.5764617919922, -201.500732421875, -195.4250030517578, -189.34927368164062, -183.27354431152344, -177.19781494140625, -171.12208557128906, -165.04635620117188, -158.9706268310547, -152.8948974609375, -146.8191680908203, -140.74343872070312, -134.66770935058594, -128.59197998046875, -122.51625061035156, -116.44052124023438, -110.36479187011719, -104.2890625, -98.21333312988281, -92.13760375976562, -86.06187438964844, -79.98614501953125, -73.91041564941406, -67.83468627929688, -61.75895690917969, -55.6832275390625, -49.60749816894531, -43.531768798828125, -37.45603942871094, -31.38031005859375, -25.304580688476562, -19.228851318359375, -13.153121948242188, -7.077392578125, -1.0016632080078125, 5.074066162109375, 11.149795532226562, 17.22552490234375, 23.301254272460938, 29.376983642578125, 35.45271301269531, 41.5284423828125, 47.60417175292969, 53.679901123046875, 59.75563049316406, 65.83135986328125, 71.90708923339844, 77.98281860351562, 84.05854797363281, 90.13427734375, 96.21000671386719, 102.28573608398438, 108.36146545410156, 114.43719482421875, 120.51292419433594, 126.58865356445312, 132.6643829345703, 138.7401123046875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 10.0, 12.0, 17.0, 25.0, 30.0, 30.0, 31.0, 56.0, 51.0, 65.0, 77.0, 79.0, 60.0, 73.0, 68.0, 66.0, 39.0, 38.0, 35.0, 33.0, 14.0, 15.0, 19.0, 13.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.08047485351562, -83.86880493164062, -81.65713500976562, -79.4454574584961, -77.2337875366211, -75.0221176147461, -72.8104476928711, -70.5987777709961, -68.38710021972656, -66.17543029785156, -63.9637565612793, -61.7520866394043, -59.54041290283203, -57.32874298095703, -55.11707305908203, -52.90540313720703, -50.69373321533203, -48.48206329345703, -46.270389556884766, -44.058719635009766, -41.8470458984375, -39.6353759765625, -37.4237060546875, -35.2120361328125, -33.000362396240234, -30.7886905670166, -28.57701873779297, -26.36534881591797, -24.153676986694336, -21.942005157470703, -19.730335235595703, -17.51866340637207, -15.306999206542969, -13.095327377319336, -10.88365650177002, -8.671985626220703, -6.46031379699707, -4.2486419677734375, -2.036971092224121, 0.1746997833251953, 2.386371612548828, 4.598042964935303, 6.809714317321777, 9.021385192871094, 11.233057022094727, 13.44472885131836, 15.656399726867676, 17.868070602416992, 20.079742431640625, 22.291414260864258, 24.50308609008789, 26.71475601196289, 28.926427841186523, 31.138099670410156, 33.349769592285156, 35.561439514160156, 37.77311325073242, 39.98478317260742, 42.19645690917969, 44.40812683105469, 46.61979675292969, 48.83147048950195, 51.04314041137695, 53.25481414794922, 55.46648406982422]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 16.0, 21.0, 29.0, 37.0, 78.0, 127.0, 236.0, 814.0, 199158.0, 3991465.0, 1627.0, 301.0, 147.0, 77.0, 58.0, 22.0, 17.0, 12.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -42.510009765625, -41.33251953125, -40.155029296875, -38.9775390625, -37.800048828125, -36.62255859375, -35.445068359375, -34.267578125, -33.090087890625, -31.91259765625, -30.735107421875, -29.5576171875, -28.380126953125, -27.20263671875, -26.025146484375, -24.84765625, -23.670166015625, -22.49267578125, -21.315185546875, -20.1376953125, -18.960205078125, -17.78271484375, -16.605224609375, -15.427734375, -14.250244140625, -13.07275390625, -11.895263671875, -10.7177734375, -9.540283203125, -8.36279296875, -7.185302734375, -6.0078125, -4.830322265625, -3.65283203125, -2.475341796875, -1.2978515625, -0.120361328125, 1.05712890625, 2.234619140625, 3.412109375, 4.589599609375, 5.76708984375, 6.944580078125, 8.1220703125, 9.299560546875, 10.47705078125, 11.654541015625, 12.83203125, 14.009521484375, 15.18701171875, 16.364501953125, 17.5419921875, 18.719482421875, 19.89697265625, 21.074462890625, 22.251953125, 23.429443359375, 24.60693359375, 25.784423828125, 26.9619140625, 28.139404296875, 29.31689453125, 30.494384765625, 31.671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 13.0, 23.0, 33.0, 37.0, 44.0, 57.0, 68.0, 74.0, 57.0, 95.0, 76.0, 87.0, 58.0, 76.0, 47.0, 34.0, 28.0, 26.0, 18.0, 10.0, 7.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.981292724609375, -5.82977294921875, -5.678253173828125, -5.5267333984375, -5.375213623046875, -5.22369384765625, -5.072174072265625, -4.920654296875, -4.769134521484375, -4.61761474609375, -4.466094970703125, -4.3145751953125, -4.163055419921875, -4.01153564453125, -3.860015869140625, -3.70849609375, -3.556976318359375, -3.40545654296875, -3.253936767578125, -3.1024169921875, -2.950897216796875, -2.79937744140625, -2.647857666015625, -2.496337890625, -2.344818115234375, -2.19329833984375, -2.041778564453125, -1.8902587890625, -1.738739013671875, -1.58721923828125, -1.435699462890625, -1.2841796875, -1.132659912109375, -0.98114013671875, -0.829620361328125, -0.6781005859375, -0.526580810546875, -0.37506103515625, -0.223541259765625, -0.072021484375, 0.079498291015625, 0.23101806640625, 0.382537841796875, 0.5340576171875, 0.685577392578125, 0.83709716796875, 0.988616943359375, 1.14013671875, 1.291656494140625, 1.44317626953125, 1.594696044921875, 1.7462158203125, 1.897735595703125, 2.04925537109375, 2.200775146484375, 2.352294921875, 2.503814697265625, 2.65533447265625, 2.806854248046875, 2.9583740234375, 3.109893798828125, 3.26141357421875, 3.412933349609375, 3.564453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 2.0, 6.0, 12.0, 9.0, 19.0, 20.0, 31.0, 26.0, 52.0, 61.0, 54.0, 95.0, 140.0, 245.0, 541.0, 1308.0, 3794.0, 12864.0, 67372.0, 2681492.0, 1363881.0, 47074.0, 10107.0, 2970.0, 997.0, 426.0, 234.0, 132.0, 81.0, 57.0, 39.0, 33.0, 32.0, 21.0, 17.0, 12.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.29986572265625, -6.0567626953125, -5.81365966796875, -5.570556640625, -5.32745361328125, -5.0843505859375, -4.84124755859375, -4.59814453125, -4.35504150390625, -4.1119384765625, -3.86883544921875, -3.625732421875, -3.38262939453125, -3.1395263671875, -2.89642333984375, -2.6533203125, -2.41021728515625, -2.1671142578125, -1.92401123046875, -1.680908203125, -1.43780517578125, -1.1947021484375, -0.95159912109375, -0.70849609375, -0.46539306640625, -0.2222900390625, 0.02081298828125, 0.263916015625, 0.50701904296875, 0.7501220703125, 0.99322509765625, 1.236328125, 1.47943115234375, 1.7225341796875, 1.96563720703125, 2.208740234375, 2.45184326171875, 2.6949462890625, 2.93804931640625, 3.18115234375, 3.42425537109375, 3.6673583984375, 3.91046142578125, 4.153564453125, 4.39666748046875, 4.6397705078125, 4.88287353515625, 5.1259765625, 5.36907958984375, 5.6121826171875, 5.85528564453125, 6.098388671875, 6.34149169921875, 6.5845947265625, 6.82769775390625, 7.07080078125, 7.31390380859375, 7.5570068359375, 7.80010986328125, 8.043212890625, 8.28631591796875, 8.5294189453125, 8.77252197265625, 9.015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 3.0, 6.0, 11.0, 6.0, 15.0, 7.0, 23.0, 38.0, 65.0, 114.0, 210.0, 374.0, 690.0, 887.0, 689.0, 412.0, 190.0, 132.0, 62.0, 36.0, 17.0, 14.0, 12.0, 10.0, 10.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-7.3125, -7.13629150390625, -6.9600830078125, -6.78387451171875, -6.607666015625, -6.43145751953125, -6.2552490234375, -6.07904052734375, -5.90283203125, -5.72662353515625, -5.5504150390625, -5.37420654296875, -5.197998046875, -5.02178955078125, -4.8455810546875, -4.66937255859375, -4.4931640625, -4.31695556640625, -4.1407470703125, -3.96453857421875, -3.788330078125, -3.61212158203125, -3.4359130859375, -3.25970458984375, -3.08349609375, -2.90728759765625, -2.7310791015625, -2.55487060546875, -2.378662109375, -2.20245361328125, -2.0262451171875, -1.85003662109375, -1.673828125, -1.49761962890625, -1.3214111328125, -1.14520263671875, -0.968994140625, -0.79278564453125, -0.6165771484375, -0.44036865234375, -0.26416015625, -0.08795166015625, 0.0882568359375, 0.26446533203125, 0.440673828125, 0.61688232421875, 0.7930908203125, 0.96929931640625, 1.1455078125, 1.32171630859375, 1.4979248046875, 1.67413330078125, 1.850341796875, 2.02655029296875, 2.2027587890625, 2.37896728515625, 2.55517578125, 2.73138427734375, 2.9075927734375, 3.08380126953125, 3.260009765625, 3.43621826171875, 3.6124267578125, 3.78863525390625, 3.96484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 11.0, 24.0, 42.0, 122.0, 236.0, 272.0, 184.0, 69.0, 23.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-140.1982421875, -137.35736083984375, -134.51649475097656, -131.6756134033203, -128.83474731445312, -125.9938735961914, -123.15299987792969, -120.31211853027344, -117.47125244140625, -114.63037872314453, -111.78950500488281, -108.9486312866211, -106.10775756835938, -103.26688385009766, -100.42601013183594, -97.58512878417969, -94.74425506591797, -91.90338134765625, -89.06250762939453, -86.22163391113281, -83.3807601928711, -80.53988647460938, -77.69900512695312, -74.85813903808594, -72.01725769042969, -69.17638397216797, -66.33551025390625, -63.49463653564453, -60.65376281738281, -57.812889099121094, -54.97201156616211, -52.13113784790039, -49.290260314941406, -46.44938659667969, -43.60851287841797, -40.76763916015625, -37.92676544189453, -35.08589172363281, -32.24501419067383, -29.40414047241211, -26.56326675415039, -23.722393035888672, -20.881519317626953, -18.0406436920166, -15.199769973754883, -12.358896255493164, -9.518020629882812, -6.677146911621094, -3.836273193359375, -0.995398998260498, 1.845475196838379, 4.686349868774414, 7.527223587036133, 10.368097305297852, 13.208972930908203, 16.049846649169922, 18.89072036743164, 21.73159408569336, 24.572467803955078, 27.41334342956543, 30.25421714782715, 33.0950927734375, 35.93596649169922, 38.77684020996094, 41.617713928222656]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 13.0, 17.0, 22.0, 25.0, 28.0, 48.0, 22.0, 43.0, 41.0, 44.0, 59.0, 52.0, 50.0, 53.0, 66.0, 60.0, 38.0, 37.0, 39.0, 36.0, 27.0, 27.0, 20.0, 19.0, 16.0, 17.0, 5.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-27.459341049194336, -26.670984268188477, -25.88262939453125, -25.09427261352539, -24.30591583251953, -23.517560958862305, -22.729204177856445, -21.94084930419922, -21.15249252319336, -20.3641357421875, -19.575780868530273, -18.787424087524414, -17.999069213867188, -17.210712432861328, -16.42235565185547, -15.633999824523926, -14.845643997192383, -14.05728816986084, -13.268932342529297, -12.480575561523438, -11.692219734191895, -10.903863906860352, -10.115507125854492, -9.32715129852295, -8.538795471191406, -7.750439643859863, -6.962083339691162, -6.173727035522461, -5.385371208190918, -4.597015380859375, -3.808659076690674, -3.0203027725219727, -2.2319488525390625, -1.4435927867889404, -0.6552367210388184, 0.1331193447113037, 0.9214754104614258, 1.7098314762115479, 2.49818754196167, 3.286543846130371, 4.074899673461914, 4.863255500793457, 5.651611804962158, 6.439968109130859, 7.228323936462402, 8.016679763793945, 8.805036544799805, 9.593392372131348, 10.38174819946289, 11.170104026794434, 11.958459854125977, 12.746816635131836, 13.535172462463379, 14.323528289794922, 15.111885070800781, 15.900240898132324, 16.688596725463867, 17.476953506469727, 18.265308380126953, 19.053665161132812, 19.842021942138672, 20.6303768157959, 21.418733596801758, 22.207088470458984, 22.995445251464844]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 10.0, 23.0, 29.0, 63.0, 135.0, 256.0, 823.0, 4263.0, 47029.0, 770152.0, 210846.0, 12387.0, 1756.0, 410.0, 172.0, 69.0, 38.0, 25.0, 17.0, 13.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8125, -15.3701171875, -14.927734375, -14.4853515625, -14.04296875, -13.6005859375, -13.158203125, -12.7158203125, -12.2734375, -11.8310546875, -11.388671875, -10.9462890625, -10.50390625, -10.0615234375, -9.619140625, -9.1767578125, -8.734375, -8.2919921875, -7.849609375, -7.4072265625, -6.96484375, -6.5224609375, -6.080078125, -5.6376953125, -5.1953125, -4.7529296875, -4.310546875, -3.8681640625, -3.42578125, -2.9833984375, -2.541015625, -2.0986328125, -1.65625, -1.2138671875, -0.771484375, -0.3291015625, 0.11328125, 0.5556640625, 0.998046875, 1.4404296875, 1.8828125, 2.3251953125, 2.767578125, 3.2099609375, 3.65234375, 4.0947265625, 4.537109375, 4.9794921875, 5.421875, 5.8642578125, 6.306640625, 6.7490234375, 7.19140625, 7.6337890625, 8.076171875, 8.5185546875, 8.9609375, 9.4033203125, 9.845703125, 10.2880859375, 10.73046875, 11.1728515625, 11.615234375, 12.0576171875, 12.5]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 3.0, 9.0, 11.0, 11.0, 18.0, 19.0, 24.0, 38.0, 29.0, 38.0, 61.0, 54.0, 71.0, 69.0, 47.0, 68.0, 58.0, 70.0, 49.0, 58.0, 40.0, 33.0, 30.0, 20.0, 13.0, 13.0, 7.0, 12.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.10321044921875, -3.9837646484375, -3.86431884765625, -3.744873046875, -3.62542724609375, -3.5059814453125, -3.38653564453125, -3.26708984375, -3.14764404296875, -3.0281982421875, -2.90875244140625, -2.789306640625, -2.66986083984375, -2.5504150390625, -2.43096923828125, -2.3115234375, -2.19207763671875, -2.0726318359375, -1.95318603515625, -1.833740234375, -1.71429443359375, -1.5948486328125, -1.47540283203125, -1.35595703125, -1.23651123046875, -1.1170654296875, -0.99761962890625, -0.878173828125, -0.75872802734375, -0.6392822265625, -0.51983642578125, -0.400390625, -0.28094482421875, -0.1614990234375, -0.04205322265625, 0.077392578125, 0.19683837890625, 0.3162841796875, 0.43572998046875, 0.55517578125, 0.67462158203125, 0.7940673828125, 0.91351318359375, 1.032958984375, 1.15240478515625, 1.2718505859375, 1.39129638671875, 1.5107421875, 1.63018798828125, 1.7496337890625, 1.86907958984375, 1.988525390625, 2.10797119140625, 2.2274169921875, 2.34686279296875, 2.46630859375, 2.58575439453125, 2.7052001953125, 2.82464599609375, 2.944091796875, 3.06353759765625, 3.1829833984375, 3.30242919921875, 3.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 5.0, 15.0, 9.0, 10.0, 24.0, 20.0, 29.0, 56.0, 68.0, 82.0, 133.0, 226.0, 349.0, 663.0, 1497.0, 3643.0, 10918.0, 44998.0, 287100.0, 591734.0, 80256.0, 17373.0, 5201.0, 1964.0, 919.0, 410.0, 266.0, 160.0, 94.0, 72.0, 53.0, 49.0, 30.0, 25.0, 14.0, 18.0, 10.0, 11.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6171875, -8.349365234375, -8.08154296875, -7.813720703125, -7.5458984375, -7.278076171875, -7.01025390625, -6.742431640625, -6.474609375, -6.206787109375, -5.93896484375, -5.671142578125, -5.4033203125, -5.135498046875, -4.86767578125, -4.599853515625, -4.33203125, -4.064208984375, -3.79638671875, -3.528564453125, -3.2607421875, -2.992919921875, -2.72509765625, -2.457275390625, -2.189453125, -1.921630859375, -1.65380859375, -1.385986328125, -1.1181640625, -0.850341796875, -0.58251953125, -0.314697265625, -0.046875, 0.220947265625, 0.48876953125, 0.756591796875, 1.0244140625, 1.292236328125, 1.56005859375, 1.827880859375, 2.095703125, 2.363525390625, 2.63134765625, 2.899169921875, 3.1669921875, 3.434814453125, 3.70263671875, 3.970458984375, 4.23828125, 4.506103515625, 4.77392578125, 5.041748046875, 5.3095703125, 5.577392578125, 5.84521484375, 6.113037109375, 6.380859375, 6.648681640625, 6.91650390625, 7.184326171875, 7.4521484375, 7.719970703125, 7.98779296875, 8.255615234375, 8.5234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 9.0, 9.0, 10.0, 12.0, 13.0, 34.0, 24.0, 23.0, 28.0, 39.0, 32.0, 43.0, 51.0, 49.0, 67.0, 70.0, 43.0, 56.0, 56.0, 42.0, 54.0, 33.0, 27.0, 30.0, 24.0, 21.0, 21.0, 7.0, 9.0, 19.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.8046875, -14.3795166015625, -13.954345703125, -13.5291748046875, -13.10400390625, -12.6788330078125, -12.253662109375, -11.8284912109375, -11.4033203125, -10.9781494140625, -10.552978515625, -10.1278076171875, -9.70263671875, -9.2774658203125, -8.852294921875, -8.4271240234375, -8.001953125, -7.5767822265625, -7.151611328125, -6.7264404296875, -6.30126953125, -5.8760986328125, -5.450927734375, -5.0257568359375, -4.6005859375, -4.1754150390625, -3.750244140625, -3.3250732421875, -2.89990234375, -2.4747314453125, -2.049560546875, -1.6243896484375, -1.19921875, -0.7740478515625, -0.348876953125, 0.0762939453125, 0.50146484375, 0.9266357421875, 1.351806640625, 1.7769775390625, 2.2021484375, 2.6273193359375, 3.052490234375, 3.4776611328125, 3.90283203125, 4.3280029296875, 4.753173828125, 5.1783447265625, 5.603515625, 6.0286865234375, 6.453857421875, 6.8790283203125, 7.30419921875, 7.7293701171875, 8.154541015625, 8.5797119140625, 9.0048828125, 9.4300537109375, 9.855224609375, 10.2803955078125, 10.70556640625, 11.1307373046875, 11.555908203125, 11.9810791015625, 12.40625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 21.0, 41.0, 91.0, 320.0, 2409.0, 694280.0, 348760.0, 2150.0, 319.0, 74.0, 29.0, 23.0, 12.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.514404296875, -18.76318359375, -18.011962890625, -17.2607421875, -16.509521484375, -15.75830078125, -15.007080078125, -14.255859375, -13.504638671875, -12.75341796875, -12.002197265625, -11.2509765625, -10.499755859375, -9.74853515625, -8.997314453125, -8.24609375, -7.494873046875, -6.74365234375, -5.992431640625, -5.2412109375, -4.489990234375, -3.73876953125, -2.987548828125, -2.236328125, -1.485107421875, -0.73388671875, 0.017333984375, 0.7685546875, 1.519775390625, 2.27099609375, 3.022216796875, 3.7734375, 4.524658203125, 5.27587890625, 6.027099609375, 6.7783203125, 7.529541015625, 8.28076171875, 9.031982421875, 9.783203125, 10.534423828125, 11.28564453125, 12.036865234375, 12.7880859375, 13.539306640625, 14.29052734375, 15.041748046875, 15.79296875, 16.544189453125, 17.29541015625, 18.046630859375, 18.7978515625, 19.549072265625, 20.30029296875, 21.051513671875, 21.802734375, 22.553955078125, 23.30517578125, 24.056396484375, 24.8076171875, 25.558837890625, 26.31005859375, 27.061279296875, 27.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 10.0, 11.0, 16.0, 23.0, 25.0, 38.0, 46.0, 54.0, 106.0, 158.0, 173.0, 94.0, 66.0, 44.0, 27.0, 21.0, 19.0, 14.0, 6.0, 9.0, 8.0, 9.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007009506225585938, -0.0006676614284515381, -0.0006343722343444824, -0.0006010830402374268, -0.0005677938461303711, -0.0005345046520233154, -0.0005012154579162598, -0.0004679262638092041, -0.00043463706970214844, -0.0004013478755950928, -0.0003680586814880371, -0.00033476948738098145, -0.0003014802932739258, -0.0002681910991668701, -0.00023490190505981445, -0.0002016127109527588, -0.00016832351684570312, -0.00013503432273864746, -0.0001017451286315918, -6.845593452453613e-05, -3.516674041748047e-05, -1.8775463104248047e-06, 3.141164779663086e-05, 6.470084190368652e-05, 9.799003601074219e-05, 0.00013127923011779785, 0.00016456842422485352, 0.00019785761833190918, 0.00023114681243896484, 0.0002644360065460205, 0.00029772520065307617, 0.00033101439476013184, 0.0003643035888671875, 0.00039759278297424316, 0.00043088197708129883, 0.0004641711711883545, 0.0004974603652954102, 0.0005307495594024658, 0.0005640387535095215, 0.0005973279476165771, 0.0006306171417236328, 0.0006639063358306885, 0.0006971955299377441, 0.0007304847240447998, 0.0007637739181518555, 0.0007970631122589111, 0.0008303523063659668, 0.0008636415004730225, 0.0008969306945800781, 0.0009302198886871338, 0.0009635090827941895, 0.0009967982769012451, 0.0010300874710083008, 0.0010633766651153564, 0.0010966658592224121, 0.0011299550533294678, 0.0011632442474365234, 0.001196533441543579, 0.0012298226356506348, 0.0012631118297576904, 0.001296401023864746, 0.0013296902179718018, 0.0013629794120788574, 0.001396268606185913, 0.0014295578002929688]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 9.0, 23.0, 28.0, 54.0, 96.0, 187.0, 374.0, 933.0, 2909.0, 13124.0, 144780.0, 836124.0, 40701.0, 6308.0, 1669.0, 574.0, 268.0, 148.0, 90.0, 47.0, 31.0, 21.0, 14.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8824462890625, -9.624267578125, -9.3660888671875, -9.10791015625, -8.8497314453125, -8.591552734375, -8.3333740234375, -8.0751953125, -7.8170166015625, -7.558837890625, -7.3006591796875, -7.04248046875, -6.7843017578125, -6.526123046875, -6.2679443359375, -6.009765625, -5.7515869140625, -5.493408203125, -5.2352294921875, -4.97705078125, -4.7188720703125, -4.460693359375, -4.2025146484375, -3.9443359375, -3.6861572265625, -3.427978515625, -3.1697998046875, -2.91162109375, -2.6534423828125, -2.395263671875, -2.1370849609375, -1.87890625, -1.6207275390625, -1.362548828125, -1.1043701171875, -0.84619140625, -0.5880126953125, -0.329833984375, -0.0716552734375, 0.1865234375, 0.4447021484375, 0.702880859375, 0.9610595703125, 1.21923828125, 1.4774169921875, 1.735595703125, 1.9937744140625, 2.251953125, 2.5101318359375, 2.768310546875, 3.0264892578125, 3.28466796875, 3.5428466796875, 3.801025390625, 4.0592041015625, 4.3173828125, 4.5755615234375, 4.833740234375, 5.0919189453125, 5.35009765625, 5.6082763671875, 5.866455078125, 6.1246337890625, 6.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 8.0, 3.0, 10.0, 11.0, 12.0, 18.0, 19.0, 20.0, 48.0, 56.0, 108.0, 135.0, 158.0, 118.0, 76.0, 49.0, 37.0, 17.0, 18.0, 14.0, 16.0, 9.0, 8.0, 5.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.1243896484375, -5.959716796875, -5.7950439453125, -5.63037109375, -5.4656982421875, -5.301025390625, -5.1363525390625, -4.9716796875, -4.8070068359375, -4.642333984375, -4.4776611328125, -4.31298828125, -4.1483154296875, -3.983642578125, -3.8189697265625, -3.654296875, -3.4896240234375, -3.324951171875, -3.1602783203125, -2.99560546875, -2.8309326171875, -2.666259765625, -2.5015869140625, -2.3369140625, -2.1722412109375, -2.007568359375, -1.8428955078125, -1.67822265625, -1.5135498046875, -1.348876953125, -1.1842041015625, -1.01953125, -0.8548583984375, -0.690185546875, -0.5255126953125, -0.36083984375, -0.1961669921875, -0.031494140625, 0.1331787109375, 0.2978515625, 0.4625244140625, 0.627197265625, 0.7918701171875, 0.95654296875, 1.1212158203125, 1.285888671875, 1.4505615234375, 1.615234375, 1.7799072265625, 1.944580078125, 2.1092529296875, 2.27392578125, 2.4385986328125, 2.603271484375, 2.7679443359375, 2.9326171875, 3.0972900390625, 3.261962890625, 3.4266357421875, 3.59130859375, 3.7559814453125, 3.920654296875, 4.0853271484375, 4.25]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 11.0, 24.0, 177.0, 511.0, 201.0, 43.0, 14.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.90744018554688, -208.07186889648438, -201.23629760742188, -194.40072631835938, -187.56517028808594, -180.72959899902344, -173.89402770996094, -167.05845642089844, -160.22288513183594, -153.38731384277344, -146.55174255371094, -139.7161865234375, -132.880615234375, -126.0450439453125, -119.20947265625, -112.3739013671875, -105.53833770751953, -98.70276641845703, -91.86720275878906, -85.03163146972656, -78.19606018066406, -71.36048889160156, -64.5249252319336, -57.689353942871094, -50.85378646850586, -44.018218994140625, -37.182647705078125, -30.34708023071289, -23.511510848999023, -16.675941467285156, -9.840373992919922, -3.004802703857422, 3.8307647705078125, 10.66633415222168, 17.501903533935547, 24.33747100830078, 31.17304039001465, 38.008609771728516, 44.84417724609375, 51.67974853515625, 58.515316009521484, 65.35088348388672, 72.18645477294922, 79.02201843261719, 85.85758972167969, 92.69316101074219, 99.52873229980469, 106.36430358886719, 113.19986724853516, 120.03543853759766, 126.87100219726562, 133.70657348632812, 140.54214477539062, 147.37771606445312, 154.21328735351562, 161.04885864257812, 167.88441467285156, 174.71998596191406, 181.55555725097656, 188.39111328125, 195.2266845703125, 202.062255859375, 208.8978271484375, 215.7333984375, 222.5689697265625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 5.0, 0.0, 5.0, 3.0, 4.0, 12.0, 10.0, 14.0, 23.0, 9.0, 16.0, 14.0, 32.0, 31.0, 26.0, 39.0, 43.0, 49.0, 48.0, 64.0, 59.0, 71.0, 66.0, 51.0, 44.0, 38.0, 32.0, 35.0, 34.0, 26.0, 15.0, 13.0, 20.0, 14.0, 3.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.06634521484375, -45.186431884765625, -43.306522369384766, -41.42660903930664, -39.54669952392578, -37.666786193847656, -35.78687286376953, -33.906959533691406, -32.02705001831055, -30.147138595581055, -28.267227172851562, -26.387313842773438, -24.507402420043945, -22.627490997314453, -20.747577667236328, -18.867666244506836, -16.987754821777344, -15.107843399047852, -13.227931022644043, -11.348018646240234, -9.468107223510742, -7.58819580078125, -5.708283424377441, -3.828371047973633, -1.9484596252441406, -0.06854772567749023, 1.8113641738891602, 3.6912760734558105, 5.571187973022461, 7.451099395751953, 9.331011772155762, 11.21092414855957, 13.090835571289062, 14.970746994018555, 16.850658416748047, 18.730571746826172, 20.610483169555664, 22.490394592285156, 24.37030792236328, 26.250219345092773, 28.130130767822266, 30.010042190551758, 31.88995361328125, 33.769866943359375, 35.6497802734375, 37.52968978881836, 39.409603118896484, 41.289512634277344, 43.16942596435547, 45.049339294433594, 46.92924880981445, 48.80916213989258, 50.68907165527344, 52.56898498535156, 54.44889831542969, 56.32881164550781, 58.20872116088867, 60.0886344909668, 61.968544006347656, 63.84845733642578, 65.7283706665039, 67.6082763671875, 69.48818969726562, 71.36810302734375, 73.24801635742188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 4.0, 7.0, 9.0, 16.0, 30.0, 51.0, 64.0, 125.0, 253.0, 587.0, 1756.0, 8332.0, 115132.0, 3865147.0, 187832.0, 10876.0, 2454.0, 895.0, 354.0, 143.0, 83.0, 34.0, 22.0, 10.0, 10.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.1290283203125, -12.797119140625, -12.4652099609375, -12.13330078125, -11.8013916015625, -11.469482421875, -11.1375732421875, -10.8056640625, -10.4737548828125, -10.141845703125, -9.8099365234375, -9.47802734375, -9.1461181640625, -8.814208984375, -8.4822998046875, -8.150390625, -7.8184814453125, -7.486572265625, -7.1546630859375, -6.82275390625, -6.4908447265625, -6.158935546875, -5.8270263671875, -5.4951171875, -5.1632080078125, -4.831298828125, -4.4993896484375, -4.16748046875, -3.8355712890625, -3.503662109375, -3.1717529296875, -2.83984375, -2.5079345703125, -2.176025390625, -1.8441162109375, -1.51220703125, -1.1802978515625, -0.848388671875, -0.5164794921875, -0.1845703125, 0.1473388671875, 0.479248046875, 0.8111572265625, 1.14306640625, 1.4749755859375, 1.806884765625, 2.1387939453125, 2.470703125, 2.8026123046875, 3.134521484375, 3.4664306640625, 3.79833984375, 4.1302490234375, 4.462158203125, 4.7940673828125, 5.1259765625, 5.4578857421875, 5.789794921875, 6.1217041015625, 6.45361328125, 6.7855224609375, 7.117431640625, 7.4493408203125, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 13.0, 26.0, 30.0, 23.0, 40.0, 49.0, 61.0, 73.0, 68.0, 58.0, 47.0, 70.0, 70.0, 72.0, 50.0, 41.0, 36.0, 34.0, 24.0, 19.0, 10.0, 6.0, 14.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.73046875, -4.615570068359375, -4.50067138671875, -4.385772705078125, -4.2708740234375, -4.155975341796875, -4.04107666015625, -3.926177978515625, -3.811279296875, -3.696380615234375, -3.58148193359375, -3.466583251953125, -3.3516845703125, -3.236785888671875, -3.12188720703125, -3.006988525390625, -2.89208984375, -2.777191162109375, -2.66229248046875, -2.547393798828125, -2.4324951171875, -2.317596435546875, -2.20269775390625, -2.087799072265625, -1.972900390625, -1.858001708984375, -1.74310302734375, -1.628204345703125, -1.5133056640625, -1.398406982421875, -1.28350830078125, -1.168609619140625, -1.0537109375, -0.938812255859375, -0.82391357421875, -0.709014892578125, -0.5941162109375, -0.479217529296875, -0.36431884765625, -0.249420166015625, -0.134521484375, -0.019622802734375, 0.09527587890625, 0.210174560546875, 0.3250732421875, 0.439971923828125, 0.55487060546875, 0.669769287109375, 0.78466796875, 0.899566650390625, 1.01446533203125, 1.129364013671875, 1.2442626953125, 1.359161376953125, 1.47406005859375, 1.588958740234375, 1.703857421875, 1.818756103515625, 1.93365478515625, 2.048553466796875, 2.1634521484375, 2.278350830078125, 2.39324951171875, 2.508148193359375, 2.623046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 12.0, 13.0, 15.0, 23.0, 28.0, 65.0, 79.0, 104.0, 188.0, 318.0, 663.0, 1926.0, 7609.0, 49660.0, 1856533.0, 2207771.0, 56935.0, 8638.0, 2084.0, 753.0, 316.0, 171.0, 116.0, 69.0, 53.0, 38.0, 20.0, 14.0, 16.0, 10.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.1363525390625, -7.835205078125, -7.5340576171875, -7.23291015625, -6.9317626953125, -6.630615234375, -6.3294677734375, -6.0283203125, -5.7271728515625, -5.426025390625, -5.1248779296875, -4.82373046875, -4.5225830078125, -4.221435546875, -3.9202880859375, -3.619140625, -3.3179931640625, -3.016845703125, -2.7156982421875, -2.41455078125, -2.1134033203125, -1.812255859375, -1.5111083984375, -1.2099609375, -0.9088134765625, -0.607666015625, -0.3065185546875, -0.00537109375, 0.2957763671875, 0.596923828125, 0.8980712890625, 1.19921875, 1.5003662109375, 1.801513671875, 2.1026611328125, 2.40380859375, 2.7049560546875, 3.006103515625, 3.3072509765625, 3.6083984375, 3.9095458984375, 4.210693359375, 4.5118408203125, 4.81298828125, 5.1141357421875, 5.415283203125, 5.7164306640625, 6.017578125, 6.3187255859375, 6.619873046875, 6.9210205078125, 7.22216796875, 7.5233154296875, 7.824462890625, 8.1256103515625, 8.4267578125, 8.7279052734375, 9.029052734375, 9.3302001953125, 9.63134765625, 9.9324951171875, 10.233642578125, 10.5347900390625, 10.8359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 11.0, 9.0, 9.0, 18.0, 35.0, 55.0, 79.0, 157.0, 360.0, 765.0, 1035.0, 744.0, 364.0, 162.0, 98.0, 64.0, 34.0, 19.0, 12.0, 13.0, 10.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.90802001953125, -9.6285400390625, -9.34906005859375, -9.069580078125, -8.79010009765625, -8.5106201171875, -8.23114013671875, -7.95166015625, -7.67218017578125, -7.3927001953125, -7.11322021484375, -6.833740234375, -6.55426025390625, -6.2747802734375, -5.99530029296875, -5.7158203125, -5.43634033203125, -5.1568603515625, -4.87738037109375, -4.597900390625, -4.31842041015625, -4.0389404296875, -3.75946044921875, -3.47998046875, -3.20050048828125, -2.9210205078125, -2.64154052734375, -2.362060546875, -2.08258056640625, -1.8031005859375, -1.52362060546875, -1.244140625, -0.96466064453125, -0.6851806640625, -0.40570068359375, -0.126220703125, 0.15325927734375, 0.4327392578125, 0.71221923828125, 0.99169921875, 1.27117919921875, 1.5506591796875, 1.83013916015625, 2.109619140625, 2.38909912109375, 2.6685791015625, 2.94805908203125, 3.2275390625, 3.50701904296875, 3.7864990234375, 4.06597900390625, 4.345458984375, 4.62493896484375, 4.9044189453125, 5.18389892578125, 5.46337890625, 5.74285888671875, 6.0223388671875, 6.30181884765625, 6.581298828125, 6.86077880859375, 7.1402587890625, 7.41973876953125, 7.69921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 8.0, 23.0, 40.0, 87.0, 164.0, 222.0, 230.0, 115.0, 57.0, 19.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.66506576538086, -52.85368347167969, -50.042301177978516, -47.230918884277344, -44.41954040527344, -41.608158111572266, -38.796775817871094, -35.98539733886719, -33.17401123046875, -30.362628936767578, -27.55124855041504, -24.739866256713867, -21.928485870361328, -19.117103576660156, -16.305721282958984, -13.494340896606445, -10.682960510253906, -7.871579170227051, -5.060197353363037, -2.2488155364990234, 0.562565803527832, 3.3739471435546875, 6.185329437255859, 8.996709823608398, 11.80809211730957, 14.619473457336426, 17.43085479736328, 20.242237091064453, 23.053619384765625, 25.864999771118164, 28.676382064819336, 31.487762451171875, 34.29914855957031, 37.110530853271484, 39.921913146972656, 42.73329162597656, 45.544673919677734, 48.356056213378906, 51.16743850708008, 53.97882080078125, 56.790199279785156, 59.60158157348633, 62.4129638671875, 65.2243423461914, 68.03572845458984, 70.84710693359375, 73.65849304199219, 76.4698715209961, 79.28125, 82.0926284790039, 84.90401458740234, 87.71539306640625, 90.52677917480469, 93.3381576538086, 96.1495361328125, 98.96092224121094, 101.77230834960938, 104.58368682861328, 107.39507293701172, 110.20645141601562, 113.01783752441406, 115.82921600341797, 118.64059448242188, 121.45198059082031, 124.26335906982422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 8.0, 10.0, 5.0, 22.0, 15.0, 19.0, 27.0, 32.0, 27.0, 40.0, 32.0, 40.0, 52.0, 56.0, 60.0, 60.0, 52.0, 62.0, 52.0, 52.0, 51.0, 29.0, 35.0, 28.0, 26.0, 17.0, 16.0, 14.0, 16.0, 11.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-39.43090057373047, -38.29712677001953, -37.163352966308594, -36.02958297729492, -34.895809173583984, -33.76203536987305, -32.628265380859375, -31.494491577148438, -30.3607177734375, -29.226943969726562, -28.093172073364258, -26.959400177001953, -25.825626373291016, -24.691852569580078, -23.558080673217773, -22.42430877685547, -21.29053497314453, -20.156761169433594, -19.02298927307129, -17.889217376708984, -16.755443572998047, -15.621670722961426, -14.487897872924805, -13.354125022888184, -12.220352172851562, -11.086579322814941, -9.95280647277832, -8.8190336227417, -7.685260772705078, -6.551487922668457, -5.417715072631836, -4.283942222595215, -3.1501731872558594, -2.0164003372192383, -0.8826274871826172, 0.2511453628540039, 1.384918212890625, 2.518691062927246, 3.652463912963867, 4.786236763000488, 5.920009613037109, 7.0537824630737305, 8.187555313110352, 9.321328163146973, 10.455101013183594, 11.588873863220215, 12.722646713256836, 13.856419563293457, 14.990192413330078, 16.123966217041016, 17.25773811340332, 18.391510009765625, 19.525283813476562, 20.6590576171875, 21.792829513549805, 22.92660140991211, 24.060375213623047, 25.194149017333984, 26.32792091369629, 27.461692810058594, 28.59546661376953, 29.72924041748047, 30.863012313842773, 31.996784210205078, 33.130558013916016]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 5.0, 8.0, 7.0, 5.0, 9.0, 9.0, 12.0, 19.0, 29.0, 44.0, 107.0, 226.0, 697.0, 3159.0, 25790.0, 391726.0, 580001.0, 41089.0, 4239.0, 835.0, 257.0, 118.0, 48.0, 29.0, 28.0, 17.0, 17.0, 10.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.3919677734375, -10.971435546875, -10.5509033203125, -10.13037109375, -9.7098388671875, -9.289306640625, -8.8687744140625, -8.4482421875, -8.0277099609375, -7.607177734375, -7.1866455078125, -6.76611328125, -6.3455810546875, -5.925048828125, -5.5045166015625, -5.083984375, -4.6634521484375, -4.242919921875, -3.8223876953125, -3.40185546875, -2.9813232421875, -2.560791015625, -2.1402587890625, -1.7197265625, -1.2991943359375, -0.878662109375, -0.4581298828125, -0.03759765625, 0.3829345703125, 0.803466796875, 1.2239990234375, 1.64453125, 2.0650634765625, 2.485595703125, 2.9061279296875, 3.32666015625, 3.7471923828125, 4.167724609375, 4.5882568359375, 5.0087890625, 5.4293212890625, 5.849853515625, 6.2703857421875, 6.69091796875, 7.1114501953125, 7.531982421875, 7.9525146484375, 8.373046875, 8.7935791015625, 9.214111328125, 9.6346435546875, 10.05517578125, 10.4757080078125, 10.896240234375, 11.3167724609375, 11.7373046875, 12.1578369140625, 12.578369140625, 12.9989013671875, 13.41943359375, 13.8399658203125, 14.260498046875, 14.6810302734375, 15.1015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 18.0, 18.0, 27.0, 22.0, 45.0, 48.0, 47.0, 65.0, 64.0, 76.0, 68.0, 77.0, 81.0, 51.0, 57.0, 38.0, 41.0, 37.0, 24.0, 18.0, 15.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.418792724609375, -4.29071044921875, -4.162628173828125, -4.0345458984375, -3.906463623046875, -3.77838134765625, -3.650299072265625, -3.522216796875, -3.394134521484375, -3.26605224609375, -3.137969970703125, -3.0098876953125, -2.881805419921875, -2.75372314453125, -2.625640869140625, -2.49755859375, -2.369476318359375, -2.24139404296875, -2.113311767578125, -1.9852294921875, -1.857147216796875, -1.72906494140625, -1.600982666015625, -1.472900390625, -1.344818115234375, -1.21673583984375, -1.088653564453125, -0.9605712890625, -0.832489013671875, -0.70440673828125, -0.576324462890625, -0.4482421875, -0.320159912109375, -0.19207763671875, -0.063995361328125, 0.0640869140625, 0.192169189453125, 0.32025146484375, 0.448333740234375, 0.576416015625, 0.704498291015625, 0.83258056640625, 0.960662841796875, 1.0887451171875, 1.216827392578125, 1.34490966796875, 1.472991943359375, 1.60107421875, 1.729156494140625, 1.85723876953125, 1.985321044921875, 2.1134033203125, 2.241485595703125, 2.36956787109375, 2.497650146484375, 2.625732421875, 2.753814697265625, 2.88189697265625, 3.009979248046875, 3.1380615234375, 3.266143798828125, 3.39422607421875, 3.522308349609375, 3.650390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 11.0, 15.0, 30.0, 29.0, 70.0, 85.0, 159.0, 300.0, 633.0, 1529.0, 4576.0, 33670.0, 819600.0, 172510.0, 10939.0, 2414.0, 941.0, 428.0, 226.0, 137.0, 85.0, 55.0, 31.0, 23.0, 13.0, 11.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.703125, -19.13623046875, -18.5693359375, -18.00244140625, -17.435546875, -16.86865234375, -16.3017578125, -15.73486328125, -15.16796875, -14.60107421875, -14.0341796875, -13.46728515625, -12.900390625, -12.33349609375, -11.7666015625, -11.19970703125, -10.6328125, -10.06591796875, -9.4990234375, -8.93212890625, -8.365234375, -7.79833984375, -7.2314453125, -6.66455078125, -6.09765625, -5.53076171875, -4.9638671875, -4.39697265625, -3.830078125, -3.26318359375, -2.6962890625, -2.12939453125, -1.5625, -0.99560546875, -0.4287109375, 0.13818359375, 0.705078125, 1.27197265625, 1.8388671875, 2.40576171875, 2.97265625, 3.53955078125, 4.1064453125, 4.67333984375, 5.240234375, 5.80712890625, 6.3740234375, 6.94091796875, 7.5078125, 8.07470703125, 8.6416015625, 9.20849609375, 9.775390625, 10.34228515625, 10.9091796875, 11.47607421875, 12.04296875, 12.60986328125, 13.1767578125, 13.74365234375, 14.310546875, 14.87744140625, 15.4443359375, 16.01123046875, 16.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 12.0, 16.0, 14.0, 21.0, 27.0, 24.0, 38.0, 31.0, 46.0, 61.0, 54.0, 60.0, 85.0, 70.0, 71.0, 63.0, 46.0, 56.0, 57.0, 26.0, 27.0, 19.0, 21.0, 11.0, 12.0, 8.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.46875, -19.896484375, -19.32421875, -18.751953125, -18.1796875, -17.607421875, -17.03515625, -16.462890625, -15.890625, -15.318359375, -14.74609375, -14.173828125, -13.6015625, -13.029296875, -12.45703125, -11.884765625, -11.3125, -10.740234375, -10.16796875, -9.595703125, -9.0234375, -8.451171875, -7.87890625, -7.306640625, -6.734375, -6.162109375, -5.58984375, -5.017578125, -4.4453125, -3.873046875, -3.30078125, -2.728515625, -2.15625, -1.583984375, -1.01171875, -0.439453125, 0.1328125, 0.705078125, 1.27734375, 1.849609375, 2.421875, 2.994140625, 3.56640625, 4.138671875, 4.7109375, 5.283203125, 5.85546875, 6.427734375, 7.0, 7.572265625, 8.14453125, 8.716796875, 9.2890625, 9.861328125, 10.43359375, 11.005859375, 11.578125, 12.150390625, 12.72265625, 13.294921875, 13.8671875, 14.439453125, 15.01171875, 15.583984375, 16.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 20.0, 17.0, 38.0, 72.0, 115.0, 241.0, 454.0, 1113.0, 3278.0, 13189.0, 114296.0, 847084.0, 55863.0, 8639.0, 2395.0, 849.0, 419.0, 173.0, 120.0, 55.0, 25.0, 27.0, 18.0, 12.0, 4.0, 9.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3587646484375, -7.108154296875, -6.8575439453125, -6.60693359375, -6.3563232421875, -6.105712890625, -5.8551025390625, -5.6044921875, -5.3538818359375, -5.103271484375, -4.8526611328125, -4.60205078125, -4.3514404296875, -4.100830078125, -3.8502197265625, -3.599609375, -3.3489990234375, -3.098388671875, -2.8477783203125, -2.59716796875, -2.3465576171875, -2.095947265625, -1.8453369140625, -1.5947265625, -1.3441162109375, -1.093505859375, -0.8428955078125, -0.59228515625, -0.3416748046875, -0.091064453125, 0.1595458984375, 0.41015625, 0.6607666015625, 0.911376953125, 1.1619873046875, 1.41259765625, 1.6632080078125, 1.913818359375, 2.1644287109375, 2.4150390625, 2.6656494140625, 2.916259765625, 3.1668701171875, 3.41748046875, 3.6680908203125, 3.918701171875, 4.1693115234375, 4.419921875, 4.6705322265625, 4.921142578125, 5.1717529296875, 5.42236328125, 5.6729736328125, 5.923583984375, 6.1741943359375, 6.4248046875, 6.6754150390625, 6.926025390625, 7.1766357421875, 7.42724609375, 7.6778564453125, 7.928466796875, 8.1790771484375, 8.4296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 6.0, 8.0, 6.0, 7.0, 10.0, 10.0, 16.0, 25.0, 23.0, 43.0, 39.0, 69.0, 86.0, 133.0, 147.0, 100.0, 53.0, 52.0, 33.0, 27.0, 30.0, 15.0, 18.0, 9.0, 9.0, 7.0, 9.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013027191162109375, -0.0012646615505218506, -0.0012266039848327637, -0.0011885464191436768, -0.0011504888534545898, -0.001112431287765503, -0.001074373722076416, -0.001036316156387329, -0.0009982585906982422, -0.0009602010250091553, -0.0009221434593200684, -0.0008840858936309814, -0.0008460283279418945, -0.0008079707622528076, -0.0007699131965637207, -0.0007318556308746338, -0.0006937980651855469, -0.00065574049949646, -0.000617682933807373, -0.0005796253681182861, -0.0005415678024291992, -0.0005035102367401123, -0.0004654526710510254, -0.0004273951053619385, -0.00038933753967285156, -0.00035127997398376465, -0.00031322240829467773, -0.0002751648426055908, -0.0002371072769165039, -0.000199049711227417, -0.00016099214553833008, -0.00012293457984924316, -8.487701416015625e-05, -4.6819448471069336e-05, -8.761882781982422e-06, 2.9295682907104492e-05, 6.73532485961914e-05, 0.00010541081428527832, 0.00014346837997436523, 0.00018152594566345215, 0.00021958351135253906, 0.000257641077041626, 0.0002956986427307129, 0.0003337562084197998, 0.0003718137741088867, 0.00040987133979797363, 0.00044792890548706055, 0.00048598647117614746, 0.0005240440368652344, 0.0005621016025543213, 0.0006001591682434082, 0.0006382167339324951, 0.000676274299621582, 0.0007143318653106689, 0.0007523894309997559, 0.0007904469966888428, 0.0008285045623779297, 0.0008665621280670166, 0.0009046196937561035, 0.0009426772594451904, 0.0009807348251342773, 0.0010187923908233643, 0.0010568499565124512, 0.001094907522201538, 0.001132965087890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 6.0, 7.0, 12.0, 20.0, 33.0, 42.0, 44.0, 110.0, 144.0, 255.0, 457.0, 883.0, 2102.0, 5488.0, 18199.0, 88245.0, 776388.0, 122656.0, 22355.0, 6494.0, 2361.0, 1013.0, 506.0, 249.0, 172.0, 96.0, 66.0, 40.0, 23.0, 26.0, 17.0, 10.0, 14.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.6298828125, -6.419921875, -6.2099609375, -6.0, -5.7900390625, -5.580078125, -5.3701171875, -5.16015625, -4.9501953125, -4.740234375, -4.5302734375, -4.3203125, -4.1103515625, -3.900390625, -3.6904296875, -3.48046875, -3.2705078125, -3.060546875, -2.8505859375, -2.640625, -2.4306640625, -2.220703125, -2.0107421875, -1.80078125, -1.5908203125, -1.380859375, -1.1708984375, -0.9609375, -0.7509765625, -0.541015625, -0.3310546875, -0.12109375, 0.0888671875, 0.298828125, 0.5087890625, 0.71875, 0.9287109375, 1.138671875, 1.3486328125, 1.55859375, 1.7685546875, 1.978515625, 2.1884765625, 2.3984375, 2.6083984375, 2.818359375, 3.0283203125, 3.23828125, 3.4482421875, 3.658203125, 3.8681640625, 4.078125, 4.2880859375, 4.498046875, 4.7080078125, 4.91796875, 5.1279296875, 5.337890625, 5.5478515625, 5.7578125, 5.9677734375, 6.177734375, 6.3876953125, 6.59765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 9.0, 5.0, 2.0, 3.0, 8.0, 7.0, 10.0, 13.0, 11.0, 13.0, 15.0, 22.0, 27.0, 25.0, 30.0, 47.0, 36.0, 62.0, 113.0, 99.0, 77.0, 62.0, 49.0, 42.0, 36.0, 22.0, 23.0, 18.0, 17.0, 17.0, 14.0, 10.0, 7.0, 4.0, 9.0, 4.0, 1.0, 2.0, 8.0, 3.0, 2.0, 9.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.2421875, -4.115386962890625, -3.98858642578125, -3.861785888671875, -3.7349853515625, -3.608184814453125, -3.48138427734375, -3.354583740234375, -3.227783203125, -3.100982666015625, -2.97418212890625, -2.847381591796875, -2.7205810546875, -2.593780517578125, -2.46697998046875, -2.340179443359375, -2.21337890625, -2.086578369140625, -1.95977783203125, -1.832977294921875, -1.7061767578125, -1.579376220703125, -1.45257568359375, -1.325775146484375, -1.198974609375, -1.072174072265625, -0.94537353515625, -0.818572998046875, -0.6917724609375, -0.564971923828125, -0.43817138671875, -0.311370849609375, -0.1845703125, -0.057769775390625, 0.06903076171875, 0.195831298828125, 0.3226318359375, 0.449432373046875, 0.57623291015625, 0.703033447265625, 0.829833984375, 0.956634521484375, 1.08343505859375, 1.210235595703125, 1.3370361328125, 1.463836669921875, 1.59063720703125, 1.717437744140625, 1.84423828125, 1.971038818359375, 2.09783935546875, 2.224639892578125, 2.3514404296875, 2.478240966796875, 2.60504150390625, 2.731842041015625, 2.858642578125, 2.985443115234375, 3.11224365234375, 3.239044189453125, 3.3658447265625, 3.492645263671875, 3.61944580078125, 3.746246337890625, 3.873046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 15.0, 25.0, 64.0, 125.0, 248.0, 214.0, 132.0, 71.0, 35.0, 24.0, 6.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.33662414550781, -96.98323059082031, -93.62983703613281, -90.27644348144531, -86.92304992675781, -83.56965637207031, -80.21625518798828, -76.86286163330078, -73.50946807861328, -70.15607452392578, -66.80268096923828, -63.449283599853516, -60.095890045166016, -56.742496490478516, -53.38909912109375, -50.03570556640625, -46.68231201171875, -43.32891845703125, -39.97552490234375, -36.622127532958984, -33.268733978271484, -29.915340423583984, -26.56194496154785, -23.20854949951172, -19.85515594482422, -16.50176239013672, -13.148366928100586, -9.79497241973877, -6.441577911376953, -3.088184356689453, 0.2652111053466797, 3.6186065673828125, 6.9720001220703125, 10.325394630432129, 13.678789138793945, 17.032184600830078, 20.385578155517578, 23.738971710205078, 27.09236717224121, 30.445762634277344, 33.799156188964844, 37.152549743652344, 40.505943298339844, 43.85934066772461, 47.21273422241211, 50.56612777709961, 53.919525146484375, 57.272918701171875, 60.626312255859375, 63.979705810546875, 67.33309936523438, 70.68649291992188, 74.03988647460938, 77.39328002929688, 80.7466812133789, 84.1000747680664, 87.4534683227539, 90.8068618774414, 94.1602554321289, 97.5136489868164, 100.86705017089844, 104.22044372558594, 107.57383728027344, 110.92723083496094, 114.28062438964844]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 16.0, 15.0, 21.0, 19.0, 26.0, 21.0, 27.0, 29.0, 28.0, 45.0, 46.0, 51.0, 56.0, 69.0, 77.0, 66.0, 47.0, 45.0, 37.0, 44.0, 19.0, 22.0, 31.0, 16.0, 18.0, 12.0, 13.0, 14.0, 11.0, 2.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.255550384521484, -51.40003967285156, -49.544532775878906, -47.689022064208984, -45.83351135253906, -43.978004455566406, -42.122493743896484, -40.26698303222656, -38.411476135253906, -36.555965423583984, -34.70045852661133, -32.844947814941406, -30.989437103271484, -29.133928298950195, -27.278419494628906, -25.422908782958984, -23.567398071289062, -21.711889266967773, -19.85637855529785, -18.000869750976562, -16.14535903930664, -14.289850234985352, -12.434341430664062, -10.578831672668457, -8.723321914672852, -6.867812156677246, -5.012302875518799, -3.1567935943603516, -1.301283836364746, 0.5542259216308594, 2.4097347259521484, 4.265244483947754, 6.120750427246094, 7.976260185241699, 9.831769943237305, 11.687278747558594, 13.5427885055542, 15.398298263549805, 17.253807067871094, 19.109317779541016, 20.964826583862305, 22.820335388183594, 24.675846099853516, 26.531354904174805, 28.386863708496094, 30.242374420166016, 32.09788513183594, 33.953392028808594, 35.808902740478516, 37.66441345214844, 39.519920349121094, 41.375431060791016, 43.23094177246094, 45.086448669433594, 46.941959381103516, 48.79747009277344, 50.652976989746094, 52.508487701416016, 54.36399459838867, 56.219505310058594, 58.075016021728516, 59.93052673339844, 61.786033630371094, 63.641544342041016, 65.49705505371094]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 7.0, 10.0, 23.0, 31.0, 40.0, 81.0, 135.0, 284.0, 852.0, 3424.0, 27844.0, 2436267.0, 1697260.0, 22860.0, 3471.0, 990.0, 404.0, 151.0, 64.0, 23.0, 18.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-16.796875, -16.439208984375, -16.08154296875, -15.723876953125, -15.3662109375, -15.008544921875, -14.65087890625, -14.293212890625, -13.935546875, -13.577880859375, -13.22021484375, -12.862548828125, -12.5048828125, -12.147216796875, -11.78955078125, -11.431884765625, -11.07421875, -10.716552734375, -10.35888671875, -10.001220703125, -9.6435546875, -9.285888671875, -8.92822265625, -8.570556640625, -8.212890625, -7.855224609375, -7.49755859375, -7.139892578125, -6.7822265625, -6.424560546875, -6.06689453125, -5.709228515625, -5.3515625, -4.993896484375, -4.63623046875, -4.278564453125, -3.9208984375, -3.563232421875, -3.20556640625, -2.847900390625, -2.490234375, -2.132568359375, -1.77490234375, -1.417236328125, -1.0595703125, -0.701904296875, -0.34423828125, 0.013427734375, 0.37109375, 0.728759765625, 1.08642578125, 1.444091796875, 1.8017578125, 2.159423828125, 2.51708984375, 2.874755859375, 3.232421875, 3.590087890625, 3.94775390625, 4.305419921875, 4.6630859375, 5.020751953125, 5.37841796875, 5.736083984375, 6.09375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 4.0, 10.0, 11.0, 25.0, 22.0, 24.0, 43.0, 43.0, 63.0, 61.0, 67.0, 77.0, 81.0, 67.0, 64.0, 80.0, 48.0, 44.0, 49.0, 33.0, 17.0, 16.0, 14.0, 10.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.16796875, -5.036712646484375, -4.90545654296875, -4.774200439453125, -4.6429443359375, -4.511688232421875, -4.38043212890625, -4.249176025390625, -4.117919921875, -3.986663818359375, -3.85540771484375, -3.724151611328125, -3.5928955078125, -3.461639404296875, -3.33038330078125, -3.199127197265625, -3.06787109375, -2.936614990234375, -2.80535888671875, -2.674102783203125, -2.5428466796875, -2.411590576171875, -2.28033447265625, -2.149078369140625, -2.017822265625, -1.886566162109375, -1.75531005859375, -1.624053955078125, -1.4927978515625, -1.361541748046875, -1.23028564453125, -1.099029541015625, -0.9677734375, -0.836517333984375, -0.70526123046875, -0.574005126953125, -0.4427490234375, -0.311492919921875, -0.18023681640625, -0.048980712890625, 0.082275390625, 0.213531494140625, 0.34478759765625, 0.476043701171875, 0.6072998046875, 0.738555908203125, 0.86981201171875, 1.001068115234375, 1.13232421875, 1.263580322265625, 1.39483642578125, 1.526092529296875, 1.6573486328125, 1.788604736328125, 1.91986083984375, 2.051116943359375, 2.182373046875, 2.313629150390625, 2.44488525390625, 2.576141357421875, 2.7073974609375, 2.838653564453125, 2.96990966796875, 3.101165771484375, 3.232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 6.0, 18.0, 20.0, 21.0, 35.0, 62.0, 104.0, 178.0, 333.0, 660.0, 1304.0, 3083.0, 8855.0, 37153.0, 409046.0, 3487577.0, 207065.0, 26211.0, 7031.0, 2637.0, 1231.0, 680.0, 369.0, 202.0, 144.0, 76.0, 49.0, 33.0, 28.0, 15.0, 17.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.65625, -8.41168212890625, -8.1671142578125, -7.92254638671875, -7.677978515625, -7.43341064453125, -7.1888427734375, -6.94427490234375, -6.69970703125, -6.45513916015625, -6.2105712890625, -5.96600341796875, -5.721435546875, -5.47686767578125, -5.2322998046875, -4.98773193359375, -4.7431640625, -4.49859619140625, -4.2540283203125, -4.00946044921875, -3.764892578125, -3.52032470703125, -3.2757568359375, -3.03118896484375, -2.78662109375, -2.54205322265625, -2.2974853515625, -2.05291748046875, -1.808349609375, -1.56378173828125, -1.3192138671875, -1.07464599609375, -0.830078125, -0.58551025390625, -0.3409423828125, -0.09637451171875, 0.148193359375, 0.39276123046875, 0.6373291015625, 0.88189697265625, 1.12646484375, 1.37103271484375, 1.6156005859375, 1.86016845703125, 2.104736328125, 2.34930419921875, 2.5938720703125, 2.83843994140625, 3.0830078125, 3.32757568359375, 3.5721435546875, 3.81671142578125, 4.061279296875, 4.30584716796875, 4.5504150390625, 4.79498291015625, 5.03955078125, 5.28411865234375, 5.5286865234375, 5.77325439453125, 6.017822265625, 6.26239013671875, 6.5069580078125, 6.75152587890625, 6.99609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 7.0, 6.0, 8.0, 10.0, 21.0, 33.0, 49.0, 99.0, 192.0, 446.0, 946.0, 1087.0, 644.0, 236.0, 121.0, 76.0, 29.0, 20.0, 18.0, 6.0, 3.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.3115234375, -5.998046875, -5.6845703125, -5.37109375, -5.0576171875, -4.744140625, -4.4306640625, -4.1171875, -3.8037109375, -3.490234375, -3.1767578125, -2.86328125, -2.5498046875, -2.236328125, -1.9228515625, -1.609375, -1.2958984375, -0.982421875, -0.6689453125, -0.35546875, -0.0419921875, 0.271484375, 0.5849609375, 0.8984375, 1.2119140625, 1.525390625, 1.8388671875, 2.15234375, 2.4658203125, 2.779296875, 3.0927734375, 3.40625, 3.7197265625, 4.033203125, 4.3466796875, 4.66015625, 4.9736328125, 5.287109375, 5.6005859375, 5.9140625, 6.2275390625, 6.541015625, 6.8544921875, 7.16796875, 7.4814453125, 7.794921875, 8.1083984375, 8.421875, 8.7353515625, 9.048828125, 9.3623046875, 9.67578125, 9.9892578125, 10.302734375, 10.6162109375, 10.9296875, 11.2431640625, 11.556640625, 11.8701171875, 12.18359375, 12.4970703125, 12.810546875, 13.1240234375, 13.4375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 14.0, 18.0, 50.0, 91.0, 202.0, 248.0, 182.0, 95.0, 38.0, 24.0, 13.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.48509216308594, -60.520179748535156, -57.55527114868164, -54.59035873413086, -51.625450134277344, -48.66053771972656, -45.69562530517578, -42.730716705322266, -39.76580810546875, -36.80089569091797, -33.83598709106445, -30.871074676513672, -27.906166076660156, -24.941253662109375, -21.976343154907227, -19.011432647705078, -16.046520233154297, -13.081609725952148, -10.11669921875, -7.151787757873535, -4.186877250671387, -1.2219667434692383, 1.7429447174072266, 4.707855224609375, 7.672765731811523, 10.637676239013672, 13.60258674621582, 16.56749725341797, 19.53240966796875, 22.497318267822266, 25.462230682373047, 28.427141189575195, 31.392051696777344, 34.356964111328125, 37.32187271118164, 40.28678512573242, 43.25169372558594, 46.21660614013672, 49.1815185546875, 52.146427154541016, 55.11133575439453, 58.07624816894531, 61.04115676879883, 64.00606536865234, 66.97097778320312, 69.9358901977539, 72.90080261230469, 75.86570739746094, 78.83062744140625, 81.79553985595703, 84.76045227050781, 87.72535705566406, 90.69026947021484, 93.65518188476562, 96.6200942993164, 99.58500671386719, 102.54991149902344, 105.51482391357422, 108.479736328125, 111.44464111328125, 114.40955352783203, 117.37446594238281, 120.3393783569336, 123.30429077148438, 126.26919555664062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 0.0, 12.0, 15.0, 12.0, 26.0, 37.0, 29.0, 41.0, 43.0, 68.0, 73.0, 65.0, 64.0, 54.0, 71.0, 81.0, 57.0, 46.0, 42.0, 41.0, 33.0, 22.0, 17.0, 13.0, 8.0, 8.0, 5.0, 10.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.485008239746094, -26.17704963684082, -24.869091033935547, -23.561134338378906, -22.253175735473633, -20.94521713256836, -19.63726043701172, -18.329301834106445, -17.021343231201172, -15.713384628295898, -14.405426979064941, -13.097469329833984, -11.789510726928711, -10.481552124023438, -9.17359447479248, -7.865636825561523, -6.55767822265625, -5.249720096588135, -3.9417619705200195, -2.6338038444519043, -1.325845718383789, -0.017887592315673828, 1.2900705337524414, 2.5980281829833984, 3.905986785888672, 5.213944911956787, 6.521903038024902, 7.829861164093018, 9.137819290161133, 10.445777893066406, 11.753735542297363, 13.06169319152832, 14.369651794433594, 15.677610397338867, 16.98556900024414, 18.29352569580078, 19.601484298706055, 20.909442901611328, 22.21739959716797, 23.525358200073242, 24.833316802978516, 26.14127540588379, 27.449234008789062, 28.757190704345703, 30.065149307250977, 31.37310791015625, 32.68106460571289, 33.98902130126953, 35.29698181152344, 36.60493850708008, 37.912899017333984, 39.220855712890625, 40.52881622314453, 41.83677291870117, 43.14472961425781, 44.45269012451172, 45.76064682006836, 47.068603515625, 48.376564025878906, 49.68452072143555, 50.99247741699219, 52.300437927246094, 53.608394622802734, 54.916351318359375, 56.22431182861328]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 7.0, 14.0, 7.0, 13.0, 16.0, 26.0, 43.0, 60.0, 91.0, 162.0, 291.0, 500.0, 1023.0, 2387.0, 7130.0, 25585.0, 123673.0, 537114.0, 278730.0, 51898.0, 12535.0, 3972.0, 1569.0, 751.0, 352.0, 201.0, 131.0, 84.0, 54.0, 37.0, 35.0, 11.0, 8.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.0234375, -8.77093505859375, -8.5184326171875, -8.26593017578125, -8.013427734375, -7.76092529296875, -7.5084228515625, -7.25592041015625, -7.00341796875, -6.75091552734375, -6.4984130859375, -6.24591064453125, -5.993408203125, -5.74090576171875, -5.4884033203125, -5.23590087890625, -4.9833984375, -4.73089599609375, -4.4783935546875, -4.22589111328125, -3.973388671875, -3.72088623046875, -3.4683837890625, -3.21588134765625, -2.96337890625, -2.71087646484375, -2.4583740234375, -2.20587158203125, -1.953369140625, -1.70086669921875, -1.4483642578125, -1.19586181640625, -0.943359375, -0.69085693359375, -0.4383544921875, -0.18585205078125, 0.066650390625, 0.31915283203125, 0.5716552734375, 0.82415771484375, 1.07666015625, 1.32916259765625, 1.5816650390625, 1.83416748046875, 2.086669921875, 2.33917236328125, 2.5916748046875, 2.84417724609375, 3.0966796875, 3.34918212890625, 3.6016845703125, 3.85418701171875, 4.106689453125, 4.35919189453125, 4.6116943359375, 4.86419677734375, 5.11669921875, 5.36920166015625, 5.6217041015625, 5.87420654296875, 6.126708984375, 6.37921142578125, 6.6317138671875, 6.88421630859375, 7.13671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 12.0, 13.0, 10.0, 20.0, 18.0, 29.0, 22.0, 20.0, 48.0, 44.0, 54.0, 56.0, 50.0, 56.0, 63.0, 54.0, 65.0, 60.0, 53.0, 38.0, 32.0, 29.0, 31.0, 23.0, 27.0, 11.0, 13.0, 10.0, 8.0, 7.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.876678466796875, -2.76898193359375, -2.661285400390625, -2.5535888671875, -2.445892333984375, -2.33819580078125, -2.230499267578125, -2.122802734375, -2.015106201171875, -1.90740966796875, -1.799713134765625, -1.6920166015625, -1.584320068359375, -1.47662353515625, -1.368927001953125, -1.26123046875, -1.153533935546875, -1.04583740234375, -0.938140869140625, -0.8304443359375, -0.722747802734375, -0.61505126953125, -0.507354736328125, -0.399658203125, -0.291961669921875, -0.18426513671875, -0.076568603515625, 0.0311279296875, 0.138824462890625, 0.24652099609375, 0.354217529296875, 0.4619140625, 0.569610595703125, 0.67730712890625, 0.785003662109375, 0.8927001953125, 1.000396728515625, 1.10809326171875, 1.215789794921875, 1.323486328125, 1.431182861328125, 1.53887939453125, 1.646575927734375, 1.7542724609375, 1.861968994140625, 1.96966552734375, 2.077362060546875, 2.18505859375, 2.292755126953125, 2.40045166015625, 2.508148193359375, 2.6158447265625, 2.723541259765625, 2.83123779296875, 2.938934326171875, 3.046630859375, 3.154327392578125, 3.26202392578125, 3.369720458984375, 3.4774169921875, 3.585113525390625, 3.69281005859375, 3.800506591796875, 3.908203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 13.0, 19.0, 26.0, 43.0, 79.0, 98.0, 146.0, 310.0, 548.0, 1250.0, 3198.0, 13485.0, 152667.0, 821291.0, 44401.0, 6945.0, 2156.0, 885.0, 377.0, 209.0, 116.0, 79.0, 54.0, 37.0, 28.0, 14.0, 10.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9140625, -14.3868408203125, -13.859619140625, -13.3323974609375, -12.80517578125, -12.2779541015625, -11.750732421875, -11.2235107421875, -10.6962890625, -10.1690673828125, -9.641845703125, -9.1146240234375, -8.58740234375, -8.0601806640625, -7.532958984375, -7.0057373046875, -6.478515625, -5.9512939453125, -5.424072265625, -4.8968505859375, -4.36962890625, -3.8424072265625, -3.315185546875, -2.7879638671875, -2.2607421875, -1.7335205078125, -1.206298828125, -0.6790771484375, -0.15185546875, 0.3753662109375, 0.902587890625, 1.4298095703125, 1.95703125, 2.4842529296875, 3.011474609375, 3.5386962890625, 4.06591796875, 4.5931396484375, 5.120361328125, 5.6475830078125, 6.1748046875, 6.7020263671875, 7.229248046875, 7.7564697265625, 8.28369140625, 8.8109130859375, 9.338134765625, 9.8653564453125, 10.392578125, 10.9197998046875, 11.447021484375, 11.9742431640625, 12.50146484375, 13.0286865234375, 13.555908203125, 14.0831298828125, 14.6103515625, 15.1375732421875, 15.664794921875, 16.1920166015625, 16.71923828125, 17.2464599609375, 17.773681640625, 18.3009033203125, 18.828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 16.0, 29.0, 36.0, 41.0, 38.0, 58.0, 65.0, 93.0, 90.0, 69.0, 73.0, 85.0, 54.0, 53.0, 37.0, 36.0, 15.0, 22.0, 21.0, 15.0, 4.0, 1.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.791748046875, -20.17724609375, -19.562744140625, -18.9482421875, -18.333740234375, -17.71923828125, -17.104736328125, -16.490234375, -15.875732421875, -15.26123046875, -14.646728515625, -14.0322265625, -13.417724609375, -12.80322265625, -12.188720703125, -11.57421875, -10.959716796875, -10.34521484375, -9.730712890625, -9.1162109375, -8.501708984375, -7.88720703125, -7.272705078125, -6.658203125, -6.043701171875, -5.42919921875, -4.814697265625, -4.2001953125, -3.585693359375, -2.97119140625, -2.356689453125, -1.7421875, -1.127685546875, -0.51318359375, 0.101318359375, 0.7158203125, 1.330322265625, 1.94482421875, 2.559326171875, 3.173828125, 3.788330078125, 4.40283203125, 5.017333984375, 5.6318359375, 6.246337890625, 6.86083984375, 7.475341796875, 8.08984375, 8.704345703125, 9.31884765625, 9.933349609375, 10.5478515625, 11.162353515625, 11.77685546875, 12.391357421875, 13.005859375, 13.620361328125, 14.23486328125, 14.849365234375, 15.4638671875, 16.078369140625, 16.69287109375, 17.307373046875, 17.921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 4.0, 6.0, 13.0, 16.0, 18.0, 32.0, 32.0, 59.0, 94.0, 120.0, 217.0, 379.0, 774.0, 1902.0, 5705.0, 20679.0, 115909.0, 792219.0, 85356.0, 16937.0, 4818.0, 1610.0, 727.0, 350.0, 189.0, 90.0, 84.0, 49.0, 44.0, 29.0, 17.0, 19.0, 8.0, 11.0, 10.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.676513671875, -5.50146484375, -5.326416015625, -5.1513671875, -4.976318359375, -4.80126953125, -4.626220703125, -4.451171875, -4.276123046875, -4.10107421875, -3.926025390625, -3.7509765625, -3.575927734375, -3.40087890625, -3.225830078125, -3.05078125, -2.875732421875, -2.70068359375, -2.525634765625, -2.3505859375, -2.175537109375, -2.00048828125, -1.825439453125, -1.650390625, -1.475341796875, -1.30029296875, -1.125244140625, -0.9501953125, -0.775146484375, -0.60009765625, -0.425048828125, -0.25, -0.074951171875, 0.10009765625, 0.275146484375, 0.4501953125, 0.625244140625, 0.80029296875, 0.975341796875, 1.150390625, 1.325439453125, 1.50048828125, 1.675537109375, 1.8505859375, 2.025634765625, 2.20068359375, 2.375732421875, 2.55078125, 2.725830078125, 2.90087890625, 3.075927734375, 3.2509765625, 3.426025390625, 3.60107421875, 3.776123046875, 3.951171875, 4.126220703125, 4.30126953125, 4.476318359375, 4.6513671875, 4.826416015625, 5.00146484375, 5.176513671875, 5.3515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 7.0, 7.0, 9.0, 10.0, 8.0, 6.0, 28.0, 20.0, 32.0, 42.0, 78.0, 157.0, 245.0, 130.0, 61.0, 47.0, 32.0, 20.0, 18.0, 5.0, 11.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016689300537109375, -0.0016138255596160889, -0.0015587210655212402, -0.0015036165714263916, -0.001448512077331543, -0.0013934075832366943, -0.0013383030891418457, -0.001283198595046997, -0.0012280941009521484, -0.0011729896068572998, -0.0011178851127624512, -0.0010627806186676025, -0.001007676124572754, -0.0009525716304779053, -0.0008974671363830566, -0.000842362642288208, -0.0007872581481933594, -0.0007321536540985107, -0.0006770491600036621, -0.0006219446659088135, -0.0005668401718139648, -0.0005117356777191162, -0.0004566311836242676, -0.00040152668952941895, -0.0003464221954345703, -0.0002913177013397217, -0.00023621320724487305, -0.00018110871315002441, -0.00012600421905517578, -7.089972496032715e-05, -1.5795230865478516e-05, 3.930926322937012e-05, 9.441375732421875e-05, 0.00014951825141906738, 0.00020462274551391602, 0.00025972723960876465, 0.0003148317337036133, 0.0003699362277984619, 0.00042504072189331055, 0.0004801452159881592, 0.0005352497100830078, 0.0005903542041778564, 0.0006454586982727051, 0.0007005631923675537, 0.0007556676864624023, 0.000810772180557251, 0.0008658766746520996, 0.0009209811687469482, 0.0009760856628417969, 0.0010311901569366455, 0.0010862946510314941, 0.0011413991451263428, 0.0011965036392211914, 0.00125160813331604, 0.0013067126274108887, 0.0013618171215057373, 0.001416921615600586, 0.0014720261096954346, 0.0015271306037902832, 0.0015822350978851318, 0.0016373395919799805, 0.001692444086074829, 0.0017475485801696777, 0.0018026530742645264, 0.001857757568359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 16.0, 19.0, 29.0, 59.0, 68.0, 142.0, 199.0, 365.0, 756.0, 1972.0, 6691.0, 28306.0, 196033.0, 735931.0, 59823.0, 12542.0, 3285.0, 1116.0, 518.0, 258.0, 150.0, 88.0, 63.0, 39.0, 21.0, 21.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.90087890625, -5.7119140625, -5.52294921875, -5.333984375, -5.14501953125, -4.9560546875, -4.76708984375, -4.578125, -4.38916015625, -4.2001953125, -4.01123046875, -3.822265625, -3.63330078125, -3.4443359375, -3.25537109375, -3.06640625, -2.87744140625, -2.6884765625, -2.49951171875, -2.310546875, -2.12158203125, -1.9326171875, -1.74365234375, -1.5546875, -1.36572265625, -1.1767578125, -0.98779296875, -0.798828125, -0.60986328125, -0.4208984375, -0.23193359375, -0.04296875, 0.14599609375, 0.3349609375, 0.52392578125, 0.712890625, 0.90185546875, 1.0908203125, 1.27978515625, 1.46875, 1.65771484375, 1.8466796875, 2.03564453125, 2.224609375, 2.41357421875, 2.6025390625, 2.79150390625, 2.98046875, 3.16943359375, 3.3583984375, 3.54736328125, 3.736328125, 3.92529296875, 4.1142578125, 4.30322265625, 4.4921875, 4.68115234375, 4.8701171875, 5.05908203125, 5.248046875, 5.43701171875, 5.6259765625, 5.81494140625, 6.00390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 16.0, 11.0, 12.0, 31.0, 27.0, 44.0, 51.0, 66.0, 126.0, 138.0, 114.0, 93.0, 62.0, 44.0, 23.0, 24.0, 12.0, 17.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.380615234375, -4.24169921875, -4.102783203125, -3.9638671875, -3.824951171875, -3.68603515625, -3.547119140625, -3.408203125, -3.269287109375, -3.13037109375, -2.991455078125, -2.8525390625, -2.713623046875, -2.57470703125, -2.435791015625, -2.296875, -2.157958984375, -2.01904296875, -1.880126953125, -1.7412109375, -1.602294921875, -1.46337890625, -1.324462890625, -1.185546875, -1.046630859375, -0.90771484375, -0.768798828125, -0.6298828125, -0.490966796875, -0.35205078125, -0.213134765625, -0.07421875, 0.064697265625, 0.20361328125, 0.342529296875, 0.4814453125, 0.620361328125, 0.75927734375, 0.898193359375, 1.037109375, 1.176025390625, 1.31494140625, 1.453857421875, 1.5927734375, 1.731689453125, 1.87060546875, 2.009521484375, 2.1484375, 2.287353515625, 2.42626953125, 2.565185546875, 2.7041015625, 2.843017578125, 2.98193359375, 3.120849609375, 3.259765625, 3.398681640625, 3.53759765625, 3.676513671875, 3.8154296875, 3.954345703125, 4.09326171875, 4.232177734375, 4.37109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 14.0, 21.0, 53.0, 75.0, 153.0, 240.0, 189.0, 92.0, 63.0, 27.0, 14.0, 11.0, 8.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-85.1076889038086, -82.6568603515625, -80.20602416992188, -77.75519561767578, -75.30436706542969, -72.85353088378906, -70.40270233154297, -67.95187377929688, -65.50103759765625, -63.05020523071289, -60.59937286376953, -58.14854431152344, -55.69771194458008, -53.24687957763672, -50.796051025390625, -48.345218658447266, -45.894386291503906, -43.44355392456055, -40.99272155761719, -38.541893005371094, -36.091060638427734, -33.640228271484375, -31.18939781188965, -28.738567352294922, -26.287734985351562, -23.836902618408203, -21.386072158813477, -18.93524169921875, -16.48440933227539, -14.033577919006348, -11.582746505737305, -9.131916046142578, -6.6810760498046875, -4.2302446365356445, -1.7794132232666016, 0.6714181900024414, 3.1222496032714844, 5.573081016540527, 8.02391242980957, 10.474742889404297, 12.925575256347656, 15.3764066696167, 17.827238082885742, 20.27806854248047, 22.728900909423828, 25.179733276367188, 27.630563735961914, 30.08139419555664, 32.5322265625, 34.98305892944336, 37.43389129638672, 39.88471984863281, 42.33555221557617, 44.78638458251953, 47.237213134765625, 49.688045501708984, 52.138877868652344, 54.5897102355957, 57.04054260253906, 59.491371154785156, 61.942203521728516, 64.39303588867188, 66.84386444091797, 69.29469299316406, 71.74552917480469]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 6.0, 6.0, 10.0, 5.0, 11.0, 11.0, 15.0, 14.0, 19.0, 23.0, 28.0, 28.0, 30.0, 42.0, 39.0, 49.0, 67.0, 65.0, 75.0, 62.0, 55.0, 42.0, 25.0, 42.0, 44.0, 33.0, 25.0, 16.0, 37.0, 10.0, 16.0, 5.0, 16.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-61.93077087402344, -60.2968864440918, -58.663002014160156, -57.029117584228516, -55.395233154296875, -53.761348724365234, -52.127464294433594, -50.49357986450195, -48.85969543457031, -47.22581100463867, -45.59192657470703, -43.95804214477539, -42.32415771484375, -40.69027328491211, -39.05638885498047, -37.42250442504883, -35.78861999511719, -34.15473556518555, -32.520851135253906, -30.886966705322266, -29.253082275390625, -27.619197845458984, -25.985313415527344, -24.351428985595703, -22.717544555664062, -21.083660125732422, -19.44977569580078, -17.81589126586914, -16.1820068359375, -14.54812240600586, -12.914237976074219, -11.280353546142578, -9.646469116210938, -8.012584686279297, -6.378700256347656, -4.744815826416016, -3.110931396484375, -1.4770469665527344, 0.15683746337890625, 1.7907218933105469, 3.4246063232421875, 5.058490753173828, 6.692375183105469, 8.32625961303711, 9.96014404296875, 11.59402847290039, 13.227912902832031, 14.861797332763672, 16.495681762695312, 18.129566192626953, 19.763450622558594, 21.397335052490234, 23.031219482421875, 24.665103912353516, 26.298988342285156, 27.932872772216797, 29.566757202148438, 31.200641632080078, 32.83452606201172, 34.46841049194336, 36.102294921875, 37.73617935180664, 39.37006378173828, 41.00394821166992, 42.63783264160156]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 7.0, 12.0, 14.0, 33.0, 68.0, 150.0, 360.0, 1368.0, 7222.0, 223484.0, 3920355.0, 35792.0, 3850.0, 1040.0, 312.0, 103.0, 47.0, 26.0, 16.0, 3.0, 3.0, 6.0], "bins": [-24.296875, -23.83233642578125, -23.3677978515625, -22.90325927734375, -22.438720703125, -21.97418212890625, -21.5096435546875, -21.04510498046875, -20.58056640625, -20.11602783203125, -19.6514892578125, -19.18695068359375, -18.722412109375, -18.25787353515625, -17.7933349609375, -17.32879638671875, -16.8642578125, -16.39971923828125, -15.9351806640625, -15.47064208984375, -15.006103515625, -14.54156494140625, -14.0770263671875, -13.61248779296875, -13.14794921875, -12.68341064453125, -12.2188720703125, -11.75433349609375, -11.289794921875, -10.82525634765625, -10.3607177734375, -9.89617919921875, -9.431640625, -8.96710205078125, -8.5025634765625, -8.03802490234375, -7.573486328125, -7.10894775390625, -6.6444091796875, -6.17987060546875, -5.71533203125, -5.25079345703125, -4.7862548828125, -4.32171630859375, -3.857177734375, -3.39263916015625, -2.9281005859375, -2.46356201171875, -1.9990234375, -1.53448486328125, -1.0699462890625, -0.60540771484375, -0.140869140625, 0.32366943359375, 0.7882080078125, 1.25274658203125, 1.71728515625, 2.18182373046875, 2.6463623046875, 3.11090087890625, 3.575439453125, 4.03997802734375, 4.5045166015625, 4.96905517578125, 5.43359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 14.0, 15.0, 30.0, 37.0, 52.0, 66.0, 77.0, 79.0, 100.0, 86.0, 81.0, 81.0, 72.0, 59.0, 45.0, 40.0, 15.0, 13.0, 11.0, 9.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.55078125, -7.38330078125, -7.2158203125, -7.04833984375, -6.880859375, -6.71337890625, -6.5458984375, -6.37841796875, -6.2109375, -6.04345703125, -5.8759765625, -5.70849609375, -5.541015625, -5.37353515625, -5.2060546875, -5.03857421875, -4.87109375, -4.70361328125, -4.5361328125, -4.36865234375, -4.201171875, -4.03369140625, -3.8662109375, -3.69873046875, -3.53125, -3.36376953125, -3.1962890625, -3.02880859375, -2.861328125, -2.69384765625, -2.5263671875, -2.35888671875, -2.19140625, -2.02392578125, -1.8564453125, -1.68896484375, -1.521484375, -1.35400390625, -1.1865234375, -1.01904296875, -0.8515625, -0.68408203125, -0.5166015625, -0.34912109375, -0.181640625, -0.01416015625, 0.1533203125, 0.32080078125, 0.48828125, 0.65576171875, 0.8232421875, 0.99072265625, 1.158203125, 1.32568359375, 1.4931640625, 1.66064453125, 1.828125, 1.99560546875, 2.1630859375, 2.33056640625, 2.498046875, 2.66552734375, 2.8330078125, 3.00048828125, 3.16796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 20.0, 29.0, 38.0, 100.0, 164.0, 322.0, 694.0, 2006.0, 8843.0, 230732.0, 3915381.0, 30461.0, 3533.0, 1088.0, 432.0, 215.0, 82.0, 55.0, 27.0, 9.0, 10.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.095458984375, -17.53466796875, -16.973876953125, -16.4130859375, -15.852294921875, -15.29150390625, -14.730712890625, -14.169921875, -13.609130859375, -13.04833984375, -12.487548828125, -11.9267578125, -11.365966796875, -10.80517578125, -10.244384765625, -9.68359375, -9.122802734375, -8.56201171875, -8.001220703125, -7.4404296875, -6.879638671875, -6.31884765625, -5.758056640625, -5.197265625, -4.636474609375, -4.07568359375, -3.514892578125, -2.9541015625, -2.393310546875, -1.83251953125, -1.271728515625, -0.7109375, -0.150146484375, 0.41064453125, 0.971435546875, 1.5322265625, 2.093017578125, 2.65380859375, 3.214599609375, 3.775390625, 4.336181640625, 4.89697265625, 5.457763671875, 6.0185546875, 6.579345703125, 7.14013671875, 7.700927734375, 8.26171875, 8.822509765625, 9.38330078125, 9.944091796875, 10.5048828125, 11.065673828125, 11.62646484375, 12.187255859375, 12.748046875, 13.308837890625, 13.86962890625, 14.430419921875, 14.9912109375, 15.552001953125, 16.11279296875, 16.673583984375, 17.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 11.0, 14.0, 19.0, 29.0, 49.0, 87.0, 180.0, 408.0, 953.0, 1154.0, 653.0, 260.0, 107.0, 55.0, 35.0, 17.0, 11.0, 10.0, 9.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-14.4765625, -14.1563720703125, -13.836181640625, -13.5159912109375, -13.19580078125, -12.8756103515625, -12.555419921875, -12.2352294921875, -11.9150390625, -11.5948486328125, -11.274658203125, -10.9544677734375, -10.63427734375, -10.3140869140625, -9.993896484375, -9.6737060546875, -9.353515625, -9.0333251953125, -8.713134765625, -8.3929443359375, -8.07275390625, -7.7525634765625, -7.432373046875, -7.1121826171875, -6.7919921875, -6.4718017578125, -6.151611328125, -5.8314208984375, -5.51123046875, -5.1910400390625, -4.870849609375, -4.5506591796875, -4.23046875, -3.9102783203125, -3.590087890625, -3.2698974609375, -2.94970703125, -2.6295166015625, -2.309326171875, -1.9891357421875, -1.6689453125, -1.3487548828125, -1.028564453125, -0.7083740234375, -0.38818359375, -0.0679931640625, 0.252197265625, 0.5723876953125, 0.892578125, 1.2127685546875, 1.532958984375, 1.8531494140625, 2.17333984375, 2.4935302734375, 2.813720703125, 3.1339111328125, 3.4541015625, 3.7742919921875, 4.094482421875, 4.4146728515625, 4.73486328125, 5.0550537109375, 5.375244140625, 5.6954345703125, 6.015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 5.0, 6.0, 24.0, 52.0, 142.0, 279.0, 287.0, 130.0, 43.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.53944396972656, -184.6129150390625, -180.68638610839844, -176.7598419189453, -172.83331298828125, -168.9067840576172, -164.98025512695312, -161.05372619628906, -157.127197265625, -153.20066833496094, -149.27413940429688, -145.34759521484375, -141.4210662841797, -137.49453735351562, -133.56800842285156, -129.6414794921875, -125.71493530273438, -121.78840637207031, -117.86186981201172, -113.93534088134766, -110.00880432128906, -106.082275390625, -102.15574645996094, -98.22921752929688, -94.30268096923828, -90.37615203857422, -86.44961547851562, -82.52308654785156, -78.5965576171875, -74.6700210571289, -70.74349212646484, -66.81695556640625, -62.89042663574219, -58.96389389038086, -55.03736114501953, -51.11083221435547, -47.18429946899414, -43.25776672363281, -39.33123779296875, -35.40470504760742, -31.478172302246094, -27.551639556884766, -23.62510871887207, -19.698577880859375, -15.772045135498047, -11.845512390136719, -7.918981552124023, -3.992450714111328, -0.06591796875, 3.8606138229370117, 7.787145614624023, 11.713677406311035, 15.640209197998047, 19.566741943359375, 23.49327278137207, 27.419803619384766, 31.346336364746094, 35.27286911010742, 39.19940185546875, 43.12593078613281, 47.05246353149414, 50.97899627685547, 54.90552520751953, 58.83205795288086, 62.75859069824219]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 4.0, 8.0, 17.0, 17.0, 48.0, 44.0, 44.0, 73.0, 108.0, 88.0, 97.0, 96.0, 98.0, 79.0, 53.0, 39.0, 30.0, 23.0, 15.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.262285232543945, -27.4180908203125, -25.573894500732422, -23.729698181152344, -21.8855037689209, -20.041309356689453, -18.197113037109375, -16.352916717529297, -14.508722305297852, -12.66452693939209, -10.820331573486328, -8.976136207580566, -7.131940841674805, -5.287745475769043, -3.4435501098632812, -1.5993547439575195, 0.2448406219482422, 2.089035987854004, 3.9332313537597656, 5.777426719665527, 7.621622085571289, 9.46581745147705, 11.310012817382812, 13.154208183288574, 14.998403549194336, 16.84259796142578, 18.68679428100586, 20.530990600585938, 22.375185012817383, 24.219379425048828, 26.063575744628906, 27.907772064208984, 29.751968383789062, 31.59616470336914, 33.44036102294922, 35.28455352783203, 37.12874984741211, 38.97294616699219, 40.817138671875, 42.66133499145508, 44.505531311035156, 46.349727630615234, 48.19392395019531, 50.038116455078125, 51.8823127746582, 53.72650909423828, 55.570701599121094, 57.41489791870117, 59.25909423828125, 61.10329055786133, 62.947486877441406, 64.79167938232422, 66.63587951660156, 68.48007202148438, 70.32426452636719, 72.16846466064453, 74.01265716552734, 75.85684967041016, 77.7010498046875, 79.54524230957031, 81.38943481445312, 83.23363494873047, 85.07782745361328, 86.92202758789062, 88.76622009277344]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 11.0, 13.0, 19.0, 26.0, 30.0, 49.0, 71.0, 118.0, 207.0, 331.0, 772.0, 1797.0, 4813.0, 15916.0, 63845.0, 315496.0, 486210.0, 119692.0, 26452.0, 7669.0, 2636.0, 1108.0, 498.0, 287.0, 151.0, 93.0, 64.0, 44.0, 33.0, 33.0, 13.0, 13.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.23046875, -6.03076171875, -5.8310546875, -5.63134765625, -5.431640625, -5.23193359375, -5.0322265625, -4.83251953125, -4.6328125, -4.43310546875, -4.2333984375, -4.03369140625, -3.833984375, -3.63427734375, -3.4345703125, -3.23486328125, -3.03515625, -2.83544921875, -2.6357421875, -2.43603515625, -2.236328125, -2.03662109375, -1.8369140625, -1.63720703125, -1.4375, -1.23779296875, -1.0380859375, -0.83837890625, -0.638671875, -0.43896484375, -0.2392578125, -0.03955078125, 0.16015625, 0.35986328125, 0.5595703125, 0.75927734375, 0.958984375, 1.15869140625, 1.3583984375, 1.55810546875, 1.7578125, 1.95751953125, 2.1572265625, 2.35693359375, 2.556640625, 2.75634765625, 2.9560546875, 3.15576171875, 3.35546875, 3.55517578125, 3.7548828125, 3.95458984375, 4.154296875, 4.35400390625, 4.5537109375, 4.75341796875, 4.953125, 5.15283203125, 5.3525390625, 5.55224609375, 5.751953125, 5.95166015625, 6.1513671875, 6.35107421875, 6.55078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 17.0, 18.0, 31.0, 44.0, 61.0, 51.0, 85.0, 78.0, 88.0, 88.0, 79.0, 74.0, 61.0, 58.0, 38.0, 28.0, 27.0, 18.0, 13.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6949462890625, -4.538330078125, -4.3817138671875, -4.22509765625, -4.0684814453125, -3.911865234375, -3.7552490234375, -3.5986328125, -3.4420166015625, -3.285400390625, -3.1287841796875, -2.97216796875, -2.8155517578125, -2.658935546875, -2.5023193359375, -2.345703125, -2.1890869140625, -2.032470703125, -1.8758544921875, -1.71923828125, -1.5626220703125, -1.406005859375, -1.2493896484375, -1.0927734375, -0.9361572265625, -0.779541015625, -0.6229248046875, -0.46630859375, -0.3096923828125, -0.153076171875, 0.0035400390625, 0.16015625, 0.3167724609375, 0.473388671875, 0.6300048828125, 0.78662109375, 0.9432373046875, 1.099853515625, 1.2564697265625, 1.4130859375, 1.5697021484375, 1.726318359375, 1.8829345703125, 2.03955078125, 2.1961669921875, 2.352783203125, 2.5093994140625, 2.666015625, 2.8226318359375, 2.979248046875, 3.1358642578125, 3.29248046875, 3.4490966796875, 3.605712890625, 3.7623291015625, 3.9189453125, 4.0755615234375, 4.232177734375, 4.3887939453125, 4.54541015625, 4.7020263671875, 4.858642578125, 5.0152587890625, 5.171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 9.0, 16.0, 33.0, 48.0, 68.0, 141.0, 330.0, 914.0, 3236.0, 17225.0, 172693.0, 763627.0, 77335.0, 9699.0, 2043.0, 599.0, 225.0, 123.0, 70.0, 34.0, 28.0, 12.0, 12.0, 1.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.534423828125, -9.20947265625, -8.884521484375, -8.5595703125, -8.234619140625, -7.90966796875, -7.584716796875, -7.259765625, -6.934814453125, -6.60986328125, -6.284912109375, -5.9599609375, -5.635009765625, -5.31005859375, -4.985107421875, -4.66015625, -4.335205078125, -4.01025390625, -3.685302734375, -3.3603515625, -3.035400390625, -2.71044921875, -2.385498046875, -2.060546875, -1.735595703125, -1.41064453125, -1.085693359375, -0.7607421875, -0.435791015625, -0.11083984375, 0.214111328125, 0.5390625, 0.864013671875, 1.18896484375, 1.513916015625, 1.8388671875, 2.163818359375, 2.48876953125, 2.813720703125, 3.138671875, 3.463623046875, 3.78857421875, 4.113525390625, 4.4384765625, 4.763427734375, 5.08837890625, 5.413330078125, 5.73828125, 6.063232421875, 6.38818359375, 6.713134765625, 7.0380859375, 7.363037109375, 7.68798828125, 8.012939453125, 8.337890625, 8.662841796875, 8.98779296875, 9.312744140625, 9.6376953125, 9.962646484375, 10.28759765625, 10.612548828125, 10.9375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 14.0, 15.0, 15.0, 28.0, 38.0, 34.0, 30.0, 33.0, 29.0, 49.0, 52.0, 54.0, 59.0, 70.0, 48.0, 42.0, 45.0, 38.0, 45.0, 29.0, 36.0, 28.0, 24.0, 20.0, 22.0, 13.0, 11.0, 10.0, 13.0, 7.0, 7.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.390625, -11.0426025390625, -10.694580078125, -10.3465576171875, -9.99853515625, -9.6505126953125, -9.302490234375, -8.9544677734375, -8.6064453125, -8.2584228515625, -7.910400390625, -7.5623779296875, -7.21435546875, -6.8663330078125, -6.518310546875, -6.1702880859375, -5.822265625, -5.4742431640625, -5.126220703125, -4.7781982421875, -4.43017578125, -4.0821533203125, -3.734130859375, -3.3861083984375, -3.0380859375, -2.6900634765625, -2.342041015625, -1.9940185546875, -1.64599609375, -1.2979736328125, -0.949951171875, -0.6019287109375, -0.25390625, 0.0941162109375, 0.442138671875, 0.7901611328125, 1.13818359375, 1.4862060546875, 1.834228515625, 2.1822509765625, 2.5302734375, 2.8782958984375, 3.226318359375, 3.5743408203125, 3.92236328125, 4.2703857421875, 4.618408203125, 4.9664306640625, 5.314453125, 5.6624755859375, 6.010498046875, 6.3585205078125, 6.70654296875, 7.0545654296875, 7.402587890625, 7.7506103515625, 8.0986328125, 8.4466552734375, 8.794677734375, 9.1427001953125, 9.49072265625, 9.8387451171875, 10.186767578125, 10.5347900390625, 10.8828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 12.0, 7.0, 18.0, 24.0, 56.0, 97.0, 207.0, 422.0, 990.0, 2683.0, 8531.0, 36822.0, 274568.0, 641400.0, 64196.0, 12446.0, 3683.0, 1281.0, 575.0, 255.0, 137.0, 66.0, 34.0, 22.0, 10.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.2586669921875, -3.154052734375, -3.0494384765625, -2.94482421875, -2.8402099609375, -2.735595703125, -2.6309814453125, -2.5263671875, -2.4217529296875, -2.317138671875, -2.2125244140625, -2.10791015625, -2.0032958984375, -1.898681640625, -1.7940673828125, -1.689453125, -1.5848388671875, -1.480224609375, -1.3756103515625, -1.27099609375, -1.1663818359375, -1.061767578125, -0.9571533203125, -0.8525390625, -0.7479248046875, -0.643310546875, -0.5386962890625, -0.43408203125, -0.3294677734375, -0.224853515625, -0.1202392578125, -0.015625, 0.0889892578125, 0.193603515625, 0.2982177734375, 0.40283203125, 0.5074462890625, 0.612060546875, 0.7166748046875, 0.8212890625, 0.9259033203125, 1.030517578125, 1.1351318359375, 1.23974609375, 1.3443603515625, 1.448974609375, 1.5535888671875, 1.658203125, 1.7628173828125, 1.867431640625, 1.9720458984375, 2.07666015625, 2.1812744140625, 2.285888671875, 2.3905029296875, 2.4951171875, 2.5997314453125, 2.704345703125, 2.8089599609375, 2.91357421875, 3.0181884765625, 3.122802734375, 3.2274169921875, 3.33203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 19.0, 11.0, 27.0, 42.0, 78.0, 114.0, 139.0, 152.0, 127.0, 79.0, 65.0, 43.0, 28.0, 16.0, 9.0, 14.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0009713172912597656, -0.000942133367061615, -0.0009129494428634644, -0.0008837655186653137, -0.0008545815944671631, -0.0008253976702690125, -0.0007962137460708618, -0.0007670298218727112, -0.0007378458976745605, -0.0007086619734764099, -0.0006794780492782593, -0.0006502941250801086, -0.000621110200881958, -0.0005919262766838074, -0.0005627423524856567, -0.0005335584282875061, -0.0005043745040893555, -0.00047519057989120483, -0.0004460066556930542, -0.00041682273149490356, -0.00038763880729675293, -0.0003584548830986023, -0.00032927095890045166, -0.000300087034702301, -0.0002709031105041504, -0.00024171918630599976, -0.00021253526210784912, -0.00018335133790969849, -0.00015416741371154785, -0.00012498348951339722, -9.579956531524658e-05, -6.661564111709595e-05, -3.743171691894531e-05, -8.247792720794678e-06, 2.0936131477355957e-05, 5.012005567550659e-05, 7.930397987365723e-05, 0.00010848790407180786, 0.0001376718282699585, 0.00016685575246810913, 0.00019603967666625977, 0.0002252236008644104, 0.00025440752506256104, 0.00028359144926071167, 0.0003127753734588623, 0.00034195929765701294, 0.0003711432218551636, 0.0004003271460533142, 0.00042951107025146484, 0.0004586949944496155, 0.0004878789186477661, 0.0005170628428459167, 0.0005462467670440674, 0.000575430691242218, 0.0006046146154403687, 0.0006337985396385193, 0.0006629824638366699, 0.0006921663880348206, 0.0007213503122329712, 0.0007505342364311218, 0.0007797181606292725, 0.0008089020848274231, 0.0008380860090255737, 0.0008672699332237244, 0.000896453857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 13.0, 19.0, 28.0, 39.0, 60.0, 124.0, 270.0, 664.0, 1878.0, 5734.0, 20534.0, 105494.0, 689648.0, 180987.0, 30974.0, 7993.0, 2533.0, 850.0, 346.0, 162.0, 68.0, 55.0, 27.0, 16.0, 6.0, 10.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.44287109375, -2.3349609375, -2.22705078125, -2.119140625, -2.01123046875, -1.9033203125, -1.79541015625, -1.6875, -1.57958984375, -1.4716796875, -1.36376953125, -1.255859375, -1.14794921875, -1.0400390625, -0.93212890625, -0.82421875, -0.71630859375, -0.6083984375, -0.50048828125, -0.392578125, -0.28466796875, -0.1767578125, -0.06884765625, 0.0390625, 0.14697265625, 0.2548828125, 0.36279296875, 0.470703125, 0.57861328125, 0.6865234375, 0.79443359375, 0.90234375, 1.01025390625, 1.1181640625, 1.22607421875, 1.333984375, 1.44189453125, 1.5498046875, 1.65771484375, 1.765625, 1.87353515625, 1.9814453125, 2.08935546875, 2.197265625, 2.30517578125, 2.4130859375, 2.52099609375, 2.62890625, 2.73681640625, 2.8447265625, 2.95263671875, 3.060546875, 3.16845703125, 3.2763671875, 3.38427734375, 3.4921875, 3.60009765625, 3.7080078125, 3.81591796875, 3.923828125, 4.03173828125, 4.1396484375, 4.24755859375, 4.35546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 9.0, 9.0, 7.0, 18.0, 21.0, 27.0, 38.0, 44.0, 56.0, 97.0, 88.0, 106.0, 96.0, 78.0, 66.0, 58.0, 37.0, 25.0, 23.0, 17.0, 10.0, 9.0, 9.0, 7.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.668365478515625, -2.58673095703125, -2.505096435546875, -2.4234619140625, -2.341827392578125, -2.26019287109375, -2.178558349609375, -2.096923828125, -2.015289306640625, -1.93365478515625, -1.852020263671875, -1.7703857421875, -1.688751220703125, -1.60711669921875, -1.525482177734375, -1.44384765625, -1.362213134765625, -1.28057861328125, -1.198944091796875, -1.1173095703125, -1.035675048828125, -0.95404052734375, -0.872406005859375, -0.790771484375, -0.709136962890625, -0.62750244140625, -0.545867919921875, -0.4642333984375, -0.382598876953125, -0.30096435546875, -0.219329833984375, -0.1376953125, -0.056060791015625, 0.02557373046875, 0.107208251953125, 0.1888427734375, 0.270477294921875, 0.35211181640625, 0.433746337890625, 0.515380859375, 0.597015380859375, 0.67864990234375, 0.760284423828125, 0.8419189453125, 0.923553466796875, 1.00518798828125, 1.086822509765625, 1.16845703125, 1.250091552734375, 1.33172607421875, 1.413360595703125, 1.4949951171875, 1.576629638671875, 1.65826416015625, 1.739898681640625, 1.821533203125, 1.903167724609375, 1.98480224609375, 2.066436767578125, 2.1480712890625, 2.229705810546875, 2.31134033203125, 2.392974853515625, 2.474609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 17.0, 81.0, 209.0, 412.0, 164.0, 60.0, 24.0, 14.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.77953338623047, -104.3449478149414, -100.91035461425781, -97.47576904296875, -94.04118347167969, -90.6065902709961, -87.17200469970703, -83.73741149902344, -80.30282592773438, -76.86824035644531, -73.43364715576172, -69.99906158447266, -66.56446838378906, -63.1298828125, -59.69529724121094, -56.26070785522461, -52.82611846923828, -49.39152908325195, -45.956939697265625, -42.52235412597656, -39.087764739990234, -35.653175354003906, -32.218589782714844, -28.784000396728516, -25.349411010742188, -21.91482162475586, -18.480234146118164, -15.045645713806152, -11.61105728149414, -8.176467895507812, -4.741880416870117, -1.3072929382324219, 2.1273040771484375, 5.561892509460449, 8.996480941772461, 12.431069374084473, 15.865657806396484, 19.300247192382812, 22.734834671020508, 26.169422149658203, 29.60401153564453, 33.03860092163086, 36.47319030761719, 39.90777587890625, 43.34236526489258, 46.776954650878906, 50.21154022216797, 53.6461296081543, 57.080718994140625, 60.51530838012695, 63.94989776611328, 67.38448333740234, 70.81907653808594, 74.253662109375, 77.68824768066406, 81.12283325195312, 84.55742645263672, 87.99201202392578, 91.42660522460938, 94.86119079589844, 98.2957763671875, 101.7303695678711, 105.16495513916016, 108.59954833984375, 112.03413391113281]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 12.0, 10.0, 11.0, 16.0, 10.0, 17.0, 27.0, 25.0, 37.0, 40.0, 41.0, 45.0, 63.0, 84.0, 92.0, 76.0, 52.0, 42.0, 49.0, 32.0, 23.0, 23.0, 22.0, 30.0, 24.0, 15.0, 10.0, 16.0, 10.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.996734619140625, -39.50214385986328, -38.00755310058594, -36.512962341308594, -35.01837158203125, -33.52377700805664, -32.0291862487793, -30.534595489501953, -29.04000473022461, -27.545413970947266, -26.050823211669922, -24.556230545043945, -23.0616397857666, -21.567049026489258, -20.07245635986328, -18.577865600585938, -17.083274841308594, -15.58868408203125, -14.09409236907959, -12.59950065612793, -11.104909896850586, -9.610319137573242, -8.115727424621582, -6.621135711669922, -5.126544952392578, -3.631953716278076, -2.137362480163574, -0.6427712440490723, 0.8518199920654297, 2.3464112281799316, 3.8410024642944336, 5.335594177246094, 6.830181121826172, 8.324771881103516, 9.819363594055176, 11.313955307006836, 12.80854606628418, 14.303136825561523, 15.797728538513184, 17.292320251464844, 18.786911010742188, 20.28150177001953, 21.776092529296875, 23.27068519592285, 24.765275955200195, 26.25986671447754, 27.754459381103516, 29.24905014038086, 30.743640899658203, 32.23823165893555, 33.73282241821289, 35.227413177490234, 36.722007751464844, 38.21659851074219, 39.71118927001953, 41.205780029296875, 42.70037078857422, 44.19496154785156, 45.689552307128906, 47.18414306640625, 48.678733825683594, 50.1733283996582, 51.66791915893555, 53.16250991821289, 54.657100677490234]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 4.0, 8.0, 11.0, 14.0, 44.0, 93.0, 248.0, 742.0, 3134.0, 33449.0, 3973090.0, 174925.0, 6303.0, 1517.0, 470.0, 145.0, 45.0, 12.0, 5.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.3939208984375, -16.944091796875, -16.4942626953125, -16.04443359375, -15.5946044921875, -15.144775390625, -14.6949462890625, -14.2451171875, -13.7952880859375, -13.345458984375, -12.8956298828125, -12.44580078125, -11.9959716796875, -11.546142578125, -11.0963134765625, -10.646484375, -10.1966552734375, -9.746826171875, -9.2969970703125, -8.84716796875, -8.3973388671875, -7.947509765625, -7.4976806640625, -7.0478515625, -6.5980224609375, -6.148193359375, -5.6983642578125, -5.24853515625, -4.7987060546875, -4.348876953125, -3.8990478515625, -3.44921875, -2.9993896484375, -2.549560546875, -2.0997314453125, -1.64990234375, -1.2000732421875, -0.750244140625, -0.3004150390625, 0.1494140625, 0.5992431640625, 1.049072265625, 1.4989013671875, 1.94873046875, 2.3985595703125, 2.848388671875, 3.2982177734375, 3.748046875, 4.1978759765625, 4.647705078125, 5.0975341796875, 5.54736328125, 5.9971923828125, 6.447021484375, 6.8968505859375, 7.3466796875, 7.7965087890625, 8.246337890625, 8.6961669921875, 9.14599609375, 9.5958251953125, 10.045654296875, 10.4954833984375, 10.9453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 10.0, 11.0, 24.0, 37.0, 51.0, 49.0, 83.0, 80.0, 83.0, 95.0, 100.0, 107.0, 79.0, 60.0, 60.0, 30.0, 18.0, 12.0, 7.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.351776123046875, -8.16448974609375, -7.977203369140625, -7.7899169921875, -7.602630615234375, -7.41534423828125, -7.228057861328125, -7.040771484375, -6.853485107421875, -6.66619873046875, -6.478912353515625, -6.2916259765625, -6.104339599609375, -5.91705322265625, -5.729766845703125, -5.54248046875, -5.355194091796875, -5.16790771484375, -4.980621337890625, -4.7933349609375, -4.606048583984375, -4.41876220703125, -4.231475830078125, -4.044189453125, -3.856903076171875, -3.66961669921875, -3.482330322265625, -3.2950439453125, -3.107757568359375, -2.92047119140625, -2.733184814453125, -2.5458984375, -2.358612060546875, -2.17132568359375, -1.984039306640625, -1.7967529296875, -1.609466552734375, -1.42218017578125, -1.234893798828125, -1.047607421875, -0.860321044921875, -0.67303466796875, -0.485748291015625, -0.2984619140625, -0.111175537109375, 0.07611083984375, 0.263397216796875, 0.45068359375, 0.637969970703125, 0.82525634765625, 1.012542724609375, 1.1998291015625, 1.387115478515625, 1.57440185546875, 1.761688232421875, 1.948974609375, 2.136260986328125, 2.32354736328125, 2.510833740234375, 2.6981201171875, 2.885406494140625, 3.07269287109375, 3.259979248046875, 3.447265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 14.0, 14.0, 18.0, 45.0, 65.0, 75.0, 171.0, 446.0, 1931.0, 20443.0, 3781665.0, 380512.0, 7264.0, 981.0, 301.0, 124.0, 76.0, 45.0, 26.0, 18.0, 11.0, 11.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.6517333984375, -18.115966796875, -17.5802001953125, -17.04443359375, -16.5086669921875, -15.972900390625, -15.4371337890625, -14.9013671875, -14.3656005859375, -13.829833984375, -13.2940673828125, -12.75830078125, -12.2225341796875, -11.686767578125, -11.1510009765625, -10.615234375, -10.0794677734375, -9.543701171875, -9.0079345703125, -8.47216796875, -7.9364013671875, -7.400634765625, -6.8648681640625, -6.3291015625, -5.7933349609375, -5.257568359375, -4.7218017578125, -4.18603515625, -3.6502685546875, -3.114501953125, -2.5787353515625, -2.04296875, -1.5072021484375, -0.971435546875, -0.4356689453125, 0.10009765625, 0.6358642578125, 1.171630859375, 1.7073974609375, 2.2431640625, 2.7789306640625, 3.314697265625, 3.8504638671875, 4.38623046875, 4.9219970703125, 5.457763671875, 5.9935302734375, 6.529296875, 7.0650634765625, 7.600830078125, 8.1365966796875, 8.67236328125, 9.2081298828125, 9.743896484375, 10.2796630859375, 10.8154296875, 11.3511962890625, 11.886962890625, 12.4227294921875, 12.95849609375, 13.4942626953125, 14.030029296875, 14.5657958984375, 15.1015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 14.0, 16.0, 32.0, 49.0, 89.0, 181.0, 346.0, 768.0, 1055.0, 769.0, 342.0, 158.0, 84.0, 58.0, 33.0, 23.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.28125, -11.02203369140625, -10.7628173828125, -10.50360107421875, -10.244384765625, -9.98516845703125, -9.7259521484375, -9.46673583984375, -9.20751953125, -8.94830322265625, -8.6890869140625, -8.42987060546875, -8.170654296875, -7.91143798828125, -7.6522216796875, -7.39300537109375, -7.1337890625, -6.87457275390625, -6.6153564453125, -6.35614013671875, -6.096923828125, -5.83770751953125, -5.5784912109375, -5.31927490234375, -5.06005859375, -4.80084228515625, -4.5416259765625, -4.28240966796875, -4.023193359375, -3.76397705078125, -3.5047607421875, -3.24554443359375, -2.986328125, -2.72711181640625, -2.4678955078125, -2.20867919921875, -1.949462890625, -1.69024658203125, -1.4310302734375, -1.17181396484375, -0.91259765625, -0.65338134765625, -0.3941650390625, -0.13494873046875, 0.124267578125, 0.38348388671875, 0.6427001953125, 0.90191650390625, 1.1611328125, 1.42034912109375, 1.6795654296875, 1.93878173828125, 2.197998046875, 2.45721435546875, 2.7164306640625, 2.97564697265625, 3.23486328125, 3.49407958984375, 3.7532958984375, 4.01251220703125, 4.271728515625, 4.53094482421875, 4.7901611328125, 5.04937744140625, 5.30859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 17.0, 35.0, 59.0, 101.0, 135.0, 172.0, 183.0, 126.0, 72.0, 34.0, 25.0, 16.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.9763069152832, -62.090187072753906, -60.204063415527344, -58.31794357299805, -56.43182373046875, -54.54570007324219, -52.65958023071289, -50.773460388183594, -48.88733673095703, -47.001216888427734, -45.11509323120117, -43.228973388671875, -41.34285354614258, -39.45673370361328, -37.57061004638672, -35.68449020385742, -33.798370361328125, -31.912248611450195, -30.0261287689209, -28.14000701904297, -26.253887176513672, -24.367765426635742, -22.481643676757812, -20.595523834228516, -18.709402084350586, -16.823280334472656, -14.93716049194336, -13.05103874206543, -11.164917945861816, -9.278797149658203, -7.392675399780273, -5.50655460357666, -3.6204376220703125, -1.7343165874481201, 0.15180444717407227, 2.0379257202148438, 3.924046516418457, 5.81016731262207, 7.6962890625, 9.582409858703613, 11.468530654907227, 13.35465145111084, 15.240772247314453, 17.126893997192383, 19.013015747070312, 20.89913558959961, 22.78525733947754, 24.67137908935547, 26.557498931884766, 28.443620681762695, 30.329740524291992, 32.21586227416992, 34.10198211669922, 35.98810577392578, 37.87422561645508, 39.760345458984375, 41.64646911621094, 43.532588958740234, 45.4187126159668, 47.304832458496094, 49.19095230102539, 51.07707214355469, 52.96319580078125, 54.84931564331055, 56.735435485839844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 8.0, 6.0, 13.0, 14.0, 17.0, 14.0, 16.0, 22.0, 26.0, 32.0, 39.0, 37.0, 31.0, 37.0, 44.0, 31.0, 34.0, 30.0, 48.0, 41.0, 39.0, 37.0, 49.0, 37.0, 37.0, 33.0, 36.0, 30.0, 14.0, 24.0, 19.0, 17.0, 16.0, 9.0, 10.0, 8.0, 12.0, 6.0, 9.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.838489532470703, -21.08622932434082, -20.333969116210938, -19.581708908081055, -18.829448699951172, -18.07718849182129, -17.324928283691406, -16.572669982910156, -15.820408821105957, -15.068148612976074, -14.315888404846191, -13.563629150390625, -12.811368942260742, -12.05910873413086, -11.306848526000977, -10.554588317871094, -9.802328109741211, -9.050067901611328, -8.297807693481445, -7.545547962188721, -6.793287754058838, -6.041027545928955, -5.2887678146362305, -4.536507606506348, -3.784247398376465, -3.031987190246582, -2.2797272205352783, -1.5274672508239746, -0.7752070426940918, -0.022946834564208984, 0.7293128967285156, 1.4815731048583984, 2.2338333129882812, 2.986093521118164, 3.7383534908294678, 4.4906134605407715, 5.242873668670654, 5.995133876800537, 6.747393608093262, 7.4996538162231445, 8.251914024353027, 9.00417423248291, 9.756434440612793, 10.50869369506836, 11.260953903198242, 12.013214111328125, 12.765474319458008, 13.51773452758789, 14.269994735717773, 15.022254943847656, 15.774515151977539, 16.526775360107422, 17.279035568237305, 18.031295776367188, 18.783554077148438, 19.535816192626953, 20.288074493408203, 21.040334701538086, 21.79259490966797, 22.54485511779785, 23.297115325927734, 24.049375534057617, 24.8016357421875, 25.55389404296875, 26.306156158447266]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 2.0, 8.0, 17.0, 33.0, 48.0, 74.0, 149.0, 266.0, 628.0, 1544.0, 4680.0, 20301.0, 125945.0, 676924.0, 182321.0, 26197.0, 6209.0, 1763.0, 701.0, 331.0, 157.0, 86.0, 54.0, 26.0, 19.0, 13.0, 15.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.1015625, -9.78173828125, -9.4619140625, -9.14208984375, -8.822265625, -8.50244140625, -8.1826171875, -7.86279296875, -7.54296875, -7.22314453125, -6.9033203125, -6.58349609375, -6.263671875, -5.94384765625, -5.6240234375, -5.30419921875, -4.984375, -4.66455078125, -4.3447265625, -4.02490234375, -3.705078125, -3.38525390625, -3.0654296875, -2.74560546875, -2.42578125, -2.10595703125, -1.7861328125, -1.46630859375, -1.146484375, -0.82666015625, -0.5068359375, -0.18701171875, 0.1328125, 0.45263671875, 0.7724609375, 1.09228515625, 1.412109375, 1.73193359375, 2.0517578125, 2.37158203125, 2.69140625, 3.01123046875, 3.3310546875, 3.65087890625, 3.970703125, 4.29052734375, 4.6103515625, 4.93017578125, 5.25, 5.56982421875, 5.8896484375, 6.20947265625, 6.529296875, 6.84912109375, 7.1689453125, 7.48876953125, 7.80859375, 8.12841796875, 8.4482421875, 8.76806640625, 9.087890625, 9.40771484375, 9.7275390625, 10.04736328125, 10.3671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 14.0, 11.0, 18.0, 32.0, 33.0, 46.0, 47.0, 72.0, 80.0, 79.0, 78.0, 84.0, 86.0, 68.0, 67.0, 51.0, 50.0, 37.0, 14.0, 9.0, 12.0, 9.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0], "bins": [-7.85546875, -7.6873779296875, -7.519287109375, -7.3511962890625, -7.18310546875, -7.0150146484375, -6.846923828125, -6.6788330078125, -6.5107421875, -6.3426513671875, -6.174560546875, -6.0064697265625, -5.83837890625, -5.6702880859375, -5.502197265625, -5.3341064453125, -5.166015625, -4.9979248046875, -4.829833984375, -4.6617431640625, -4.49365234375, -4.3255615234375, -4.157470703125, -3.9893798828125, -3.8212890625, -3.6531982421875, -3.485107421875, -3.3170166015625, -3.14892578125, -2.9808349609375, -2.812744140625, -2.6446533203125, -2.4765625, -2.3084716796875, -2.140380859375, -1.9722900390625, -1.80419921875, -1.6361083984375, -1.468017578125, -1.2999267578125, -1.1318359375, -0.9637451171875, -0.795654296875, -0.6275634765625, -0.45947265625, -0.2913818359375, -0.123291015625, 0.0447998046875, 0.212890625, 0.3809814453125, 0.549072265625, 0.7171630859375, 0.88525390625, 1.0533447265625, 1.221435546875, 1.3895263671875, 1.5576171875, 1.7257080078125, 1.893798828125, 2.0618896484375, 2.22998046875, 2.3980712890625, 2.566162109375, 2.7342529296875, 2.90234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 3.0, 6.0, 8.0, 13.0, 13.0, 32.0, 37.0, 67.0, 105.0, 156.0, 285.0, 446.0, 872.0, 2182.0, 5722.0, 21613.0, 133080.0, 753310.0, 103656.0, 18134.0, 5094.0, 1796.0, 823.0, 407.0, 254.0, 145.0, 91.0, 56.0, 46.0, 27.0, 25.0, 10.0, 13.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.11309814453125, -9.8277587890625, -9.54241943359375, -9.257080078125, -8.97174072265625, -8.6864013671875, -8.40106201171875, -8.11572265625, -7.83038330078125, -7.5450439453125, -7.25970458984375, -6.974365234375, -6.68902587890625, -6.4036865234375, -6.11834716796875, -5.8330078125, -5.54766845703125, -5.2623291015625, -4.97698974609375, -4.691650390625, -4.40631103515625, -4.1209716796875, -3.83563232421875, -3.55029296875, -3.26495361328125, -2.9796142578125, -2.69427490234375, -2.408935546875, -2.12359619140625, -1.8382568359375, -1.55291748046875, -1.267578125, -0.98223876953125, -0.6968994140625, -0.41156005859375, -0.126220703125, 0.15911865234375, 0.4444580078125, 0.72979736328125, 1.01513671875, 1.30047607421875, 1.5858154296875, 1.87115478515625, 2.156494140625, 2.44183349609375, 2.7271728515625, 3.01251220703125, 3.2978515625, 3.58319091796875, 3.8685302734375, 4.15386962890625, 4.439208984375, 4.72454833984375, 5.0098876953125, 5.29522705078125, 5.58056640625, 5.86590576171875, 6.1512451171875, 6.43658447265625, 6.721923828125, 7.00726318359375, 7.2926025390625, 7.57794189453125, 7.86328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 6.0, 8.0, 17.0, 13.0, 26.0, 23.0, 27.0, 26.0, 38.0, 47.0, 59.0, 46.0, 54.0, 53.0, 61.0, 57.0, 56.0, 50.0, 56.0, 29.0, 34.0, 30.0, 32.0, 26.0, 19.0, 17.0, 20.0, 7.0, 12.0, 4.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3203125, -12.9134521484375, -12.506591796875, -12.0997314453125, -11.69287109375, -11.2860107421875, -10.879150390625, -10.4722900390625, -10.0654296875, -9.6585693359375, -9.251708984375, -8.8448486328125, -8.43798828125, -8.0311279296875, -7.624267578125, -7.2174072265625, -6.810546875, -6.4036865234375, -5.996826171875, -5.5899658203125, -5.18310546875, -4.7762451171875, -4.369384765625, -3.9625244140625, -3.5556640625, -3.1488037109375, -2.741943359375, -2.3350830078125, -1.92822265625, -1.5213623046875, -1.114501953125, -0.7076416015625, -0.30078125, 0.1060791015625, 0.512939453125, 0.9197998046875, 1.32666015625, 1.7335205078125, 2.140380859375, 2.5472412109375, 2.9541015625, 3.3609619140625, 3.767822265625, 4.1746826171875, 4.58154296875, 4.9884033203125, 5.395263671875, 5.8021240234375, 6.208984375, 6.6158447265625, 7.022705078125, 7.4295654296875, 7.83642578125, 8.2432861328125, 8.650146484375, 9.0570068359375, 9.4638671875, 9.8707275390625, 10.277587890625, 10.6844482421875, 11.09130859375, 11.4981689453125, 11.905029296875, 12.3118896484375, 12.71875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 22.0, 19.0, 37.0, 46.0, 54.0, 85.0, 129.0, 169.0, 274.0, 403.0, 620.0, 940.0, 1504.0, 2581.0, 4431.0, 8701.0, 19601.0, 50909.0, 212055.0, 618381.0, 76221.0, 26287.0, 11399.0, 5614.0, 3159.0, 1719.0, 1079.0, 678.0, 436.0, 264.0, 220.0, 131.0, 119.0, 64.0, 56.0, 43.0, 16.0, 19.0, 13.0, 12.0, 8.0, 4.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-3.759765625, -3.652862548828125, -3.54595947265625, -3.439056396484375, -3.3321533203125, -3.225250244140625, -3.11834716796875, -3.011444091796875, -2.904541015625, -2.797637939453125, -2.69073486328125, -2.583831787109375, -2.4769287109375, -2.370025634765625, -2.26312255859375, -2.156219482421875, -2.04931640625, -1.942413330078125, -1.83551025390625, -1.728607177734375, -1.6217041015625, -1.514801025390625, -1.40789794921875, -1.300994873046875, -1.194091796875, -1.087188720703125, -0.98028564453125, -0.873382568359375, -0.7664794921875, -0.659576416015625, -0.55267333984375, -0.445770263671875, -0.3388671875, -0.231964111328125, -0.12506103515625, -0.018157958984375, 0.0887451171875, 0.195648193359375, 0.30255126953125, 0.409454345703125, 0.516357421875, 0.623260498046875, 0.73016357421875, 0.837066650390625, 0.9439697265625, 1.050872802734375, 1.15777587890625, 1.264678955078125, 1.37158203125, 1.478485107421875, 1.58538818359375, 1.692291259765625, 1.7991943359375, 1.906097412109375, 2.01300048828125, 2.119903564453125, 2.226806640625, 2.333709716796875, 2.44061279296875, 2.547515869140625, 2.6544189453125, 2.761322021484375, 2.86822509765625, 2.975128173828125, 3.08203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 3.0, 14.0, 24.0, 20.0, 26.0, 57.0, 63.0, 99.0, 180.0, 175.0, 92.0, 74.0, 53.0, 25.0, 17.0, 11.0, 7.0, 4.0, 8.0, 4.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016317814588546753, -0.0015889108180999756, -0.0015460401773452759, -0.0015031695365905762, -0.0014602988958358765, -0.0014174282550811768, -0.001374557614326477, -0.0013316869735717773, -0.0012888163328170776, -0.001245945692062378, -0.0012030750513076782, -0.0011602044105529785, -0.0011173337697982788, -0.001074463129043579, -0.0010315924882888794, -0.0009887218475341797, -0.00094585120677948, -0.0009029805660247803, -0.0008601099252700806, -0.0008172392845153809, -0.0007743686437606812, -0.0007314980030059814, -0.0006886273622512817, -0.000645756721496582, -0.0006028860807418823, -0.0005600154399871826, -0.0005171447992324829, -0.0004742741584777832, -0.0004314035177230835, -0.0003885328769683838, -0.0003456622362136841, -0.0003027915954589844, -0.00025992095470428467, -0.00021705031394958496, -0.00017417967319488525, -0.00013130903244018555, -8.843839168548584e-05, -4.556775093078613e-05, -2.6971101760864258e-06, 4.017353057861328e-05, 8.304417133331299e-05, 0.0001259148120880127, 0.0001687854528427124, 0.0002116560935974121, 0.0002545267343521118, 0.0002973973751068115, 0.00034026801586151123, 0.00038313865661621094, 0.00042600929737091064, 0.00046887993812561035, 0.0005117505788803101, 0.0005546212196350098, 0.0005974918603897095, 0.0006403625011444092, 0.0006832331418991089, 0.0007261037826538086, 0.0007689744234085083, 0.000811845064163208, 0.0008547157049179077, 0.0008975863456726074, 0.0009404569864273071, 0.0009833276271820068, 0.0010261982679367065, 0.0010690689086914062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 9.0, 14.0, 23.0, 31.0, 51.0, 83.0, 177.0, 351.0, 831.0, 2639.0, 10889.0, 83740.0, 871936.0, 64711.0, 9298.0, 2308.0, 762.0, 298.0, 143.0, 82.0, 70.0, 30.0, 19.0, 12.0, 16.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.93359375, -7.67303466796875, -7.4124755859375, -7.15191650390625, -6.891357421875, -6.63079833984375, -6.3702392578125, -6.10968017578125, -5.84912109375, -5.58856201171875, -5.3280029296875, -5.06744384765625, -4.806884765625, -4.54632568359375, -4.2857666015625, -4.02520751953125, -3.7646484375, -3.50408935546875, -3.2435302734375, -2.98297119140625, -2.722412109375, -2.46185302734375, -2.2012939453125, -1.94073486328125, -1.68017578125, -1.41961669921875, -1.1590576171875, -0.89849853515625, -0.637939453125, -0.37738037109375, -0.1168212890625, 0.14373779296875, 0.404296875, 0.66485595703125, 0.9254150390625, 1.18597412109375, 1.446533203125, 1.70709228515625, 1.9676513671875, 2.22821044921875, 2.48876953125, 2.74932861328125, 3.0098876953125, 3.27044677734375, 3.531005859375, 3.79156494140625, 4.0521240234375, 4.31268310546875, 4.5732421875, 4.83380126953125, 5.0943603515625, 5.35491943359375, 5.615478515625, 5.87603759765625, 6.1365966796875, 6.39715576171875, 6.65771484375, 6.91827392578125, 7.1788330078125, 7.43939208984375, 7.699951171875, 7.96051025390625, 8.2210693359375, 8.48162841796875, 8.7421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 4.0, 9.0, 8.0, 11.0, 15.0, 18.0, 19.0, 23.0, 49.0, 45.0, 75.0, 82.0, 121.0, 105.0, 82.0, 81.0, 45.0, 45.0, 30.0, 21.0, 26.0, 16.0, 9.0, 14.0, 10.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.931640625, -3.8310546875, -3.73046875, -3.6298828125, -3.529296875, -3.4287109375, -3.328125, -3.2275390625, -3.126953125, -3.0263671875, -2.92578125, -2.8251953125, -2.724609375, -2.6240234375, -2.5234375, -2.4228515625, -2.322265625, -2.2216796875, -2.12109375, -2.0205078125, -1.919921875, -1.8193359375, -1.71875, -1.6181640625, -1.517578125, -1.4169921875, -1.31640625, -1.2158203125, -1.115234375, -1.0146484375, -0.9140625, -0.8134765625, -0.712890625, -0.6123046875, -0.51171875, -0.4111328125, -0.310546875, -0.2099609375, -0.109375, -0.0087890625, 0.091796875, 0.1923828125, 0.29296875, 0.3935546875, 0.494140625, 0.5947265625, 0.6953125, 0.7958984375, 0.896484375, 0.9970703125, 1.09765625, 1.1982421875, 1.298828125, 1.3994140625, 1.5, 1.6005859375, 1.701171875, 1.8017578125, 1.90234375, 2.0029296875, 2.103515625, 2.2041015625, 2.3046875, 2.4052734375, 2.505859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 11.0, 20.0, 60.0, 147.0, 328.0, 157.0, 118.0, 51.0, 39.0, 22.0, 15.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.82377624511719, -97.62581634521484, -94.42784881591797, -91.22988891601562, -88.03192138671875, -84.8339614868164, -81.63600158691406, -78.43803405761719, -75.24006652832031, -72.04210662841797, -68.8441390991211, -65.64617919921875, -62.448211669921875, -59.25025177001953, -56.05228805541992, -52.85432434082031, -49.65636444091797, -46.45840072631836, -43.26043701171875, -40.062477111816406, -36.86450958251953, -33.66654968261719, -30.468585968017578, -27.27062225341797, -24.07265853881836, -20.87469482421875, -17.67673110961914, -14.478769302368164, -11.280805587768555, -8.082841873168945, -4.884880065917969, -1.6869163513183594, 1.51104736328125, 4.709010601043701, 7.906973838806152, 11.104936599731445, 14.302900314331055, 17.500864028930664, 20.69882583618164, 23.89678955078125, 27.09475326538086, 30.29271697998047, 33.49068069458008, 36.68864440917969, 39.88660430908203, 43.084571838378906, 46.28253173828125, 49.48049545288086, 52.67845916748047, 55.87642288208008, 59.07438659667969, 62.27234649658203, 65.4703140258789, 68.66827392578125, 71.86624145507812, 75.06420135498047, 78.26216125488281, 81.46012115478516, 84.65808868408203, 87.85604858398438, 91.05401611328125, 94.2519760131836, 97.44993591308594, 100.64790344238281, 103.84587097167969]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 4.0, 4.0, 7.0, 5.0, 14.0, 18.0, 16.0, 18.0, 23.0, 27.0, 32.0, 30.0, 32.0, 21.0, 50.0, 53.0, 91.0, 107.0, 86.0, 52.0, 29.0, 34.0, 26.0, 23.0, 24.0, 28.0, 29.0, 23.0, 12.0, 13.0, 9.0, 9.0, 7.0, 14.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.551727294921875, -43.94677734375, -42.34182357788086, -40.736873626708984, -39.13192367553711, -37.52696990966797, -35.922019958496094, -34.31707000732422, -32.712120056152344, -31.107168197631836, -29.50221824645996, -27.897266387939453, -26.292316436767578, -24.68736457824707, -23.082412719726562, -21.477462768554688, -19.872509002685547, -18.26755714416504, -16.662607192993164, -15.057655334472656, -13.452704429626465, -11.847753524780273, -10.242801666259766, -8.637850761413574, -7.032899856567383, -5.427948951721191, -3.822997570037842, -2.218046188354492, -0.6130952835083008, 0.9918556213378906, 2.5968074798583984, 4.20175838470459, 5.806709289550781, 7.411660194396973, 9.016611099243164, 10.621562957763672, 12.226513862609863, 13.831464767456055, 15.436416625976562, 17.041366577148438, 18.646318435668945, 20.251270294189453, 21.856220245361328, 23.461172103881836, 25.066123962402344, 26.67107391357422, 28.276025772094727, 29.880977630615234, 31.48592758178711, 33.090877532958984, 34.695831298828125, 36.30078125, 37.905731201171875, 39.51068115234375, 41.11563491821289, 42.720584869384766, 44.325538635253906, 45.93048858642578, 47.53544235229492, 49.1403923034668, 50.74534225463867, 52.35029602050781, 53.95524597167969, 55.56019592285156, 57.16514587402344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 12.0, 23.0, 35.0, 43.0, 67.0, 114.0, 218.0, 413.0, 1190.0, 5520.0, 150746.0, 4000428.0, 30549.0, 3369.0, 850.0, 345.0, 142.0, 90.0, 37.0, 25.0, 18.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.578125, -25.9786376953125, -25.379150390625, -24.7796630859375, -24.18017578125, -23.5806884765625, -22.981201171875, -22.3817138671875, -21.7822265625, -21.1827392578125, -20.583251953125, -19.9837646484375, -19.38427734375, -18.7847900390625, -18.185302734375, -17.5858154296875, -16.986328125, -16.3868408203125, -15.787353515625, -15.1878662109375, -14.58837890625, -13.9888916015625, -13.389404296875, -12.7899169921875, -12.1904296875, -11.5909423828125, -10.991455078125, -10.3919677734375, -9.79248046875, -9.1929931640625, -8.593505859375, -7.9940185546875, -7.39453125, -6.7950439453125, -6.195556640625, -5.5960693359375, -4.99658203125, -4.3970947265625, -3.797607421875, -3.1981201171875, -2.5986328125, -1.9991455078125, -1.399658203125, -0.8001708984375, -0.20068359375, 0.3988037109375, 0.998291015625, 1.5977783203125, 2.197265625, 2.7967529296875, 3.396240234375, 3.9957275390625, 4.59521484375, 5.1947021484375, 5.794189453125, 6.3936767578125, 6.9931640625, 7.5926513671875, 8.192138671875, 8.7916259765625, 9.39111328125, 9.9906005859375, 10.590087890625, 11.1895751953125, 11.7890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 13.0, 23.0, 21.0, 24.0, 34.0, 35.0, 46.0, 58.0, 56.0, 55.0, 65.0, 45.0, 55.0, 56.0, 44.0, 59.0, 44.0, 37.0, 36.0, 32.0, 31.0, 24.0, 11.0, 13.0, 9.0, 8.0, 5.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.236328125, -3.118865966796875, -3.00140380859375, -2.883941650390625, -2.7664794921875, -2.649017333984375, -2.53155517578125, -2.414093017578125, -2.296630859375, -2.179168701171875, -2.06170654296875, -1.944244384765625, -1.8267822265625, -1.709320068359375, -1.59185791015625, -1.474395751953125, -1.35693359375, -1.239471435546875, -1.12200927734375, -1.004547119140625, -0.8870849609375, -0.769622802734375, -0.65216064453125, -0.534698486328125, -0.417236328125, -0.299774169921875, -0.18231201171875, -0.064849853515625, 0.0526123046875, 0.170074462890625, 0.28753662109375, 0.404998779296875, 0.5224609375, 0.639923095703125, 0.75738525390625, 0.874847412109375, 0.9923095703125, 1.109771728515625, 1.22723388671875, 1.344696044921875, 1.462158203125, 1.579620361328125, 1.69708251953125, 1.814544677734375, 1.9320068359375, 2.049468994140625, 2.16693115234375, 2.284393310546875, 2.40185546875, 2.519317626953125, 2.63677978515625, 2.754241943359375, 2.8717041015625, 2.989166259765625, 3.10662841796875, 3.224090576171875, 3.341552734375, 3.459014892578125, 3.57647705078125, 3.693939208984375, 3.8114013671875, 3.928863525390625, 4.04632568359375, 4.163787841796875, 4.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 21.0, 23.0, 38.0, 79.0, 142.0, 259.0, 563.0, 1675.0, 11358.0, 2611832.0, 1555981.0, 9779.0, 1463.0, 533.0, 236.0, 111.0, 69.0, 37.0, 24.0, 12.0, 11.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.1875, -15.51220703125, -14.8369140625, -14.16162109375, -13.486328125, -12.81103515625, -12.1357421875, -11.46044921875, -10.78515625, -10.10986328125, -9.4345703125, -8.75927734375, -8.083984375, -7.40869140625, -6.7333984375, -6.05810546875, -5.3828125, -4.70751953125, -4.0322265625, -3.35693359375, -2.681640625, -2.00634765625, -1.3310546875, -0.65576171875, 0.01953125, 0.69482421875, 1.3701171875, 2.04541015625, 2.720703125, 3.39599609375, 4.0712890625, 4.74658203125, 5.421875, 6.09716796875, 6.7724609375, 7.44775390625, 8.123046875, 8.79833984375, 9.4736328125, 10.14892578125, 10.82421875, 11.49951171875, 12.1748046875, 12.85009765625, 13.525390625, 14.20068359375, 14.8759765625, 15.55126953125, 16.2265625, 16.90185546875, 17.5771484375, 18.25244140625, 18.927734375, 19.60302734375, 20.2783203125, 20.95361328125, 21.62890625, 22.30419921875, 22.9794921875, 23.65478515625, 24.330078125, 25.00537109375, 25.6806640625, 26.35595703125, 27.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 13.0, 17.0, 19.0, 33.0, 39.0, 74.0, 141.0, 279.0, 521.0, 884.0, 867.0, 535.0, 303.0, 128.0, 77.0, 34.0, 27.0, 20.0, 10.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.820068359375, -9.52294921875, -9.225830078125, -8.9287109375, -8.631591796875, -8.33447265625, -8.037353515625, -7.740234375, -7.443115234375, -7.14599609375, -6.848876953125, -6.5517578125, -6.254638671875, -5.95751953125, -5.660400390625, -5.36328125, -5.066162109375, -4.76904296875, -4.471923828125, -4.1748046875, -3.877685546875, -3.58056640625, -3.283447265625, -2.986328125, -2.689208984375, -2.39208984375, -2.094970703125, -1.7978515625, -1.500732421875, -1.20361328125, -0.906494140625, -0.609375, -0.312255859375, -0.01513671875, 0.281982421875, 0.5791015625, 0.876220703125, 1.17333984375, 1.470458984375, 1.767578125, 2.064697265625, 2.36181640625, 2.658935546875, 2.9560546875, 3.253173828125, 3.55029296875, 3.847412109375, 4.14453125, 4.441650390625, 4.73876953125, 5.035888671875, 5.3330078125, 5.630126953125, 5.92724609375, 6.224365234375, 6.521484375, 6.818603515625, 7.11572265625, 7.412841796875, 7.7099609375, 8.007080078125, 8.30419921875, 8.601318359375, 8.8984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 17.0, 31.0, 51.0, 77.0, 136.0, 160.0, 191.0, 131.0, 71.0, 32.0, 25.0, 11.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.07937622070312, -96.48065948486328, -93.88194274902344, -91.2832260131836, -88.68450927734375, -86.0857925415039, -83.48707580566406, -80.88835906982422, -78.28964233398438, -75.69092559814453, -73.09220886230469, -70.49349212646484, -67.894775390625, -65.29605865478516, -62.69734191894531, -60.09862518310547, -57.499908447265625, -54.90119171142578, -52.30247497558594, -49.703758239746094, -47.10504150390625, -44.506324768066406, -41.90760803222656, -39.30889129638672, -36.710174560546875, -34.11145782470703, -31.512741088867188, -28.914024353027344, -26.3153076171875, -23.716590881347656, -21.117874145507812, -18.51915740966797, -15.920440673828125, -13.321723937988281, -10.723007202148438, -8.124290466308594, -5.52557373046875, -2.9268569946289062, -0.3281402587890625, 2.2705764770507812, 4.869293212890625, 7.468009948730469, 10.066726684570312, 12.665443420410156, 15.26416015625, 17.862876892089844, 20.461593627929688, 23.06031036376953, 25.659027099609375, 28.25774383544922, 30.856460571289062, 33.455177307128906, 36.05389404296875, 38.652610778808594, 41.25132751464844, 43.85004425048828, 46.448760986328125, 49.04747772216797, 51.64619445800781, 54.244911193847656, 56.8436279296875, 59.442344665527344, 62.04106140136719, 64.63977813720703, 67.23849487304688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 12.0, 10.0, 24.0, 10.0, 24.0, 31.0, 30.0, 32.0, 29.0, 42.0, 39.0, 39.0, 51.0, 55.0, 41.0, 44.0, 52.0, 44.0, 42.0, 50.0, 32.0, 35.0, 37.0, 45.0, 26.0, 19.0, 17.0, 19.0, 9.0, 10.0, 9.0, 8.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.138973236083984, -29.904857635498047, -28.67074203491211, -27.43662452697754, -26.2025089263916, -24.968393325805664, -23.734275817871094, -22.500160217285156, -21.26604461669922, -20.03192901611328, -18.797813415527344, -17.563695907592773, -16.329580307006836, -15.095464706420898, -13.861348152160645, -12.62723159790039, -11.393115997314453, -10.159000396728516, -8.924883842468262, -7.690767765045166, -6.45665168762207, -5.222535610198975, -3.988419532775879, -2.754302978515625, -1.5201873779296875, -0.2860713005065918, 0.9480447769165039, 2.1821608543395996, 3.4162769317626953, 4.650393009185791, 5.884509086608887, 7.118625640869141, 8.352745056152344, 9.586860656738281, 10.820977210998535, 12.055093765258789, 13.289209365844727, 14.523324966430664, 15.757441520690918, 16.991558074951172, 18.22567367553711, 19.459789276123047, 20.693904876708984, 21.928022384643555, 23.162137985229492, 24.39625358581543, 25.63037109375, 26.864486694335938, 28.098602294921875, 29.332717895507812, 30.56683349609375, 31.80095100402832, 33.035064697265625, 34.26918411254883, 35.503299713134766, 36.7374153137207, 37.97153091430664, 39.20564651489258, 40.439762115478516, 41.67387771606445, 42.907997131347656, 44.142112731933594, 45.37622833251953, 46.61034393310547, 47.844459533691406]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 23.0, 29.0, 54.0, 127.0, 228.0, 690.0, 2766.0, 16681.0, 182825.0, 758936.0, 74856.0, 8842.0, 1667.0, 455.0, 177.0, 76.0, 41.0, 26.0, 12.0, 14.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.6676025390625, -8.296142578125, -7.9246826171875, -7.55322265625, -7.1817626953125, -6.810302734375, -6.4388427734375, -6.0673828125, -5.6959228515625, -5.324462890625, -4.9530029296875, -4.58154296875, -4.2100830078125, -3.838623046875, -3.4671630859375, -3.095703125, -2.7242431640625, -2.352783203125, -1.9813232421875, -1.60986328125, -1.2384033203125, -0.866943359375, -0.4954833984375, -0.1240234375, 0.2474365234375, 0.618896484375, 0.9903564453125, 1.36181640625, 1.7332763671875, 2.104736328125, 2.4761962890625, 2.84765625, 3.2191162109375, 3.590576171875, 3.9620361328125, 4.33349609375, 4.7049560546875, 5.076416015625, 5.4478759765625, 5.8193359375, 6.1907958984375, 6.562255859375, 6.9337158203125, 7.30517578125, 7.6766357421875, 8.048095703125, 8.4195556640625, 8.791015625, 9.1624755859375, 9.533935546875, 9.9053955078125, 10.27685546875, 10.6483154296875, 11.019775390625, 11.3912353515625, 11.7626953125, 12.1341552734375, 12.505615234375, 12.8770751953125, 13.24853515625, 13.6199951171875, 13.991455078125, 14.3629150390625, 14.734375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 7.0, 14.0, 10.0, 20.0, 27.0, 43.0, 55.0, 58.0, 73.0, 84.0, 76.0, 78.0, 80.0, 72.0, 58.0, 50.0, 49.0, 49.0, 38.0, 22.0, 11.0, 10.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.875, -6.691162109375, -6.50732421875, -6.323486328125, -6.1396484375, -5.955810546875, -5.77197265625, -5.588134765625, -5.404296875, -5.220458984375, -5.03662109375, -4.852783203125, -4.6689453125, -4.485107421875, -4.30126953125, -4.117431640625, -3.93359375, -3.749755859375, -3.56591796875, -3.382080078125, -3.1982421875, -3.014404296875, -2.83056640625, -2.646728515625, -2.462890625, -2.279052734375, -2.09521484375, -1.911376953125, -1.7275390625, -1.543701171875, -1.35986328125, -1.176025390625, -0.9921875, -0.808349609375, -0.62451171875, -0.440673828125, -0.2568359375, -0.072998046875, 0.11083984375, 0.294677734375, 0.478515625, 0.662353515625, 0.84619140625, 1.030029296875, 1.2138671875, 1.397705078125, 1.58154296875, 1.765380859375, 1.94921875, 2.133056640625, 2.31689453125, 2.500732421875, 2.6845703125, 2.868408203125, 3.05224609375, 3.236083984375, 3.419921875, 3.603759765625, 3.78759765625, 3.971435546875, 4.1552734375, 4.339111328125, 4.52294921875, 4.706787109375, 4.890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 18.0, 22.0, 29.0, 42.0, 66.0, 94.0, 188.0, 334.0, 707.0, 1735.0, 6870.0, 79908.0, 908782.0, 41976.0, 5030.0, 1390.0, 582.0, 290.0, 163.0, 104.0, 60.0, 44.0, 34.0, 18.0, 9.0, 15.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2734375, -14.802001953125, -14.33056640625, -13.859130859375, -13.3876953125, -12.916259765625, -12.44482421875, -11.973388671875, -11.501953125, -11.030517578125, -10.55908203125, -10.087646484375, -9.6162109375, -9.144775390625, -8.67333984375, -8.201904296875, -7.73046875, -7.259033203125, -6.78759765625, -6.316162109375, -5.8447265625, -5.373291015625, -4.90185546875, -4.430419921875, -3.958984375, -3.487548828125, -3.01611328125, -2.544677734375, -2.0732421875, -1.601806640625, -1.13037109375, -0.658935546875, -0.1875, 0.283935546875, 0.75537109375, 1.226806640625, 1.6982421875, 2.169677734375, 2.64111328125, 3.112548828125, 3.583984375, 4.055419921875, 4.52685546875, 4.998291015625, 5.4697265625, 5.941162109375, 6.41259765625, 6.884033203125, 7.35546875, 7.826904296875, 8.29833984375, 8.769775390625, 9.2412109375, 9.712646484375, 10.18408203125, 10.655517578125, 11.126953125, 11.598388671875, 12.06982421875, 12.541259765625, 13.0126953125, 13.484130859375, 13.95556640625, 14.427001953125, 14.8984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 7.0, 15.0, 19.0, 28.0, 29.0, 49.0, 52.0, 86.0, 78.0, 82.0, 91.0, 91.0, 83.0, 56.0, 51.0, 43.0, 39.0, 17.0, 21.0, 12.0, 10.0, 5.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.87548828125, -18.1572265625, -17.43896484375, -16.720703125, -16.00244140625, -15.2841796875, -14.56591796875, -13.84765625, -13.12939453125, -12.4111328125, -11.69287109375, -10.974609375, -10.25634765625, -9.5380859375, -8.81982421875, -8.1015625, -7.38330078125, -6.6650390625, -5.94677734375, -5.228515625, -4.51025390625, -3.7919921875, -3.07373046875, -2.35546875, -1.63720703125, -0.9189453125, -0.20068359375, 0.517578125, 1.23583984375, 1.9541015625, 2.67236328125, 3.390625, 4.10888671875, 4.8271484375, 5.54541015625, 6.263671875, 6.98193359375, 7.7001953125, 8.41845703125, 9.13671875, 9.85498046875, 10.5732421875, 11.29150390625, 12.009765625, 12.72802734375, 13.4462890625, 14.16455078125, 14.8828125, 15.60107421875, 16.3193359375, 17.03759765625, 17.755859375, 18.47412109375, 19.1923828125, 19.91064453125, 20.62890625, 21.34716796875, 22.0654296875, 22.78369140625, 23.501953125, 24.22021484375, 24.9384765625, 25.65673828125, 26.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 6.0, 3.0, 8.0, 10.0, 15.0, 22.0, 18.0, 21.0, 45.0, 51.0, 87.0, 140.0, 241.0, 381.0, 792.0, 1836.0, 4942.0, 16634.0, 94434.0, 828256.0, 77989.0, 14630.0, 4490.0, 1716.0, 766.0, 402.0, 201.0, 116.0, 79.0, 58.0, 35.0, 35.0, 26.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8671875, -3.75811767578125, -3.6490478515625, -3.53997802734375, -3.430908203125, -3.32183837890625, -3.2127685546875, -3.10369873046875, -2.99462890625, -2.88555908203125, -2.7764892578125, -2.66741943359375, -2.558349609375, -2.44927978515625, -2.3402099609375, -2.23114013671875, -2.1220703125, -2.01300048828125, -1.9039306640625, -1.79486083984375, -1.685791015625, -1.57672119140625, -1.4676513671875, -1.35858154296875, -1.24951171875, -1.14044189453125, -1.0313720703125, -0.92230224609375, -0.813232421875, -0.70416259765625, -0.5950927734375, -0.48602294921875, -0.376953125, -0.26788330078125, -0.1588134765625, -0.04974365234375, 0.059326171875, 0.16839599609375, 0.2774658203125, 0.38653564453125, 0.49560546875, 0.60467529296875, 0.7137451171875, 0.82281494140625, 0.931884765625, 1.04095458984375, 1.1500244140625, 1.25909423828125, 1.3681640625, 1.47723388671875, 1.5863037109375, 1.69537353515625, 1.804443359375, 1.91351318359375, 2.0225830078125, 2.13165283203125, 2.24072265625, 2.34979248046875, 2.4588623046875, 2.56793212890625, 2.677001953125, 2.78607177734375, 2.8951416015625, 3.00421142578125, 3.11328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 9.0, 2.0, 16.0, 16.0, 27.0, 29.0, 90.0, 174.0, 269.0, 165.0, 87.0, 41.0, 17.0, 15.0, 4.0, 12.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009775161743164062, -0.0009319484233856201, -0.000886380672454834, -0.0008408129215240479, -0.0007952451705932617, -0.0007496774196624756, -0.0007041096687316895, -0.0006585419178009033, -0.0006129741668701172, -0.0005674064159393311, -0.0005218386650085449, -0.0004762709140777588, -0.00043070316314697266, -0.0003851354122161865, -0.0003395676612854004, -0.00029399991035461426, -0.0002484321594238281, -0.000202864408493042, -0.00015729665756225586, -0.00011172890663146973, -6.61611557006836e-05, -2.059340476989746e-05, 2.4974346160888672e-05, 7.05420970916748e-05, 0.00011610984802246094, 0.00016167759895324707, 0.0002072453498840332, 0.00025281310081481934, 0.00029838085174560547, 0.0003439486026763916, 0.00038951635360717773, 0.00043508410453796387, 0.00048065185546875, 0.0005262196063995361, 0.0005717873573303223, 0.0006173551082611084, 0.0006629228591918945, 0.0007084906101226807, 0.0007540583610534668, 0.0007996261119842529, 0.0008451938629150391, 0.0008907616138458252, 0.0009363293647766113, 0.0009818971157073975, 0.0010274648666381836, 0.0010730326175689697, 0.0011186003684997559, 0.001164168119430542, 0.0012097358703613281, 0.0012553036212921143, 0.0013008713722229004, 0.0013464391231536865, 0.0013920068740844727, 0.0014375746250152588, 0.001483142375946045, 0.001528710126876831, 0.0015742778778076172, 0.0016198456287384033, 0.0016654133796691895, 0.0017109811305999756, 0.0017565488815307617, 0.0018021166324615479, 0.001847684383392334, 0.0018932521343231201, 0.0019388198852539062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 10.0, 6.0, 10.0, 16.0, 12.0, 22.0, 35.0, 49.0, 88.0, 145.0, 250.0, 437.0, 774.0, 1587.0, 3715.0, 10285.0, 36753.0, 226655.0, 682974.0, 60569.0, 15007.0, 4989.0, 2033.0, 902.0, 482.0, 304.0, 152.0, 87.0, 61.0, 43.0, 25.0, 18.0, 17.0, 8.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.09375, -2.007080078125, -1.92041015625, -1.833740234375, -1.7470703125, -1.660400390625, -1.57373046875, -1.487060546875, -1.400390625, -1.313720703125, -1.22705078125, -1.140380859375, -1.0537109375, -0.967041015625, -0.88037109375, -0.793701171875, -0.70703125, -0.620361328125, -0.53369140625, -0.447021484375, -0.3603515625, -0.273681640625, -0.18701171875, -0.100341796875, -0.013671875, 0.072998046875, 0.15966796875, 0.246337890625, 0.3330078125, 0.419677734375, 0.50634765625, 0.593017578125, 0.6796875, 0.766357421875, 0.85302734375, 0.939697265625, 1.0263671875, 1.113037109375, 1.19970703125, 1.286376953125, 1.373046875, 1.459716796875, 1.54638671875, 1.633056640625, 1.7197265625, 1.806396484375, 1.89306640625, 1.979736328125, 2.06640625, 2.153076171875, 2.23974609375, 2.326416015625, 2.4130859375, 2.499755859375, 2.58642578125, 2.673095703125, 2.759765625, 2.846435546875, 2.93310546875, 3.019775390625, 3.1064453125, 3.193115234375, 3.27978515625, 3.366455078125, 3.453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 3.0, 5.0, 3.0, 9.0, 7.0, 10.0, 18.0, 15.0, 19.0, 25.0, 21.0, 41.0, 35.0, 52.0, 66.0, 90.0, 64.0, 72.0, 75.0, 54.0, 50.0, 59.0, 30.0, 33.0, 15.0, 20.0, 16.0, 18.0, 6.0, 13.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7412109375, -1.6834716796875, -1.625732421875, -1.5679931640625, -1.51025390625, -1.4525146484375, -1.394775390625, -1.3370361328125, -1.279296875, -1.2215576171875, -1.163818359375, -1.1060791015625, -1.04833984375, -0.9906005859375, -0.932861328125, -0.8751220703125, -0.8173828125, -0.7596435546875, -0.701904296875, -0.6441650390625, -0.58642578125, -0.5286865234375, -0.470947265625, -0.4132080078125, -0.35546875, -0.2977294921875, -0.239990234375, -0.1822509765625, -0.12451171875, -0.0667724609375, -0.009033203125, 0.0487060546875, 0.1064453125, 0.1641845703125, 0.221923828125, 0.2796630859375, 0.33740234375, 0.3951416015625, 0.452880859375, 0.5106201171875, 0.568359375, 0.6260986328125, 0.683837890625, 0.7415771484375, 0.79931640625, 0.8570556640625, 0.914794921875, 0.9725341796875, 1.0302734375, 1.0880126953125, 1.145751953125, 1.2034912109375, 1.26123046875, 1.3189697265625, 1.376708984375, 1.4344482421875, 1.4921875, 1.5499267578125, 1.607666015625, 1.6654052734375, 1.72314453125, 1.7808837890625, 1.838623046875, 1.8963623046875, 1.9541015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 36.0, 152.0, 588.0, 175.0, 31.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.16714477539062, -176.7618865966797, -170.3566131591797, -163.95135498046875, -157.5460968017578, -151.1408233642578, -144.73556518554688, -138.33029174804688, -131.92503356933594, -125.51976776123047, -119.11450958251953, -112.70924377441406, -106.3039779663086, -99.89871215820312, -93.49345397949219, -87.08818817138672, -80.68292999267578, -74.27766418457031, -67.87240600585938, -61.467140197753906, -55.06187438964844, -48.656612396240234, -42.25135040283203, -35.84608459472656, -29.44082260131836, -23.035558700561523, -16.630294799804688, -10.225032806396484, -3.8197689056396484, 2.5854949951171875, 8.99075698852539, 15.39602279663086, 21.801284790039062, 28.2065486907959, 34.611812591552734, 41.01707458496094, 47.422340393066406, 53.82760238647461, 60.23286437988281, 66.63813018798828, 73.04339599609375, 79.44866180419922, 85.85391998291016, 92.25918579101562, 98.6644515991211, 105.06971740722656, 111.4749755859375, 117.88024139404297, 124.2854995727539, 130.69076538085938, 137.0960235595703, 143.50128173828125, 149.90655517578125, 156.3118133544922, 162.71707153320312, 169.12234497070312, 175.52760314941406, 181.932861328125, 188.338134765625, 194.74339294433594, 201.14865112304688, 207.55392456054688, 213.9591827392578, 220.36444091796875, 226.76971435546875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 8.0, 11.0, 7.0, 9.0, 21.0, 18.0, 18.0, 23.0, 34.0, 32.0, 20.0, 49.0, 52.0, 57.0, 144.0, 134.0, 54.0, 55.0, 35.0, 40.0, 24.0, 25.0, 24.0, 21.0, 13.0, 13.0, 15.0, 13.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-86.34188842773438, -84.12348175048828, -81.90506744384766, -79.68666076660156, -77.46825408935547, -75.24983978271484, -73.03143310546875, -70.81302642822266, -68.59461212158203, -66.37620544433594, -64.15779113769531, -61.93938446044922, -59.72097396850586, -57.5025634765625, -55.284156799316406, -53.06574630737305, -50.84733963012695, -48.628929138183594, -46.4105224609375, -44.19211196899414, -41.97370147705078, -39.75529479980469, -37.53688430786133, -35.31847381591797, -33.100067138671875, -30.88165855407715, -28.66324806213379, -26.444839477539062, -24.226428985595703, -22.008020401000977, -19.78961181640625, -17.57120132446289, -15.352787017822266, -13.134377479553223, -10.91596794128418, -8.697559356689453, -6.47914981842041, -4.260740280151367, -2.0423316955566406, 0.17607784271240234, 2.3944873809814453, 4.612896919250488, 6.831305980682373, 9.049715042114258, 11.2681245803833, 13.486534118652344, 15.70494270324707, 17.923351287841797, 20.141761779785156, 22.360170364379883, 24.578580856323242, 26.79698944091797, 29.015399932861328, 31.233808517456055, 33.45221710205078, 35.67062759399414, 37.8890380859375, 40.10744857788086, 42.32585525512695, 44.54426574707031, 46.76267623901367, 48.98108673095703, 51.199493408203125, 53.417903900146484, 55.63631057739258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 21.0, 15.0, 20.0, 24.0, 55.0, 77.0, 143.0, 336.0, 820.0, 2774.0, 12388.0, 182744.0, 3555789.0, 412636.0, 20113.0, 4276.0, 1251.0, 434.0, 179.0, 73.0, 45.0, 24.0, 9.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.8125, -20.3458251953125, -19.879150390625, -19.4124755859375, -18.94580078125, -18.4791259765625, -18.012451171875, -17.5457763671875, -17.0791015625, -16.6124267578125, -16.145751953125, -15.6790771484375, -15.21240234375, -14.7457275390625, -14.279052734375, -13.8123779296875, -13.345703125, -12.8790283203125, -12.412353515625, -11.9456787109375, -11.47900390625, -11.0123291015625, -10.545654296875, -10.0789794921875, -9.6123046875, -9.1456298828125, -8.678955078125, -8.2122802734375, -7.74560546875, -7.2789306640625, -6.812255859375, -6.3455810546875, -5.87890625, -5.4122314453125, -4.945556640625, -4.4788818359375, -4.01220703125, -3.5455322265625, -3.078857421875, -2.6121826171875, -2.1455078125, -1.6788330078125, -1.212158203125, -0.7454833984375, -0.27880859375, 0.1878662109375, 0.654541015625, 1.1212158203125, 1.587890625, 2.0545654296875, 2.521240234375, 2.9879150390625, 3.45458984375, 3.9212646484375, 4.387939453125, 4.8546142578125, 5.3212890625, 5.7879638671875, 6.254638671875, 6.7213134765625, 7.18798828125, 7.6546630859375, 8.121337890625, 8.5880126953125, 9.0546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 10.0, 7.0, 10.0, 10.0, 13.0, 26.0, 30.0, 23.0, 47.0, 30.0, 49.0, 54.0, 56.0, 61.0, 58.0, 69.0, 49.0, 58.0, 51.0, 55.0, 45.0, 50.0, 30.0, 27.0, 19.0, 19.0, 14.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-5.89453125, -5.75970458984375, -5.6248779296875, -5.49005126953125, -5.355224609375, -5.22039794921875, -5.0855712890625, -4.95074462890625, -4.81591796875, -4.68109130859375, -4.5462646484375, -4.41143798828125, -4.276611328125, -4.14178466796875, -4.0069580078125, -3.87213134765625, -3.7373046875, -3.60247802734375, -3.4676513671875, -3.33282470703125, -3.197998046875, -3.06317138671875, -2.9283447265625, -2.79351806640625, -2.65869140625, -2.52386474609375, -2.3890380859375, -2.25421142578125, -2.119384765625, -1.98455810546875, -1.8497314453125, -1.71490478515625, -1.580078125, -1.44525146484375, -1.3104248046875, -1.17559814453125, -1.040771484375, -0.90594482421875, -0.7711181640625, -0.63629150390625, -0.50146484375, -0.36663818359375, -0.2318115234375, -0.09698486328125, 0.037841796875, 0.17266845703125, 0.3074951171875, 0.44232177734375, 0.5771484375, 0.71197509765625, 0.8468017578125, 0.98162841796875, 1.116455078125, 1.25128173828125, 1.3861083984375, 1.52093505859375, 1.65576171875, 1.79058837890625, 1.9254150390625, 2.06024169921875, 2.195068359375, 2.32989501953125, 2.4647216796875, 2.59954833984375, 2.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 25.0, 23.0, 57.0, 112.0, 270.0, 982.0, 6457.0, 4123920.0, 59474.0, 2125.0, 507.0, 186.0, 57.0, 39.0, 14.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.3125, -62.51318359375, -60.7138671875, -58.91455078125, -57.115234375, -55.31591796875, -53.5166015625, -51.71728515625, -49.91796875, -48.11865234375, -46.3193359375, -44.52001953125, -42.720703125, -40.92138671875, -39.1220703125, -37.32275390625, -35.5234375, -33.72412109375, -31.9248046875, -30.12548828125, -28.326171875, -26.52685546875, -24.7275390625, -22.92822265625, -21.12890625, -19.32958984375, -17.5302734375, -15.73095703125, -13.931640625, -12.13232421875, -10.3330078125, -8.53369140625, -6.734375, -4.93505859375, -3.1357421875, -1.33642578125, 0.462890625, 2.26220703125, 4.0615234375, 5.86083984375, 7.66015625, 9.45947265625, 11.2587890625, 13.05810546875, 14.857421875, 16.65673828125, 18.4560546875, 20.25537109375, 22.0546875, 23.85400390625, 25.6533203125, 27.45263671875, 29.251953125, 31.05126953125, 32.8505859375, 34.64990234375, 36.44921875, 38.24853515625, 40.0478515625, 41.84716796875, 43.646484375, 45.44580078125, 47.2451171875, 49.04443359375, 50.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 9.0, 16.0, 29.0, 72.0, 195.0, 457.0, 1305.0, 1213.0, 475.0, 162.0, 78.0, 33.0, 17.0, 10.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.0, -43.0638427734375, -42.127685546875, -41.1915283203125, -40.25537109375, -39.3192138671875, -38.383056640625, -37.4468994140625, -36.5107421875, -35.5745849609375, -34.638427734375, -33.7022705078125, -32.76611328125, -31.8299560546875, -30.893798828125, -29.9576416015625, -29.021484375, -28.0853271484375, -27.149169921875, -26.2130126953125, -25.27685546875, -24.3406982421875, -23.404541015625, -22.4683837890625, -21.5322265625, -20.5960693359375, -19.659912109375, -18.7237548828125, -17.78759765625, -16.8514404296875, -15.915283203125, -14.9791259765625, -14.04296875, -13.1068115234375, -12.170654296875, -11.2344970703125, -10.29833984375, -9.3621826171875, -8.426025390625, -7.4898681640625, -6.5537109375, -5.6175537109375, -4.681396484375, -3.7452392578125, -2.80908203125, -1.8729248046875, -0.936767578125, -0.0006103515625, 0.935546875, 1.8717041015625, 2.807861328125, 3.7440185546875, 4.68017578125, 5.6163330078125, 6.552490234375, 7.4886474609375, 8.4248046875, 9.3609619140625, 10.297119140625, 11.2332763671875, 12.16943359375, 13.1055908203125, 14.041748046875, 14.9779052734375, 15.9140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 12.0, 30.0, 59.0, 125.0, 211.0, 225.0, 151.0, 73.0, 34.0, 16.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.0352325439453, -140.95846557617188, -134.88169860839844, -128.804931640625, -122.72816467285156, -116.65139770507812, -110.57463073730469, -104.49786376953125, -98.42109680175781, -92.34432983398438, -86.26756286621094, -80.1907958984375, -74.11402893066406, -68.03726196289062, -61.96049499511719, -55.88372802734375, -49.80696105957031, -43.730194091796875, -37.65342712402344, -31.57666015625, -25.499893188476562, -19.423126220703125, -13.346359252929688, -7.26959228515625, -1.1928253173828125, 4.883941650390625, 10.960708618164062, 17.0374755859375, 23.114242553710938, 29.191009521484375, 35.26777648925781, 41.34454345703125, 47.42132568359375, 53.49809265136719, 59.574859619140625, 65.65162658691406, 71.7283935546875, 77.80516052246094, 83.88192749023438, 89.95869445800781, 96.03546142578125, 102.11222839355469, 108.18899536132812, 114.26576232910156, 120.342529296875, 126.41929626464844, 132.49606323242188, 138.5728302001953, 144.64959716796875, 150.7263641357422, 156.80313110351562, 162.87989807128906, 168.9566650390625, 175.03343200683594, 181.11019897460938, 187.1869659423828, 193.26373291015625, 199.3404998779297, 205.41726684570312, 211.49403381347656, 217.57080078125, 223.64756774902344, 229.72433471679688, 235.8011016845703, 241.87786865234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 10.0, 10.0, 8.0, 10.0, 18.0, 16.0, 28.0, 35.0, 59.0, 53.0, 71.0, 73.0, 89.0, 113.0, 80.0, 76.0, 53.0, 41.0, 30.0, 27.0, 22.0, 22.0, 22.0, 9.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.29942321777344, -93.79444885253906, -90.28946685791016, -86.78449249267578, -83.27951049804688, -79.7745361328125, -76.26956176757812, -72.76457977294922, -69.25959777832031, -65.75462341308594, -62.24964141845703, -58.744667053222656, -55.23968505859375, -51.734710693359375, -48.229732513427734, -44.724754333496094, -41.21977996826172, -37.71480178833008, -34.20982360839844, -30.70484733581543, -27.19986915588379, -23.69489097595215, -20.18991470336914, -16.6849365234375, -13.17995834350586, -9.674980163574219, -6.1700029373168945, -2.6650257110595703, 0.8399524688720703, 4.344930648803711, 7.849906921386719, 11.35488510131836, 14.859855651855469, 18.36483383178711, 21.86981201171875, 25.374788284301758, 28.8797664642334, 32.384742736816406, 35.88972091674805, 39.39469909667969, 42.89967727661133, 46.40465545654297, 49.90963363647461, 53.41461181640625, 56.919586181640625, 60.42456817626953, 63.929542541503906, 67.43452453613281, 70.93949890136719, 74.44447326660156, 77.94945526123047, 81.45442962646484, 84.95941162109375, 88.46438598632812, 91.9693603515625, 95.4743423461914, 98.97932434082031, 102.48429870605469, 105.9892807006836, 109.49425506591797, 112.99923706054688, 116.50421142578125, 120.00918579101562, 123.51416778564453, 127.0191421508789]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 19.0, 11.0, 25.0, 53.0, 45.0, 84.0, 151.0, 257.0, 408.0, 876.0, 1985.0, 5252.0, 19716.0, 128497.0, 764974.0, 101054.0, 16832.0, 4767.0, 1785.0, 753.0, 408.0, 230.0, 121.0, 81.0, 50.0, 47.0, 22.0, 13.0, 15.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.8197021484375, -8.530029296875, -8.2403564453125, -7.95068359375, -7.6610107421875, -7.371337890625, -7.0816650390625, -6.7919921875, -6.5023193359375, -6.212646484375, -5.9229736328125, -5.63330078125, -5.3436279296875, -5.053955078125, -4.7642822265625, -4.474609375, -4.1849365234375, -3.895263671875, -3.6055908203125, -3.31591796875, -3.0262451171875, -2.736572265625, -2.4468994140625, -2.1572265625, -1.8675537109375, -1.577880859375, -1.2882080078125, -0.99853515625, -0.7088623046875, -0.419189453125, -0.1295166015625, 0.16015625, 0.4498291015625, 0.739501953125, 1.0291748046875, 1.31884765625, 1.6085205078125, 1.898193359375, 2.1878662109375, 2.4775390625, 2.7672119140625, 3.056884765625, 3.3465576171875, 3.63623046875, 3.9259033203125, 4.215576171875, 4.5052490234375, 4.794921875, 5.0845947265625, 5.374267578125, 5.6639404296875, 5.95361328125, 6.2432861328125, 6.532958984375, 6.8226318359375, 7.1123046875, 7.4019775390625, 7.691650390625, 7.9813232421875, 8.27099609375, 8.5606689453125, 8.850341796875, 9.1400146484375, 9.4296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 11.0, 16.0, 23.0, 12.0, 21.0, 42.0, 59.0, 74.0, 80.0, 77.0, 94.0, 87.0, 86.0, 74.0, 61.0, 57.0, 38.0, 33.0, 13.0, 13.0, 11.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0546875, -8.8013916015625, -8.548095703125, -8.2947998046875, -8.04150390625, -7.7882080078125, -7.534912109375, -7.2816162109375, -7.0283203125, -6.7750244140625, -6.521728515625, -6.2684326171875, -6.01513671875, -5.7618408203125, -5.508544921875, -5.2552490234375, -5.001953125, -4.7486572265625, -4.495361328125, -4.2420654296875, -3.98876953125, -3.7354736328125, -3.482177734375, -3.2288818359375, -2.9755859375, -2.7222900390625, -2.468994140625, -2.2156982421875, -1.96240234375, -1.7091064453125, -1.455810546875, -1.2025146484375, -0.94921875, -0.6959228515625, -0.442626953125, -0.1893310546875, 0.06396484375, 0.3172607421875, 0.570556640625, 0.8238525390625, 1.0771484375, 1.3304443359375, 1.583740234375, 1.8370361328125, 2.09033203125, 2.3436279296875, 2.596923828125, 2.8502197265625, 3.103515625, 3.3568115234375, 3.610107421875, 3.8634033203125, 4.11669921875, 4.3699951171875, 4.623291015625, 4.8765869140625, 5.1298828125, 5.3831787109375, 5.636474609375, 5.8897705078125, 6.14306640625, 6.3963623046875, 6.649658203125, 6.9029541015625, 7.15625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 7.0, 6.0, 13.0, 10.0, 10.0, 24.0, 18.0, 34.0, 39.0, 67.0, 91.0, 120.0, 206.0, 380.0, 724.0, 1863.0, 6650.0, 54050.0, 915498.0, 58082.0, 6965.0, 1833.0, 751.0, 387.0, 227.0, 152.0, 92.0, 54.0, 49.0, 30.0, 35.0, 18.0, 8.0, 17.0, 12.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.1015625, -9.781005859375, -9.46044921875, -9.139892578125, -8.8193359375, -8.498779296875, -8.17822265625, -7.857666015625, -7.537109375, -7.216552734375, -6.89599609375, -6.575439453125, -6.2548828125, -5.934326171875, -5.61376953125, -5.293212890625, -4.97265625, -4.652099609375, -4.33154296875, -4.010986328125, -3.6904296875, -3.369873046875, -3.04931640625, -2.728759765625, -2.408203125, -2.087646484375, -1.76708984375, -1.446533203125, -1.1259765625, -0.805419921875, -0.48486328125, -0.164306640625, 0.15625, 0.476806640625, 0.79736328125, 1.117919921875, 1.4384765625, 1.759033203125, 2.07958984375, 2.400146484375, 2.720703125, 3.041259765625, 3.36181640625, 3.682373046875, 4.0029296875, 4.323486328125, 4.64404296875, 4.964599609375, 5.28515625, 5.605712890625, 5.92626953125, 6.246826171875, 6.5673828125, 6.887939453125, 7.20849609375, 7.529052734375, 7.849609375, 8.170166015625, 8.49072265625, 8.811279296875, 9.1318359375, 9.452392578125, 9.77294921875, 10.093505859375, 10.4140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 6.0, 10.0, 7.0, 15.0, 11.0, 25.0, 27.0, 29.0, 35.0, 34.0, 44.0, 49.0, 65.0, 72.0, 90.0, 76.0, 63.0, 49.0, 49.0, 47.0, 35.0, 32.0, 22.0, 21.0, 20.0, 14.0, 14.0, 4.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.576904296875, -16.93505859375, -16.293212890625, -15.6513671875, -15.009521484375, -14.36767578125, -13.725830078125, -13.083984375, -12.442138671875, -11.80029296875, -11.158447265625, -10.5166015625, -9.874755859375, -9.23291015625, -8.591064453125, -7.94921875, -7.307373046875, -6.66552734375, -6.023681640625, -5.3818359375, -4.739990234375, -4.09814453125, -3.456298828125, -2.814453125, -2.172607421875, -1.53076171875, -0.888916015625, -0.2470703125, 0.394775390625, 1.03662109375, 1.678466796875, 2.3203125, 2.962158203125, 3.60400390625, 4.245849609375, 4.8876953125, 5.529541015625, 6.17138671875, 6.813232421875, 7.455078125, 8.096923828125, 8.73876953125, 9.380615234375, 10.0224609375, 10.664306640625, 11.30615234375, 11.947998046875, 12.58984375, 13.231689453125, 13.87353515625, 14.515380859375, 15.1572265625, 15.799072265625, 16.44091796875, 17.082763671875, 17.724609375, 18.366455078125, 19.00830078125, 19.650146484375, 20.2919921875, 20.933837890625, 21.57568359375, 22.217529296875, 22.859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 11.0, 14.0, 20.0, 34.0, 60.0, 95.0, 203.0, 448.0, 1210.0, 5101.0, 55131.0, 957649.0, 23786.0, 3183.0, 835.0, 328.0, 155.0, 108.0, 57.0, 39.0, 19.0, 23.0, 9.0, 10.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.884765625, -2.7864990234375, -2.688232421875, -2.5899658203125, -2.49169921875, -2.3934326171875, -2.295166015625, -2.1968994140625, -2.0986328125, -2.0003662109375, -1.902099609375, -1.8038330078125, -1.70556640625, -1.6072998046875, -1.509033203125, -1.4107666015625, -1.3125, -1.2142333984375, -1.115966796875, -1.0177001953125, -0.91943359375, -0.8211669921875, -0.722900390625, -0.6246337890625, -0.5263671875, -0.4281005859375, -0.329833984375, -0.2315673828125, -0.13330078125, -0.0350341796875, 0.063232421875, 0.1614990234375, 0.259765625, 0.3580322265625, 0.456298828125, 0.5545654296875, 0.65283203125, 0.7510986328125, 0.849365234375, 0.9476318359375, 1.0458984375, 1.1441650390625, 1.242431640625, 1.3406982421875, 1.43896484375, 1.5372314453125, 1.635498046875, 1.7337646484375, 1.83203125, 1.9302978515625, 2.028564453125, 2.1268310546875, 2.22509765625, 2.3233642578125, 2.421630859375, 2.5198974609375, 2.6181640625, 2.7164306640625, 2.814697265625, 2.9129638671875, 3.01123046875, 3.1094970703125, 3.207763671875, 3.3060302734375, 3.404296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 10.0, 18.0, 23.0, 50.0, 57.0, 148.0, 229.0, 192.0, 92.0, 40.0, 35.0, 21.0, 10.0, 8.0, 9.0, 4.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007281303405761719, -0.0007044821977615356, -0.0006808340549468994, -0.0006571859121322632, -0.000633537769317627, -0.0006098896265029907, -0.0005862414836883545, -0.0005625933408737183, -0.000538945198059082, -0.0005152970552444458, -0.0004916489124298096, -0.00046800076961517334, -0.0004443526268005371, -0.0004207044839859009, -0.00039705634117126465, -0.0003734081983566284, -0.0003497600555419922, -0.00032611191272735596, -0.0003024637699127197, -0.0002788156270980835, -0.00025516748428344727, -0.00023151934146881104, -0.0002078711986541748, -0.00018422305583953857, -0.00016057491302490234, -0.0001369267702102661, -0.00011327862739562988, -8.963048458099365e-05, -6.598234176635742e-05, -4.233419895172119e-05, -1.868605613708496e-05, 4.9620866775512695e-06, 2.86102294921875e-05, 5.225837230682373e-05, 7.590651512145996e-05, 9.955465793609619e-05, 0.00012320280075073242, 0.00014685094356536865, 0.00017049908638000488, 0.0001941472291946411, 0.00021779537200927734, 0.00024144351482391357, 0.0002650916576385498, 0.00028873980045318604, 0.00031238794326782227, 0.0003360360860824585, 0.0003596842288970947, 0.00038333237171173096, 0.0004069805145263672, 0.0004306286573410034, 0.00045427680015563965, 0.0004779249429702759, 0.0005015730857849121, 0.0005252212285995483, 0.0005488693714141846, 0.0005725175142288208, 0.000596165657043457, 0.0006198137998580933, 0.0006434619426727295, 0.0006671100854873657, 0.000690758228302002, 0.0007144063711166382, 0.0007380545139312744, 0.0007617026567459106, 0.0007853507995605469]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 20.0, 29.0, 45.0, 72.0, 154.0, 295.0, 630.0, 1556.0, 5149.0, 24820.0, 828984.0, 165490.0, 15387.0, 3644.0, 1190.0, 492.0, 232.0, 134.0, 69.0, 50.0, 28.0, 17.0, 16.0, 14.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.31317138671875, -2.2357177734375, -2.15826416015625, -2.080810546875, -2.00335693359375, -1.9259033203125, -1.84844970703125, -1.77099609375, -1.69354248046875, -1.6160888671875, -1.53863525390625, -1.461181640625, -1.38372802734375, -1.3062744140625, -1.22882080078125, -1.1513671875, -1.07391357421875, -0.9964599609375, -0.91900634765625, -0.841552734375, -0.76409912109375, -0.6866455078125, -0.60919189453125, -0.53173828125, -0.45428466796875, -0.3768310546875, -0.29937744140625, -0.221923828125, -0.14447021484375, -0.0670166015625, 0.01043701171875, 0.087890625, 0.16534423828125, 0.2427978515625, 0.32025146484375, 0.397705078125, 0.47515869140625, 0.5526123046875, 0.63006591796875, 0.70751953125, 0.78497314453125, 0.8624267578125, 0.93988037109375, 1.017333984375, 1.09478759765625, 1.1722412109375, 1.24969482421875, 1.3271484375, 1.40460205078125, 1.4820556640625, 1.55950927734375, 1.636962890625, 1.71441650390625, 1.7918701171875, 1.86932373046875, 1.94677734375, 2.02423095703125, 2.1016845703125, 2.17913818359375, 2.256591796875, 2.33404541015625, 2.4114990234375, 2.48895263671875, 2.56640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 6.0, 12.0, 11.0, 11.0, 15.0, 20.0, 22.0, 29.0, 44.0, 58.0, 99.0, 131.0, 108.0, 118.0, 73.0, 63.0, 31.0, 24.0, 21.0, 16.0, 19.0, 8.0, 12.0, 5.0, 8.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6259765625, -1.5701141357421875, -1.514251708984375, -1.4583892822265625, -1.40252685546875, -1.3466644287109375, -1.290802001953125, -1.2349395751953125, -1.1790771484375, -1.1232147216796875, -1.067352294921875, -1.0114898681640625, -0.95562744140625, -0.8997650146484375, -0.843902587890625, -0.7880401611328125, -0.732177734375, -0.6763153076171875, -0.620452880859375, -0.5645904541015625, -0.50872802734375, -0.4528656005859375, -0.397003173828125, -0.3411407470703125, -0.2852783203125, -0.2294158935546875, -0.173553466796875, -0.1176910400390625, -0.06182861328125, -0.0059661865234375, 0.049896240234375, 0.1057586669921875, 0.16162109375, 0.2174835205078125, 0.273345947265625, 0.3292083740234375, 0.38507080078125, 0.4409332275390625, 0.496795654296875, 0.5526580810546875, 0.6085205078125, 0.6643829345703125, 0.720245361328125, 0.7761077880859375, 0.83197021484375, 0.8878326416015625, 0.943695068359375, 0.9995574951171875, 1.055419921875, 1.1112823486328125, 1.167144775390625, 1.2230072021484375, 1.27886962890625, 1.3347320556640625, 1.390594482421875, 1.4464569091796875, 1.5023193359375, 1.5581817626953125, 1.614044189453125, 1.6699066162109375, 1.72576904296875, 1.7816314697265625, 1.837493896484375, 1.8933563232421875, 1.94921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 29.0, 76.0, 190.0, 498.0, 99.0, 40.0, 24.0, 9.0, 3.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.94486999511719, -46.84848403930664, -43.752098083496094, -40.65570831298828, -37.559322357177734, -34.46293640136719, -31.36655044555664, -28.27016258239746, -25.173776626586914, -22.077390670776367, -18.981002807617188, -15.88461685180664, -12.788229942321777, -9.691843032836914, -6.595457077026367, -3.4990692138671875, -0.4026832580566406, 2.6937034130096436, 5.790090084075928, 8.886476516723633, 11.982863426208496, 15.07925033569336, 18.175636291503906, 21.272024154663086, 24.368410110473633, 27.46479606628418, 30.56118392944336, 33.657569885253906, 36.75395584106445, 39.850341796875, 42.94673156738281, 46.04311752319336, 49.139503479003906, 52.23588943481445, 55.332275390625, 58.42866516113281, 61.52505111694336, 64.6214370727539, 67.71781921386719, 70.814208984375, 73.91059875488281, 77.00698852539062, 80.1033706665039, 83.19976043701172, 86.296142578125, 89.39253234863281, 92.48892211914062, 95.5853042602539, 98.68168640136719, 101.778076171875, 104.87445831298828, 107.9708480834961, 111.06723022460938, 114.16361999511719, 117.260009765625, 120.35639190673828, 123.4527816772461, 126.5491714477539, 129.6455535888672, 132.741943359375, 135.8383331298828, 138.93472290039062, 142.03109741210938, 145.1274871826172, 148.223876953125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 15.0, 22.0, 27.0, 43.0, 49.0, 91.0, 390.0, 134.0, 56.0, 40.0, 36.0, 36.0, 18.0, 6.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.80511474609375, -129.36587524414062, -125.9266357421875, -122.48739624023438, -119.04815673828125, -115.60891723632812, -112.169677734375, -108.73043823242188, -105.29119873046875, -101.85195922851562, -98.4127197265625, -94.97348022460938, -91.53424072265625, -88.09500122070312, -84.65576171875, -81.21652221679688, -77.77729034423828, -74.33805084228516, -70.89881134033203, -67.4595718383789, -64.02033233642578, -60.581092834472656, -57.1418571472168, -53.70261764526367, -50.26337814331055, -46.82413864135742, -43.3848991394043, -39.94566345214844, -36.50642395019531, -33.06718444824219, -29.627944946289062, -26.188705444335938, -22.749465942382812, -19.310226440429688, -15.870987892150879, -12.43174934387207, -8.992509841918945, -5.55327033996582, -2.114032745361328, 1.3252067565917969, 4.764446258544922, 8.203685760498047, 11.642924308776855, 15.082162857055664, 18.52140235900879, 21.960641860961914, 25.399879455566406, 28.83911895751953, 32.278358459472656, 35.71759796142578, 39.156837463378906, 42.59607696533203, 46.035316467285156, 49.47455596923828, 52.91379165649414, 56.353031158447266, 59.79227066040039, 63.231510162353516, 66.67074584960938, 70.1099853515625, 73.54922485351562, 76.98846435546875, 80.42770385742188, 83.866943359375, 87.30618286132812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 11.0, 12.0, 17.0, 35.0, 32.0, 59.0, 54.0, 123.0, 294.0, 67.0, 74.0, 55.0, 30.0, 30.0, 28.0, 16.0, 9.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.375, -7.1539306640625, -6.932861328125, -6.7117919921875, -6.49072265625, -6.2696533203125, -6.048583984375, -5.8275146484375, -5.6064453125, -5.3853759765625, -5.164306640625, -4.9432373046875, -4.72216796875, -4.5010986328125, -4.280029296875, -4.0589599609375, -3.837890625, -3.6168212890625, -3.395751953125, -3.1746826171875, -2.95361328125, -2.7325439453125, -2.511474609375, -2.2904052734375, -2.0693359375, -1.8482666015625, -1.627197265625, -1.4061279296875, -1.18505859375, -0.9639892578125, -0.742919921875, -0.5218505859375, -0.30078125, -0.0797119140625, 0.141357421875, 0.3624267578125, 0.58349609375, 0.8045654296875, 1.025634765625, 1.2467041015625, 1.4677734375, 1.6888427734375, 1.909912109375, 2.1309814453125, 2.35205078125, 2.5731201171875, 2.794189453125, 3.0152587890625, 3.236328125, 3.4573974609375, 3.678466796875, 3.8995361328125, 4.12060546875, 4.3416748046875, 4.562744140625, 4.7838134765625, 5.0048828125, 5.2259521484375, 5.447021484375, 5.6680908203125, 5.88916015625, 6.1102294921875, 6.331298828125, 6.5523681640625, 6.7734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 11.0, 5.0, 1.0, 6.0, 15.0, 16.0, 28.0, 32.0, 96.0, 139.0, 316.0, 1561.0, 22387.0, 8358579.0, 4280.0, 658.0, 214.0, 71.0, 58.0, 44.0, 17.0, 10.0, 14.0, 8.0, 10.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-73.26998138427734, -70.76465606689453, -68.25933837890625, -65.75401306152344, -63.248695373535156, -60.74337387084961, -58.23805236816406, -55.73272705078125, -53.22740936279297, -50.72208786010742, -48.216766357421875, -45.71144485473633, -43.20612335205078, -40.700801849365234, -38.19548034667969, -35.690155029296875, -33.18483352661133, -30.67951202392578, -28.174190521240234, -25.668869018554688, -23.16354751586914, -20.658226013183594, -18.152902603149414, -15.647581100463867, -13.14225959777832, -10.636938095092773, -8.131616592407227, -5.626294136047363, -3.1209726333618164, -0.6156511306762695, 1.8896713256835938, 4.394992828369141, 6.9003143310546875, 9.405635833740234, 11.910957336425781, 14.416279792785645, 16.921600341796875, 19.426921844482422, 21.9322452545166, 24.43756675720215, 26.942888259887695, 29.448209762573242, 31.95353126525879, 34.45885467529297, 36.964176177978516, 39.46949768066406, 41.97481918334961, 44.480140686035156, 46.9854621887207, 49.49078369140625, 51.9961051940918, 54.501426696777344, 57.00674819946289, 59.51206970214844, 62.01739501953125, 64.52271270751953, 67.02803802490234, 69.53336334228516, 72.03868103027344, 74.54400634765625, 77.04932403564453, 79.55464935302734, 82.05996704101562, 84.56529235839844, 87.07061004638672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 2.0, 5.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.47355651855469, -63.188907623291016, -60.904258728027344, -58.61960983276367, -56.3349609375, -54.05030822753906, -51.76565933227539, -49.48101043701172, -47.19636154174805, -44.911712646484375, -42.6270637512207, -40.34241485595703, -38.057762145996094, -35.77311706542969, -33.48846435546875, -31.203815460205078, -28.919166564941406, -26.634517669677734, -24.349868774414062, -22.065217971801758, -19.780569076538086, -17.495920181274414, -15.211270332336426, -12.926620483398438, -10.641971588134766, -8.357322692871094, -6.0726728439331055, -3.7880234718322754, -1.5033740997314453, 0.7812747955322266, 3.065924644470215, 5.350574493408203, 7.635231018066406, 9.919879913330078, 12.204529762268066, 14.489179611206055, 16.773828506469727, 19.0584774017334, 21.343128204345703, 23.627777099609375, 25.912425994873047, 28.19707489013672, 30.48172378540039, 32.76637268066406, 35.051025390625, 37.335670471191406, 39.620323181152344, 41.904972076416016, 44.18962097167969, 46.47426986694336, 48.75891876220703, 51.0435676574707, 53.328216552734375, 55.61286926269531, 57.897518157958984, 60.182167053222656, 62.46681594848633, 64.75146484375, 67.03611755371094, 69.32076263427734, 71.60541534423828, 73.89006042480469, 76.17471313476562, 78.45936584472656, 80.74401092529297]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 13.0, 7.0, 6.0, 15.0, 26.0, 29.0, 41.0, 54.0, 81.0, 96.0, 123.0, 111.0, 104.0, 82.0, 65.0, 45.0, 29.0, 24.0, 22.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.069976806640625, -2.97198486328125, -2.873992919921875, -2.7760009765625, -2.678009033203125, -2.58001708984375, -2.482025146484375, -2.384033203125, -2.286041259765625, -2.18804931640625, -2.090057373046875, -1.9920654296875, -1.894073486328125, -1.79608154296875, -1.698089599609375, -1.60009765625, -1.502105712890625, -1.40411376953125, -1.306121826171875, -1.2081298828125, -1.110137939453125, -1.01214599609375, -0.914154052734375, -0.816162109375, -0.718170166015625, -0.62017822265625, -0.522186279296875, -0.4241943359375, -0.326202392578125, -0.22821044921875, -0.130218505859375, -0.0322265625, 0.065765380859375, 0.16375732421875, 0.261749267578125, 0.3597412109375, 0.457733154296875, 0.55572509765625, 0.653717041015625, 0.751708984375, 0.849700927734375, 0.94769287109375, 1.045684814453125, 1.1436767578125, 1.241668701171875, 1.33966064453125, 1.437652587890625, 1.53564453125, 1.633636474609375, 1.73162841796875, 1.829620361328125, 1.9276123046875, 2.025604248046875, 2.12359619140625, 2.221588134765625, 2.319580078125, 2.417572021484375, 2.51556396484375, 2.613555908203125, 2.7115478515625, 2.809539794921875, 2.90753173828125, 3.005523681640625, 3.103515625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 1.0, 3.0, 11.0, 10.0, 16.0, 14.0, 20.0, 43.0, 104.0, 160.0, 342.0, 757.0, 2190.0, 7876.0, 43583.0, 252545.0, 180232.0, 27736.0, 5566.0, 1754.0, 670.0, 301.0, 150.0, 69.0, 53.0, 22.0, 9.0, 7.0, 8.0, 4.0, 1.0, 2.0], "bins": [-80.875, -79.18603515625, -77.4970703125, -75.80810546875, -74.119140625, -72.43017578125, -70.7412109375, -69.05224609375, -67.36328125, -65.67431640625, -63.9853515625, -62.29638671875, -60.607421875, -58.91845703125, -57.2294921875, -55.54052734375, -53.8515625, -52.16259765625, -50.4736328125, -48.78466796875, -47.095703125, -45.40673828125, -43.7177734375, -42.02880859375, -40.33984375, -38.65087890625, -36.9619140625, -35.27294921875, -33.583984375, -31.89501953125, -30.2060546875, -28.51708984375, -26.828125, -25.13916015625, -23.4501953125, -21.76123046875, -20.072265625, -18.38330078125, -16.6943359375, -15.00537109375, -13.31640625, -11.62744140625, -9.9384765625, -8.24951171875, -6.560546875, -4.87158203125, -3.1826171875, -1.49365234375, 0.1953125, 1.88427734375, 3.5732421875, 5.26220703125, 6.951171875, 8.64013671875, 10.3291015625, 12.01806640625, 13.70703125, 15.39599609375, 17.0849609375, 18.77392578125, 20.462890625, 22.15185546875, 23.8408203125, 25.52978515625, 27.21875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 7.0, 4.0, 8.0, 21.0, 22.0, 26.0, 33.0, 48.0, 53.0, 97.0, 87.0, 91.0, 114.0, 80.0, 72.0, 65.0, 39.0, 38.0, 27.0, 19.0, 17.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0], "bins": [-10.8671875, -10.62615966796875, -10.3851318359375, -10.14410400390625, -9.903076171875, -9.66204833984375, -9.4210205078125, -9.17999267578125, -8.93896484375, -8.69793701171875, -8.4569091796875, -8.21588134765625, -7.974853515625, -7.73382568359375, -7.4927978515625, -7.25177001953125, -7.0107421875, -6.76971435546875, -6.5286865234375, -6.28765869140625, -6.046630859375, -5.80560302734375, -5.5645751953125, -5.32354736328125, -5.08251953125, -4.84149169921875, -4.6004638671875, -4.35943603515625, -4.118408203125, -3.87738037109375, -3.6363525390625, -3.39532470703125, -3.154296875, -2.91326904296875, -2.6722412109375, -2.43121337890625, -2.190185546875, -1.94915771484375, -1.7081298828125, -1.46710205078125, -1.22607421875, -0.98504638671875, -0.7440185546875, -0.50299072265625, -0.261962890625, -0.02093505859375, 0.2200927734375, 0.46112060546875, 0.7021484375, 0.94317626953125, 1.1842041015625, 1.42523193359375, 1.666259765625, 1.90728759765625, 2.1483154296875, 2.38934326171875, 2.63037109375, 2.87139892578125, 3.1124267578125, 3.35345458984375, 3.594482421875, 3.83551025390625, 4.0765380859375, 4.31756591796875, 4.55859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 18.0, 28.0, 38.0, 68.0, 75.0, 72.0, 66.0, 30.0, 19.0, 14.0, 3.0, 7.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.89596176147461, -31.626115798950195, -30.356271743774414, -29.08642578125, -27.81658172607422, -26.546735763549805, -25.27688980102539, -24.00704574584961, -22.737199783325195, -21.46735382080078, -20.197509765625, -18.927663803100586, -17.657817840576172, -16.38797378540039, -15.118127822875977, -13.848282814025879, -12.578437805175781, -11.308592796325684, -10.038747787475586, -8.768901824951172, -7.499056816101074, -6.229211807250977, -4.959366321563721, -3.689520835876465, -2.419675827026367, -1.1498305797576904, 0.12001466751098633, 1.389859914779663, 2.65970516204834, 3.9295501708984375, 5.199395656585693, 6.469241142272949, 7.7390899658203125, 9.00893497467041, 10.278779983520508, 11.548625946044922, 12.81847095489502, 14.088315963745117, 15.358161926269531, 16.628005981445312, 17.897851943969727, 19.16769790649414, 20.437541961669922, 21.707387924194336, 22.97723388671875, 24.24707794189453, 25.516923904418945, 26.78676986694336, 28.05661392211914, 29.326459884643555, 30.596303939819336, 31.86614990234375, 33.13599395751953, 34.40583801269531, 35.67568588256836, 36.94552993774414, 38.21537780761719, 39.48522186279297, 40.755069732666016, 42.0249137878418, 43.29475784301758, 44.564605712890625, 45.834449768066406, 47.10429382324219, 48.37413787841797]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 20.0, 22.0, 32.0, 58.0, 67.0, 76.0, 51.0, 36.0, 27.0, 17.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.92654800415039, -33.86155700683594, -32.79656982421875, -31.73158073425293, -30.66659164428711, -29.60160255432129, -28.53661346435547, -27.47162437438965, -26.406635284423828, -25.341646194458008, -24.276657104492188, -23.211668014526367, -22.146678924560547, -21.081689834594727, -20.016700744628906, -18.951711654663086, -17.886722564697266, -16.821733474731445, -15.756744384765625, -14.691755294799805, -13.626766204833984, -12.561777114868164, -11.496788024902344, -10.431798934936523, -9.366809844970703, -8.301820755004883, -7.2368316650390625, -6.171842575073242, -5.106853485107422, -4.041864395141602, -2.9768753051757812, -1.911886215209961, -0.846893310546875, 0.2180957794189453, 1.2830848693847656, 2.348073959350586, 3.4130630493164062, 4.478052139282227, 5.543041229248047, 6.608030319213867, 7.6730194091796875, 8.738008499145508, 9.802997589111328, 10.867986679077148, 11.932975769042969, 12.997964859008789, 14.06295394897461, 15.12794303894043, 16.19293212890625, 17.25792121887207, 18.32291030883789, 19.38789939880371, 20.45288848876953, 21.51787757873535, 22.582866668701172, 23.647855758666992, 24.712844848632812, 25.777833938598633, 26.842823028564453, 27.907812118530273, 28.972801208496094, 30.037790298461914, 31.102779388427734, 32.16777038574219, 33.232757568359375]}, "eval/loss": 5.443604946136475, "eval/wer": 1.5227687425624752, "eval/runtime": 664.731, "eval/samples_per_second": 3.975, "eval/steps_per_second": 0.498} \ No newline at end of file +{"train/loss": 4.7343, "train/learning_rate": 2.622394366197183e-05, "train/epoch": 4.13, "train/global_step": 3684, "_runtime": 21859, "_timestamp": 1647966361, "_step": 3685, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 16.0, 18.0, 16.0, 17.0, 18.0, 34.0, 31.0, 30.0, 58.0, 44.0, 46.0, 56.0, 56.0, 60.0, 53.0, 60.0, 49.0, 39.0, 42.0, 42.0, 20.0, 32.0, 14.0, 25.0, 26.0, 20.0, 14.0, 14.0, 11.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.070314407348633, -18.440237045288086, -17.810157775878906, -17.18008041381836, -16.55000114440918, -15.919923782348633, -15.28984546661377, -14.659767150878906, -14.029688835144043, -13.39961051940918, -12.769532203674316, -12.139453887939453, -11.509376525878906, -10.879297256469727, -10.24921989440918, -9.619141578674316, -8.989063262939453, -8.35898494720459, -7.728906631469727, -7.0988287925720215, -6.468750476837158, -5.838672161102295, -5.20859432220459, -4.578516006469727, -3.9484376907348633, -3.318359375, -2.688281297683716, -2.0582032203674316, -1.4281249046325684, -0.7980465888977051, -0.1679685115814209, 0.4621095657348633, 1.0921878814697266, 1.7222660779953003, 2.352344274520874, 2.982422351837158, 3.6125006675720215, 4.242578983306885, 4.87265682220459, 5.502735137939453, 6.132813453674316, 6.76289176940918, 7.392970085144043, 8.023048400878906, 8.653125762939453, 9.283205032348633, 9.91328239440918, 10.543360710144043, 11.173439025878906, 11.80351734161377, 12.433595657348633, 13.063673973083496, 13.69375228881836, 14.323829650878906, 14.95390796661377, 15.583986282348633, 16.214065551757812, 16.84414291381836, 17.47422218322754, 18.104299545288086, 18.734378814697266, 19.364456176757812, 19.994535446166992, 20.62461280822754, 21.254690170288086]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 8.0, 15.0, 18.0, 19.0, 18.0, 17.0, 34.0, 16.0, 26.0, 37.0, 30.0, 37.0, 29.0, 45.0, 41.0, 41.0, 34.0, 48.0, 44.0, 33.0, 32.0, 30.0, 29.0, 33.0, 23.0, 38.0, 33.0, 25.0, 19.0, 15.0, 21.0, 21.0, 12.0, 15.0, 15.0, 10.0, 2.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.996646881103516, -15.441826820373535, -14.887006759643555, -14.332185745239258, -13.777365684509277, -13.222545623779297, -12.667724609375, -12.11290454864502, -11.558084487915039, -11.003264427185059, -10.448444366455078, -9.893623352050781, -9.3388032913208, -8.78398323059082, -8.229162216186523, -7.674342155456543, -7.1195220947265625, -6.564702033996582, -6.009881496429443, -5.455060958862305, -4.900240898132324, -4.345420837402344, -3.790600299835205, -3.2357800006866455, -2.680959701538086, -2.1261394023895264, -1.5713191032409668, -1.0164988040924072, -0.46167850494384766, 0.09314179420471191, 0.6479620933532715, 1.202782392501831, 1.7576007843017578, 2.3124210834503174, 2.867241382598877, 3.4220616817474365, 3.976881980895996, 4.531702041625977, 5.086522579193115, 5.641343116760254, 6.196163177490234, 6.750983238220215, 7.3058037757873535, 7.860624313354492, 8.415444374084473, 8.970264434814453, 9.52508544921875, 10.07990550994873, 10.634725570678711, 11.189545631408691, 11.744365692138672, 12.299186706542969, 12.85400676727295, 13.40882682800293, 13.963647842407227, 14.518467903137207, 15.073287963867188, 15.628108024597168, 16.18292808532715, 16.737749099731445, 17.29256820678711, 17.847389221191406, 18.402210235595703, 18.957029342651367, 19.511850357055664]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 9.0, 15.0, 20.0, 48.0, 66.0, 130.0, 200.0, 325.0, 552.0, 961.0, 1498.0, 2552.0, 4349.0, 7331.0, 12545.0, 21308.0, 37425.0, 65250.0, 111689.0, 188601.0, 298220.0, 431039.0, 546743.0, 603219.0, 568521.0, 458882.0, 326569.0, 208463.0, 124248.0, 72367.0, 41342.0, 24224.0, 14150.0, 8344.0, 5165.0, 3009.0, 1824.0, 1136.0, 719.0, 455.0, 290.0, 185.0, 100.0, 73.0, 43.0, 25.0, 20.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0], "bins": [-10.375, -10.056884765625, -9.73876953125, -9.420654296875, -9.1025390625, -8.784423828125, -8.46630859375, -8.148193359375, -7.830078125, -7.511962890625, -7.19384765625, -6.875732421875, -6.5576171875, -6.239501953125, -5.92138671875, -5.603271484375, -5.28515625, -4.967041015625, -4.64892578125, -4.330810546875, -4.0126953125, -3.694580078125, -3.37646484375, -3.058349609375, -2.740234375, -2.422119140625, -2.10400390625, -1.785888671875, -1.4677734375, -1.149658203125, -0.83154296875, -0.513427734375, -0.1953125, 0.122802734375, 0.44091796875, 0.759033203125, 1.0771484375, 1.395263671875, 1.71337890625, 2.031494140625, 2.349609375, 2.667724609375, 2.98583984375, 3.303955078125, 3.6220703125, 3.940185546875, 4.25830078125, 4.576416015625, 4.89453125, 5.212646484375, 5.53076171875, 5.848876953125, 6.1669921875, 6.485107421875, 6.80322265625, 7.121337890625, 7.439453125, 7.757568359375, 8.07568359375, 8.393798828125, 8.7119140625, 9.030029296875, 9.34814453125, 9.666259765625, 9.984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 11.0, 13.0, 16.0, 14.0, 21.0, 29.0, 25.0, 20.0, 27.0, 24.0, 30.0, 30.0, 32.0, 33.0, 41.0, 38.0, 38.0, 43.0, 39.0, 43.0, 39.0, 34.0, 20.0, 23.0, 35.0, 34.0, 26.0, 29.0, 24.0, 21.0, 25.0, 16.0, 14.0, 15.0, 16.0, 12.0, 5.0, 9.0, 0.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.4375, -12.9930419921875, -12.548583984375, -12.1041259765625, -11.65966796875, -11.2152099609375, -10.770751953125, -10.3262939453125, -9.8818359375, -9.4373779296875, -8.992919921875, -8.5484619140625, -8.10400390625, -7.6595458984375, -7.215087890625, -6.7706298828125, -6.326171875, -5.8817138671875, -5.437255859375, -4.9927978515625, -4.54833984375, -4.1038818359375, -3.659423828125, -3.2149658203125, -2.7705078125, -2.3260498046875, -1.881591796875, -1.4371337890625, -0.99267578125, -0.5482177734375, -0.103759765625, 0.3406982421875, 0.78515625, 1.2296142578125, 1.674072265625, 2.1185302734375, 2.56298828125, 3.0074462890625, 3.451904296875, 3.8963623046875, 4.3408203125, 4.7852783203125, 5.229736328125, 5.6741943359375, 6.11865234375, 6.5631103515625, 7.007568359375, 7.4520263671875, 7.896484375, 8.3409423828125, 8.785400390625, 9.2298583984375, 9.67431640625, 10.1187744140625, 10.563232421875, 11.0076904296875, 11.4521484375, 11.8966064453125, 12.341064453125, 12.7855224609375, 13.22998046875, 13.6744384765625, 14.118896484375, 14.5633544921875, 15.0078125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 20.0, 26.0, 57.0, 115.0, 212.0, 357.0, 577.0, 1125.0, 2098.0, 3989.0, 7677.0, 14911.0, 28439.0, 54907.0, 103350.0, 189753.0, 329878.0, 524154.0, 722495.0, 756774.0, 586677.0, 380691.0, 224306.0, 123403.0, 65974.0, 34630.0, 17910.0, 9250.0, 4906.0, 2584.0, 1345.0, 749.0, 393.0, 233.0, 123.0, 78.0, 44.0, 30.0, 14.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.7425537109375, -12.289794921875, -11.8370361328125, -11.38427734375, -10.9315185546875, -10.478759765625, -10.0260009765625, -9.5732421875, -9.1204833984375, -8.667724609375, -8.2149658203125, -7.76220703125, -7.3094482421875, -6.856689453125, -6.4039306640625, -5.951171875, -5.4984130859375, -5.045654296875, -4.5928955078125, -4.14013671875, -3.6873779296875, -3.234619140625, -2.7818603515625, -2.3291015625, -1.8763427734375, -1.423583984375, -0.9708251953125, -0.51806640625, -0.0653076171875, 0.387451171875, 0.8402099609375, 1.29296875, 1.7457275390625, 2.198486328125, 2.6512451171875, 3.10400390625, 3.5567626953125, 4.009521484375, 4.4622802734375, 4.9150390625, 5.3677978515625, 5.820556640625, 6.2733154296875, 6.72607421875, 7.1788330078125, 7.631591796875, 8.0843505859375, 8.537109375, 8.9898681640625, 9.442626953125, 9.8953857421875, 10.34814453125, 10.8009033203125, 11.253662109375, 11.7064208984375, 12.1591796875, 12.6119384765625, 13.064697265625, 13.5174560546875, 13.97021484375, 14.4229736328125, 14.875732421875, 15.3284912109375, 15.78125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 0.0, 5.0, 5.0, 3.0, 7.0, 14.0, 22.0, 19.0, 30.0, 26.0, 45.0, 55.0, 72.0, 92.0, 106.0, 138.0, 151.0, 170.0, 218.0, 227.0, 236.0, 262.0, 261.0, 244.0, 266.0, 225.0, 199.0, 163.0, 147.0, 129.0, 93.0, 92.0, 63.0, 69.0, 48.0, 34.0, 25.0, 26.0, 20.0, 24.0, 8.0, 7.0, 10.0, 3.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.4818115234375, -5.299560546875, -5.1173095703125, -4.93505859375, -4.7528076171875, -4.570556640625, -4.3883056640625, -4.2060546875, -4.0238037109375, -3.841552734375, -3.6593017578125, -3.47705078125, -3.2947998046875, -3.112548828125, -2.9302978515625, -2.748046875, -2.5657958984375, -2.383544921875, -2.2012939453125, -2.01904296875, -1.8367919921875, -1.654541015625, -1.4722900390625, -1.2900390625, -1.1077880859375, -0.925537109375, -0.7432861328125, -0.56103515625, -0.3787841796875, -0.196533203125, -0.0142822265625, 0.16796875, 0.3502197265625, 0.532470703125, 0.7147216796875, 0.89697265625, 1.0792236328125, 1.261474609375, 1.4437255859375, 1.6259765625, 1.8082275390625, 1.990478515625, 2.1727294921875, 2.35498046875, 2.5372314453125, 2.719482421875, 2.9017333984375, 3.083984375, 3.2662353515625, 3.448486328125, 3.6307373046875, 3.81298828125, 3.9952392578125, 4.177490234375, 4.3597412109375, 4.5419921875, 4.7242431640625, 4.906494140625, 5.0887451171875, 5.27099609375, 5.4532470703125, 5.635498046875, 5.8177490234375, 6.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 9.0, 22.0, 23.0, 25.0, 28.0, 31.0, 33.0, 44.0, 48.0, 49.0, 53.0, 43.0, 62.0, 42.0, 55.0, 53.0, 38.0, 47.0, 30.0, 24.0, 28.0, 28.0, 26.0, 19.0, 16.0, 11.0, 13.0, 12.0, 10.0, 6.0, 2.0, 10.0, 3.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.821730613708496, -13.331482887268066, -12.841236114501953, -12.350988388061523, -11.860740661621094, -11.37049388885498, -10.88024616241455, -10.389999389648438, -9.899751663208008, -9.409503936767578, -8.919257164001465, -8.429009437561035, -7.938762187957764, -7.448514938354492, -6.9582672119140625, -6.468019962310791, -5.9777727127075195, -5.487525463104248, -4.997278213500977, -4.507030487060547, -4.016783237457275, -3.526535987854004, -3.0362884998321533, -2.5460410118103027, -2.0557937622070312, -1.5655463933944702, -1.0752990245819092, -0.5850516557693481, -0.09480428695678711, 0.3954429626464844, 0.885690450668335, 1.3759379386901855, 1.8661842346191406, 2.356431484222412, 2.8466789722442627, 3.3369264602661133, 3.8271737098693848, 4.317420959472656, 4.807668685913086, 5.297915935516357, 5.788163185119629, 6.2784104347229, 6.768657684326172, 7.258905410766602, 7.749152660369873, 8.239399909973145, 8.729647636413574, 9.219894409179688, 9.710142135620117, 10.200389862060547, 10.69063663482666, 11.18088436126709, 11.671131134033203, 12.161378860473633, 12.651626586914062, 13.141874313354492, 13.632121086120605, 14.122368812561035, 14.612615585327148, 15.102863311767578, 15.593111038208008, 16.083358764648438, 16.573604583740234, 17.063852310180664, 17.554100036621094]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 10.0, 12.0, 12.0, 20.0, 21.0, 25.0, 18.0, 29.0, 29.0, 31.0, 33.0, 38.0, 41.0, 43.0, 32.0, 53.0, 28.0, 39.0, 31.0, 39.0, 40.0, 37.0, 36.0, 34.0, 30.0, 34.0, 17.0, 19.0, 25.0, 13.0, 23.0, 18.0, 21.0, 15.0, 5.0, 7.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-16.34392547607422, -15.839371681213379, -15.334818840026855, -14.830265045166016, -14.325712203979492, -13.821158409118652, -13.316604614257812, -12.812051773071289, -12.30749797821045, -11.80294418334961, -11.298391342163086, -10.793837547302246, -10.289283752441406, -9.784730911254883, -9.280177116394043, -8.775623321533203, -8.27107048034668, -7.766517162322998, -7.261963844299316, -6.757410049438477, -6.252856731414795, -5.748303413391113, -5.243749618530273, -4.739196300506592, -4.23464298248291, -3.7300896644592285, -3.2255361080169678, -2.720982551574707, -2.2164292335510254, -1.7118759155273438, -1.207322359085083, -0.7027688026428223, -0.1982135772705078, 0.3063398599624634, 0.8108932971954346, 1.3154467344284058, 1.820000171661377, 2.3245534896850586, 2.8291070461273193, 3.33366060256958, 3.8382139205932617, 4.342767238616943, 4.847320556640625, 5.351874351501465, 5.8564276695251465, 6.360980987548828, 6.865534782409668, 7.37008810043335, 7.874641418457031, 8.379195213317871, 8.883748054504395, 9.388301849365234, 9.892854690551758, 10.397408485412598, 10.901962280273438, 11.406515121459961, 11.9110689163208, 12.41562271118164, 12.920175552368164, 13.424729347229004, 13.929283142089844, 14.433835983276367, 14.938389778137207, 15.442943572998047, 15.94749641418457]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 2.0, 5.0, 9.0, 5.0, 17.0, 23.0, 35.0, 61.0, 103.0, 115.0, 163.0, 252.0, 438.0, 674.0, 1054.0, 1682.0, 3145.0, 5548.0, 10851.0, 23377.0, 55026.0, 130097.0, 254621.0, 277405.0, 158865.0, 68316.0, 28493.0, 12987.0, 6368.0, 3533.0, 1996.0, 1147.0, 743.0, 461.0, 303.0, 211.0, 163.0, 92.0, 55.0, 35.0, 34.0, 11.0, 16.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.6666259765625, -12.231689453125, -11.7967529296875, -11.36181640625, -10.9268798828125, -10.491943359375, -10.0570068359375, -9.6220703125, -9.1871337890625, -8.752197265625, -8.3172607421875, -7.88232421875, -7.4473876953125, -7.012451171875, -6.5775146484375, -6.142578125, -5.7076416015625, -5.272705078125, -4.8377685546875, -4.40283203125, -3.9678955078125, -3.532958984375, -3.0980224609375, -2.6630859375, -2.2281494140625, -1.793212890625, -1.3582763671875, -0.92333984375, -0.4884033203125, -0.053466796875, 0.3814697265625, 0.81640625, 1.2513427734375, 1.686279296875, 2.1212158203125, 2.55615234375, 2.9910888671875, 3.426025390625, 3.8609619140625, 4.2958984375, 4.7308349609375, 5.165771484375, 5.6007080078125, 6.03564453125, 6.4705810546875, 6.905517578125, 7.3404541015625, 7.775390625, 8.2103271484375, 8.645263671875, 9.0802001953125, 9.51513671875, 9.9500732421875, 10.385009765625, 10.8199462890625, 11.2548828125, 11.6898193359375, 12.124755859375, 12.5596923828125, 12.99462890625, 13.4295654296875, 13.864501953125, 14.2994384765625, 14.734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 6.0, 3.0, 9.0, 15.0, 13.0, 17.0, 25.0, 24.0, 37.0, 26.0, 31.0, 31.0, 22.0, 42.0, 43.0, 30.0, 48.0, 31.0, 36.0, 48.0, 28.0, 48.0, 36.0, 31.0, 37.0, 34.0, 21.0, 20.0, 20.0, 18.0, 27.0, 18.0, 22.0, 17.0, 15.0, 17.0, 12.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 0.0, 1.0, 0.0, 3.0], "bins": [-16.171875, -15.6826171875, -15.193359375, -14.7041015625, -14.21484375, -13.7255859375, -13.236328125, -12.7470703125, -12.2578125, -11.7685546875, -11.279296875, -10.7900390625, -10.30078125, -9.8115234375, -9.322265625, -8.8330078125, -8.34375, -7.8544921875, -7.365234375, -6.8759765625, -6.38671875, -5.8974609375, -5.408203125, -4.9189453125, -4.4296875, -3.9404296875, -3.451171875, -2.9619140625, -2.47265625, -1.9833984375, -1.494140625, -1.0048828125, -0.515625, -0.0263671875, 0.462890625, 0.9521484375, 1.44140625, 1.9306640625, 2.419921875, 2.9091796875, 3.3984375, 3.8876953125, 4.376953125, 4.8662109375, 5.35546875, 5.8447265625, 6.333984375, 6.8232421875, 7.3125, 7.8017578125, 8.291015625, 8.7802734375, 9.26953125, 9.7587890625, 10.248046875, 10.7373046875, 11.2265625, 11.7158203125, 12.205078125, 12.6943359375, 13.18359375, 13.6728515625, 14.162109375, 14.6513671875, 15.140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 16.0, 14.0, 31.0, 34.0, 52.0, 73.0, 103.0, 146.0, 232.0, 368.0, 561.0, 979.0, 1605.0, 2944.0, 6768.0, 17323.0, 55004.0, 203067.0, 431924.0, 229507.0, 63296.0, 19514.0, 7272.0, 3296.0, 1759.0, 915.0, 606.0, 364.0, 238.0, 169.0, 106.0, 78.0, 42.0, 33.0, 37.0, 24.0, 11.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.390625, -15.8870849609375, -15.383544921875, -14.8800048828125, -14.37646484375, -13.8729248046875, -13.369384765625, -12.8658447265625, -12.3623046875, -11.8587646484375, -11.355224609375, -10.8516845703125, -10.34814453125, -9.8446044921875, -9.341064453125, -8.8375244140625, -8.333984375, -7.8304443359375, -7.326904296875, -6.8233642578125, -6.31982421875, -5.8162841796875, -5.312744140625, -4.8092041015625, -4.3056640625, -3.8021240234375, -3.298583984375, -2.7950439453125, -2.29150390625, -1.7879638671875, -1.284423828125, -0.7808837890625, -0.27734375, 0.2261962890625, 0.729736328125, 1.2332763671875, 1.73681640625, 2.2403564453125, 2.743896484375, 3.2474365234375, 3.7509765625, 4.2545166015625, 4.758056640625, 5.2615966796875, 5.76513671875, 6.2686767578125, 6.772216796875, 7.2757568359375, 7.779296875, 8.2828369140625, 8.786376953125, 9.2899169921875, 9.79345703125, 10.2969970703125, 10.800537109375, 11.3040771484375, 11.8076171875, 12.3111572265625, 12.814697265625, 13.3182373046875, 13.82177734375, 14.3253173828125, 14.828857421875, 15.3323974609375, 15.8359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 2.0, 18.0, 10.0, 17.0, 12.0, 28.0, 26.0, 26.0, 23.0, 39.0, 27.0, 34.0, 42.0, 44.0, 52.0, 48.0, 48.0, 45.0, 32.0, 42.0, 52.0, 31.0, 46.0, 25.0, 23.0, 28.0, 35.0, 18.0, 17.0, 26.0, 16.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.7841796875, -12.357421875, -11.9306640625, -11.50390625, -11.0771484375, -10.650390625, -10.2236328125, -9.796875, -9.3701171875, -8.943359375, -8.5166015625, -8.08984375, -7.6630859375, -7.236328125, -6.8095703125, -6.3828125, -5.9560546875, -5.529296875, -5.1025390625, -4.67578125, -4.2490234375, -3.822265625, -3.3955078125, -2.96875, -2.5419921875, -2.115234375, -1.6884765625, -1.26171875, -0.8349609375, -0.408203125, 0.0185546875, 0.4453125, 0.8720703125, 1.298828125, 1.7255859375, 2.15234375, 2.5791015625, 3.005859375, 3.4326171875, 3.859375, 4.2861328125, 4.712890625, 5.1396484375, 5.56640625, 5.9931640625, 6.419921875, 6.8466796875, 7.2734375, 7.7001953125, 8.126953125, 8.5537109375, 8.98046875, 9.4072265625, 9.833984375, 10.2607421875, 10.6875, 11.1142578125, 11.541015625, 11.9677734375, 12.39453125, 12.8212890625, 13.248046875, 13.6748046875, 14.1015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 9.0, 12.0, 13.0, 16.0, 26.0, 38.0, 43.0, 81.0, 107.0, 158.0, 233.0, 418.0, 560.0, 1009.0, 1783.0, 3475.0, 6651.0, 14822.0, 37861.0, 122952.0, 428385.0, 301158.0, 78668.0, 26651.0, 11227.0, 5412.0, 2784.0, 1545.0, 916.0, 510.0, 323.0, 212.0, 140.0, 82.0, 72.0, 52.0, 39.0, 26.0, 22.0, 11.0, 13.0, 6.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.88671875, -7.638916015625, -7.39111328125, -7.143310546875, -6.8955078125, -6.647705078125, -6.39990234375, -6.152099609375, -5.904296875, -5.656494140625, -5.40869140625, -5.160888671875, -4.9130859375, -4.665283203125, -4.41748046875, -4.169677734375, -3.921875, -3.674072265625, -3.42626953125, -3.178466796875, -2.9306640625, -2.682861328125, -2.43505859375, -2.187255859375, -1.939453125, -1.691650390625, -1.44384765625, -1.196044921875, -0.9482421875, -0.700439453125, -0.45263671875, -0.204833984375, 0.04296875, 0.290771484375, 0.53857421875, 0.786376953125, 1.0341796875, 1.281982421875, 1.52978515625, 1.777587890625, 2.025390625, 2.273193359375, 2.52099609375, 2.768798828125, 3.0166015625, 3.264404296875, 3.51220703125, 3.760009765625, 4.0078125, 4.255615234375, 4.50341796875, 4.751220703125, 4.9990234375, 5.246826171875, 5.49462890625, 5.742431640625, 5.990234375, 6.238037109375, 6.48583984375, 6.733642578125, 6.9814453125, 7.229248046875, 7.47705078125, 7.724853515625, 7.97265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 6.0, 5.0, 11.0, 17.0, 27.0, 38.0, 58.0, 89.0, 126.0, 117.0, 141.0, 106.0, 77.0, 45.0, 29.0, 24.0, 17.0, 7.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005903244018554688, -0.0005682706832885742, -0.0005462169647216797, -0.0005241632461547852, -0.0005021095275878906, -0.0004800558090209961, -0.00045800209045410156, -0.00043594837188720703, -0.0004138946533203125, -0.00039184093475341797, -0.00036978721618652344, -0.0003477334976196289, -0.0003256797790527344, -0.00030362606048583984, -0.0002815723419189453, -0.0002595186233520508, -0.00023746490478515625, -0.00021541118621826172, -0.0001933574676513672, -0.00017130374908447266, -0.00014925003051757812, -0.0001271963119506836, -0.00010514259338378906, -8.308887481689453e-05, -6.103515625e-05, -3.898143768310547e-05, -1.6927719116210938e-05, 5.125999450683594e-06, 2.7179718017578125e-05, 4.9233436584472656e-05, 7.128715515136719e-05, 9.334087371826172e-05, 0.00011539459228515625, 0.00013744831085205078, 0.0001595020294189453, 0.00018155574798583984, 0.00020360946655273438, 0.0002256631851196289, 0.00024771690368652344, 0.00026977062225341797, 0.0002918243408203125, 0.00031387805938720703, 0.00033593177795410156, 0.0003579854965209961, 0.0003800392150878906, 0.00040209293365478516, 0.0004241466522216797, 0.0004462003707885742, 0.00046825408935546875, 0.0004903078079223633, 0.0005123615264892578, 0.0005344152450561523, 0.0005564689636230469, 0.0005785226821899414, 0.0006005764007568359, 0.0006226301193237305, 0.000644683837890625, 0.0006667375564575195, 0.0006887912750244141, 0.0007108449935913086, 0.0007328987121582031, 0.0007549524307250977, 0.0007770061492919922, 0.0007990598678588867, 0.0008211135864257812]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 8.0, 9.0, 14.0, 10.0, 25.0, 28.0, 46.0, 64.0, 95.0, 151.0, 218.0, 325.0, 481.0, 727.0, 1153.0, 1665.0, 2667.0, 4343.0, 6677.0, 10509.0, 17650.0, 30908.0, 59610.0, 124719.0, 237901.0, 254641.0, 141567.0, 67070.0, 34508.0, 19122.0, 11621.0, 7066.0, 4442.0, 2931.0, 1869.0, 1235.0, 804.0, 531.0, 367.0, 261.0, 173.0, 94.0, 72.0, 51.0, 31.0, 35.0, 16.0, 15.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.59765625, -5.428466796875, -5.25927734375, -5.090087890625, -4.9208984375, -4.751708984375, -4.58251953125, -4.413330078125, -4.244140625, -4.074951171875, -3.90576171875, -3.736572265625, -3.5673828125, -3.398193359375, -3.22900390625, -3.059814453125, -2.890625, -2.721435546875, -2.55224609375, -2.383056640625, -2.2138671875, -2.044677734375, -1.87548828125, -1.706298828125, -1.537109375, -1.367919921875, -1.19873046875, -1.029541015625, -0.8603515625, -0.691162109375, -0.52197265625, -0.352783203125, -0.18359375, -0.014404296875, 0.15478515625, 0.323974609375, 0.4931640625, 0.662353515625, 0.83154296875, 1.000732421875, 1.169921875, 1.339111328125, 1.50830078125, 1.677490234375, 1.8466796875, 2.015869140625, 2.18505859375, 2.354248046875, 2.5234375, 2.692626953125, 2.86181640625, 3.031005859375, 3.2001953125, 3.369384765625, 3.53857421875, 3.707763671875, 3.876953125, 4.046142578125, 4.21533203125, 4.384521484375, 4.5537109375, 4.722900390625, 4.89208984375, 5.061279296875, 5.23046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 11.0, 8.0, 12.0, 17.0, 21.0, 20.0, 49.0, 61.0, 74.0, 76.0, 139.0, 103.0, 92.0, 67.0, 57.0, 35.0, 30.0, 28.0, 15.0, 10.0, 11.0, 14.0, 9.0, 10.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.958770751953125, -2.86676025390625, -2.774749755859375, -2.6827392578125, -2.590728759765625, -2.49871826171875, -2.406707763671875, -2.314697265625, -2.222686767578125, -2.13067626953125, -2.038665771484375, -1.9466552734375, -1.854644775390625, -1.76263427734375, -1.670623779296875, -1.57861328125, -1.486602783203125, -1.39459228515625, -1.302581787109375, -1.2105712890625, -1.118560791015625, -1.02655029296875, -0.934539794921875, -0.842529296875, -0.750518798828125, -0.65850830078125, -0.566497802734375, -0.4744873046875, -0.382476806640625, -0.29046630859375, -0.198455810546875, -0.1064453125, -0.014434814453125, 0.07757568359375, 0.169586181640625, 0.2615966796875, 0.353607177734375, 0.44561767578125, 0.537628173828125, 0.629638671875, 0.721649169921875, 0.81365966796875, 0.905670166015625, 0.9976806640625, 1.089691162109375, 1.18170166015625, 1.273712158203125, 1.36572265625, 1.457733154296875, 1.54974365234375, 1.641754150390625, 1.7337646484375, 1.825775146484375, 1.91778564453125, 2.009796142578125, 2.101806640625, 2.193817138671875, 2.28582763671875, 2.377838134765625, 2.4698486328125, 2.561859130859375, 2.65386962890625, 2.745880126953125, 2.837890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 3.0, 9.0, 9.0, 10.0, 12.0, 20.0, 23.0, 24.0, 35.0, 39.0, 40.0, 48.0, 48.0, 49.0, 62.0, 55.0, 57.0, 57.0, 51.0, 34.0, 46.0, 38.0, 31.0, 30.0, 22.0, 28.0, 24.0, 22.0, 13.0, 8.0, 12.0, 7.0, 7.0, 8.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.8696870803833, -12.364608764648438, -11.85953140258789, -11.354453086853027, -10.849374771118164, -10.344297409057617, -9.839219093322754, -9.33414077758789, -8.829063415527344, -8.32398509979248, -7.818907737731934, -7.31382942199707, -6.808751583099365, -6.30367374420166, -5.798595428466797, -5.293517589569092, -4.788439750671387, -4.283361911773682, -3.7782838344573975, -3.2732057571411133, -2.768127918243408, -2.263050079345703, -1.757972002029419, -1.2528939247131348, -0.7478160858154297, -0.24273812770843506, 0.26233983039855957, 0.7674177885055542, 1.2724957466125488, 1.777573585510254, 2.282651662826538, 2.7877297401428223, 3.292806625366211, 3.797884464263916, 4.302962303161621, 4.808040618896484, 5.3131184577941895, 5.8181962966918945, 6.323274612426758, 6.828352451324463, 7.333430290222168, 7.838508129119873, 8.343585968017578, 8.848664283752441, 9.353742599487305, 9.858819961547852, 10.363898277282715, 10.868976593017578, 11.374053955078125, 11.879132270812988, 12.384209632873535, 12.889287948608398, 13.394365310668945, 13.899443626403809, 14.404521942138672, 14.909599304199219, 15.414677619934082, 15.919755935668945, 16.424833297729492, 16.92991065979004, 17.43498992919922, 17.940067291259766, 18.445144653320312, 18.950223922729492, 19.45530128479004]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 8.0, 12.0, 8.0, 12.0, 21.0, 17.0, 20.0, 26.0, 19.0, 19.0, 36.0, 39.0, 34.0, 50.0, 36.0, 34.0, 48.0, 36.0, 34.0, 27.0, 32.0, 51.0, 41.0, 30.0, 46.0, 32.0, 29.0, 17.0, 17.0, 24.0, 24.0, 20.0, 17.0, 22.0, 10.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.150748252868652, -14.656880378723145, -14.16301155090332, -13.669143676757812, -13.175275802612305, -12.681407928466797, -12.187540054321289, -11.693671226501465, -11.199803352355957, -10.70593547821045, -10.212066650390625, -9.718198776245117, -9.22433090209961, -8.730463027954102, -8.236595153808594, -7.7427263259887695, -7.248858451843262, -6.754990577697754, -6.261122226715088, -5.767253875732422, -5.273386001586914, -4.779518127441406, -4.28564977645874, -3.7917816638946533, -3.2979135513305664, -2.8040454387664795, -2.3101773262023926, -1.8163092136383057, -1.3224411010742188, -0.8285729885101318, -0.3347048759460449, 0.159163236618042, 0.6530323028564453, 1.1469004154205322, 1.6407685279846191, 2.134636640548706, 2.628504753112793, 3.12237286567688, 3.616240978240967, 4.110109329223633, 4.603977203369141, 5.097845077514648, 5.5917134284973145, 6.0855817794799805, 6.579449653625488, 7.073317527770996, 7.567185878753662, 8.061054229736328, 8.554922103881836, 9.048789978027344, 9.542657852172852, 10.036526679992676, 10.530394554138184, 11.024262428283691, 11.518131256103516, 12.011999130249023, 12.505867004394531, 12.999734878540039, 13.493602752685547, 13.987471580505371, 14.481339454650879, 14.975207328796387, 15.469076156616211, 15.962944030761719, 16.456811904907227]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 8.0, 3.0, 8.0, 5.0, 16.0, 34.0, 48.0, 60.0, 104.0, 170.0, 230.0, 385.0, 614.0, 967.0, 1519.0, 2533.0, 4422.0, 7186.0, 12105.0, 20538.0, 33703.0, 53443.0, 77913.0, 105755.0, 128928.0, 137892.0, 129632.0, 107662.0, 80254.0, 54482.0, 35096.0, 21172.0, 12735.0, 7486.0, 4441.0, 2692.0, 1628.0, 973.0, 612.0, 430.0, 209.0, 150.0, 113.0, 70.0, 47.0, 28.0, 20.0, 16.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.0596923828125, -10.697509765625, -10.3353271484375, -9.97314453125, -9.6109619140625, -9.248779296875, -8.8865966796875, -8.5244140625, -8.1622314453125, -7.800048828125, -7.4378662109375, -7.07568359375, -6.7135009765625, -6.351318359375, -5.9891357421875, -5.626953125, -5.2647705078125, -4.902587890625, -4.5404052734375, -4.17822265625, -3.8160400390625, -3.453857421875, -3.0916748046875, -2.7294921875, -2.3673095703125, -2.005126953125, -1.6429443359375, -1.28076171875, -0.9185791015625, -0.556396484375, -0.1942138671875, 0.16796875, 0.5301513671875, 0.892333984375, 1.2545166015625, 1.61669921875, 1.9788818359375, 2.341064453125, 2.7032470703125, 3.0654296875, 3.4276123046875, 3.789794921875, 4.1519775390625, 4.51416015625, 4.8763427734375, 5.238525390625, 5.6007080078125, 5.962890625, 6.3250732421875, 6.687255859375, 7.0494384765625, 7.41162109375, 7.7738037109375, 8.135986328125, 8.4981689453125, 8.8603515625, 9.2225341796875, 9.584716796875, 9.9468994140625, 10.30908203125, 10.6712646484375, 11.033447265625, 11.3956298828125, 11.7578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 10.0, 14.0, 15.0, 29.0, 30.0, 32.0, 29.0, 37.0, 32.0, 43.0, 38.0, 43.0, 42.0, 40.0, 36.0, 46.0, 42.0, 34.0, 43.0, 35.0, 36.0, 38.0, 31.0, 17.0, 37.0, 33.0, 24.0, 18.0, 10.0, 14.0, 6.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9140625, -15.3990478515625, -14.884033203125, -14.3690185546875, -13.85400390625, -13.3389892578125, -12.823974609375, -12.3089599609375, -11.7939453125, -11.2789306640625, -10.763916015625, -10.2489013671875, -9.73388671875, -9.2188720703125, -8.703857421875, -8.1888427734375, -7.673828125, -7.1588134765625, -6.643798828125, -6.1287841796875, -5.61376953125, -5.0987548828125, -4.583740234375, -4.0687255859375, -3.5537109375, -3.0386962890625, -2.523681640625, -2.0086669921875, -1.49365234375, -0.9786376953125, -0.463623046875, 0.0513916015625, 0.56640625, 1.0814208984375, 1.596435546875, 2.1114501953125, 2.62646484375, 3.1414794921875, 3.656494140625, 4.1715087890625, 4.6865234375, 5.2015380859375, 5.716552734375, 6.2315673828125, 6.74658203125, 7.2615966796875, 7.776611328125, 8.2916259765625, 8.806640625, 9.3216552734375, 9.836669921875, 10.3516845703125, 10.86669921875, 11.3817138671875, 11.896728515625, 12.4117431640625, 12.9267578125, 13.4417724609375, 13.956787109375, 14.4718017578125, 14.98681640625, 15.5018310546875, 16.016845703125, 16.5318603515625, 17.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 3.0, 9.0, 12.0, 21.0, 34.0, 32.0, 62.0, 118.0, 137.0, 227.0, 300.0, 477.0, 686.0, 959.0, 1398.0, 2047.0, 2978.0, 4301.0, 6098.0, 8560.0, 12544.0, 17930.0, 25440.0, 35481.0, 49428.0, 64344.0, 81795.0, 95891.0, 105061.0, 106385.0, 98117.0, 83876.0, 66725.0, 51236.0, 37435.0, 26606.0, 18966.0, 12999.0, 9159.0, 6178.0, 4453.0, 3188.0, 2215.0, 1444.0, 979.0, 711.0, 480.0, 336.0, 245.0, 165.0, 95.0, 73.0, 53.0, 25.0, 23.0, 16.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.2734375, -9.9317626953125, -9.590087890625, -9.2484130859375, -8.90673828125, -8.5650634765625, -8.223388671875, -7.8817138671875, -7.5400390625, -7.1983642578125, -6.856689453125, -6.5150146484375, -6.17333984375, -5.8316650390625, -5.489990234375, -5.1483154296875, -4.806640625, -4.4649658203125, -4.123291015625, -3.7816162109375, -3.43994140625, -3.0982666015625, -2.756591796875, -2.4149169921875, -2.0732421875, -1.7315673828125, -1.389892578125, -1.0482177734375, -0.70654296875, -0.3648681640625, -0.023193359375, 0.3184814453125, 0.66015625, 1.0018310546875, 1.343505859375, 1.6851806640625, 2.02685546875, 2.3685302734375, 2.710205078125, 3.0518798828125, 3.3935546875, 3.7352294921875, 4.076904296875, 4.4185791015625, 4.76025390625, 5.1019287109375, 5.443603515625, 5.7852783203125, 6.126953125, 6.4686279296875, 6.810302734375, 7.1519775390625, 7.49365234375, 7.8353271484375, 8.177001953125, 8.5186767578125, 8.8603515625, 9.2020263671875, 9.543701171875, 9.8853759765625, 10.22705078125, 10.5687255859375, 10.910400390625, 11.2520751953125, 11.59375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 11.0, 9.0, 10.0, 10.0, 10.0, 13.0, 15.0, 17.0, 22.0, 18.0, 20.0, 32.0, 40.0, 33.0, 28.0, 37.0, 40.0, 40.0, 39.0, 54.0, 37.0, 54.0, 36.0, 46.0, 43.0, 29.0, 36.0, 32.0, 16.0, 27.0, 13.0, 15.0, 18.0, 21.0, 18.0, 6.0, 11.0, 11.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.974365234375, -9.64404296875, -9.313720703125, -8.9833984375, -8.653076171875, -8.32275390625, -7.992431640625, -7.662109375, -7.331787109375, -7.00146484375, -6.671142578125, -6.3408203125, -6.010498046875, -5.68017578125, -5.349853515625, -5.01953125, -4.689208984375, -4.35888671875, -4.028564453125, -3.6982421875, -3.367919921875, -3.03759765625, -2.707275390625, -2.376953125, -2.046630859375, -1.71630859375, -1.385986328125, -1.0556640625, -0.725341796875, -0.39501953125, -0.064697265625, 0.265625, 0.595947265625, 0.92626953125, 1.256591796875, 1.5869140625, 1.917236328125, 2.24755859375, 2.577880859375, 2.908203125, 3.238525390625, 3.56884765625, 3.899169921875, 4.2294921875, 4.559814453125, 4.89013671875, 5.220458984375, 5.55078125, 5.881103515625, 6.21142578125, 6.541748046875, 6.8720703125, 7.202392578125, 7.53271484375, 7.863037109375, 8.193359375, 8.523681640625, 8.85400390625, 9.184326171875, 9.5146484375, 9.844970703125, 10.17529296875, 10.505615234375, 10.8359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 14.0, 21.0, 16.0, 26.0, 55.0, 77.0, 99.0, 145.0, 218.0, 298.0, 415.0, 656.0, 965.0, 1554.0, 2499.0, 4137.0, 7212.0, 13084.0, 24446.0, 45424.0, 80346.0, 128701.0, 170775.0, 181197.0, 150328.0, 102180.0, 60152.0, 32799.0, 17149.0, 9611.0, 5288.0, 3141.0, 1893.0, 1221.0, 757.0, 533.0, 348.0, 242.0, 140.0, 127.0, 69.0, 61.0, 42.0, 35.0, 20.0, 11.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.0546875, -3.92889404296875, -3.8031005859375, -3.67730712890625, -3.551513671875, -3.42572021484375, -3.2999267578125, -3.17413330078125, -3.04833984375, -2.92254638671875, -2.7967529296875, -2.67095947265625, -2.545166015625, -2.41937255859375, -2.2935791015625, -2.16778564453125, -2.0419921875, -1.91619873046875, -1.7904052734375, -1.66461181640625, -1.538818359375, -1.41302490234375, -1.2872314453125, -1.16143798828125, -1.03564453125, -0.90985107421875, -0.7840576171875, -0.65826416015625, -0.532470703125, -0.40667724609375, -0.2808837890625, -0.15509033203125, -0.029296875, 0.09649658203125, 0.2222900390625, 0.34808349609375, 0.473876953125, 0.59967041015625, 0.7254638671875, 0.85125732421875, 0.97705078125, 1.10284423828125, 1.2286376953125, 1.35443115234375, 1.480224609375, 1.60601806640625, 1.7318115234375, 1.85760498046875, 1.9833984375, 2.10919189453125, 2.2349853515625, 2.36077880859375, 2.486572265625, 2.61236572265625, 2.7381591796875, 2.86395263671875, 2.98974609375, 3.11553955078125, 3.2413330078125, 3.36712646484375, 3.492919921875, 3.61871337890625, 3.7445068359375, 3.87030029296875, 3.99609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 7.0, 11.0, 10.0, 11.0, 20.0, 23.0, 53.0, 57.0, 72.0, 63.0, 101.0, 87.0, 90.0, 83.0, 77.0, 50.0, 57.0, 45.0, 26.0, 21.0, 13.0, 8.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004978179931640625, -0.0004805848002433777, -0.00046335160732269287, -0.00044611841440200806, -0.00042888522148132324, -0.00041165202856063843, -0.0003944188356399536, -0.0003771856427192688, -0.000359952449798584, -0.00034271925687789917, -0.00032548606395721436, -0.00030825287103652954, -0.0002910196781158447, -0.0002737864851951599, -0.0002565532922744751, -0.00023932009935379028, -0.00022208690643310547, -0.00020485371351242065, -0.00018762052059173584, -0.00017038732767105103, -0.0001531541347503662, -0.0001359209418296814, -0.00011868774890899658, -0.00010145455598831177, -8.422136306762695e-05, -6.698817014694214e-05, -4.9754977226257324e-05, -3.252178430557251e-05, -1.5288591384887695e-05, 1.944601535797119e-06, 1.9177794456481934e-05, 3.641098737716675e-05, 5.364418029785156e-05, 7.087737321853638e-05, 8.811056613922119e-05, 0.000105343759059906, 0.00012257695198059082, 0.00013981014490127563, 0.00015704333782196045, 0.00017427653074264526, 0.00019150972366333008, 0.0002087429165840149, 0.0002259761095046997, 0.00024320930242538452, 0.00026044249534606934, 0.00027767568826675415, 0.00029490888118743896, 0.0003121420741081238, 0.0003293752670288086, 0.0003466084599494934, 0.0003638416528701782, 0.00038107484579086304, 0.00039830803871154785, 0.00041554123163223267, 0.0004327744245529175, 0.0004500076174736023, 0.0004672408103942871, 0.0004844740033149719, 0.0005017071962356567, 0.0005189403891563416, 0.0005361735820770264, 0.0005534067749977112, 0.000570639967918396, 0.0005878731608390808, 0.0006051063537597656]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 16.0, 13.0, 24.0, 41.0, 58.0, 109.0, 192.0, 306.0, 514.0, 880.0, 1388.0, 2496.0, 4275.0, 7439.0, 12917.0, 22506.0, 37941.0, 60463.0, 90516.0, 122301.0, 144542.0, 146518.0, 127864.0, 97408.0, 66863.0, 41818.0, 25006.0, 14381.0, 8418.0, 4700.0, 2725.0, 1513.0, 961.0, 550.0, 339.0, 216.0, 126.0, 80.0, 54.0, 36.0, 20.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40234375, -3.299560546875, -3.19677734375, -3.093994140625, -2.9912109375, -2.888427734375, -2.78564453125, -2.682861328125, -2.580078125, -2.477294921875, -2.37451171875, -2.271728515625, -2.1689453125, -2.066162109375, -1.96337890625, -1.860595703125, -1.7578125, -1.655029296875, -1.55224609375, -1.449462890625, -1.3466796875, -1.243896484375, -1.14111328125, -1.038330078125, -0.935546875, -0.832763671875, -0.72998046875, -0.627197265625, -0.5244140625, -0.421630859375, -0.31884765625, -0.216064453125, -0.11328125, -0.010498046875, 0.09228515625, 0.195068359375, 0.2978515625, 0.400634765625, 0.50341796875, 0.606201171875, 0.708984375, 0.811767578125, 0.91455078125, 1.017333984375, 1.1201171875, 1.222900390625, 1.32568359375, 1.428466796875, 1.53125, 1.634033203125, 1.73681640625, 1.839599609375, 1.9423828125, 2.045166015625, 2.14794921875, 2.250732421875, 2.353515625, 2.456298828125, 2.55908203125, 2.661865234375, 2.7646484375, 2.867431640625, 2.97021484375, 3.072998046875, 3.17578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 3.0, 7.0, 12.0, 8.0, 10.0, 12.0, 22.0, 15.0, 28.0, 24.0, 24.0, 38.0, 32.0, 38.0, 42.0, 43.0, 41.0, 61.0, 43.0, 47.0, 45.0, 49.0, 51.0, 37.0, 39.0, 38.0, 32.0, 25.0, 29.0, 22.0, 14.0, 15.0, 17.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5078125, -1.4646453857421875, -1.421478271484375, -1.3783111572265625, -1.33514404296875, -1.2919769287109375, -1.248809814453125, -1.2056427001953125, -1.1624755859375, -1.1193084716796875, -1.076141357421875, -1.0329742431640625, -0.98980712890625, -0.9466400146484375, -0.903472900390625, -0.8603057861328125, -0.817138671875, -0.7739715576171875, -0.730804443359375, -0.6876373291015625, -0.64447021484375, -0.6013031005859375, -0.558135986328125, -0.5149688720703125, -0.4718017578125, -0.4286346435546875, -0.385467529296875, -0.3423004150390625, -0.29913330078125, -0.2559661865234375, -0.212799072265625, -0.1696319580078125, -0.12646484375, -0.0832977294921875, -0.040130615234375, 0.0030364990234375, 0.04620361328125, 0.0893707275390625, 0.132537841796875, 0.1757049560546875, 0.2188720703125, 0.2620391845703125, 0.305206298828125, 0.3483734130859375, 0.39154052734375, 0.4347076416015625, 0.477874755859375, 0.5210418701171875, 0.564208984375, 0.6073760986328125, 0.650543212890625, 0.6937103271484375, 0.73687744140625, 0.7800445556640625, 0.823211669921875, 0.8663787841796875, 0.9095458984375, 0.9527130126953125, 0.995880126953125, 1.0390472412109375, 1.08221435546875, 1.1253814697265625, 1.168548583984375, 1.2117156982421875, 1.2548828125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 2.0, 9.0, 13.0, 10.0, 19.0, 13.0, 21.0, 23.0, 34.0, 32.0, 51.0, 54.0, 57.0, 62.0, 58.0, 47.0, 63.0, 60.0, 47.0, 47.0, 46.0, 46.0, 30.0, 25.0, 26.0, 28.0, 13.0, 15.0, 10.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.813426971435547, -12.302101135253906, -11.790776252746582, -11.279450416564941, -10.7681245803833, -10.256799697875977, -9.745473861694336, -9.234148025512695, -8.722822189331055, -8.211496353149414, -7.700170993804932, -7.188845634460449, -6.677519798278809, -6.166194438934326, -5.654869079589844, -5.143543243408203, -4.632218360900879, -4.1208930015563965, -3.609567165374756, -3.0982418060302734, -2.586916208267212, -2.0755906105041504, -1.564265251159668, -1.0529396533966064, -0.5416140556335449, -0.030288517475128174, 0.4810370206832886, 0.9923624992370605, 1.503688097000122, 2.0150136947631836, 2.526339054107666, 3.0376646518707275, 3.548990249633789, 4.0603156089782715, 4.571641445159912, 5.0829668045043945, 5.594292640686035, 6.105618000030518, 6.616943359375, 7.128269195556641, 7.639594554901123, 8.150919914245605, 8.662245750427246, 9.17357063293457, 9.684896469116211, 10.196222305297852, 10.707548141479492, 11.218873023986816, 11.730198860168457, 12.241524696350098, 12.752849578857422, 13.264175415039062, 13.775501251220703, 14.286827087402344, 14.798151969909668, 15.309477806091309, 15.820802688598633, 16.332128524780273, 16.843454360961914, 17.354778289794922, 17.866104125976562, 18.377429962158203, 18.888755798339844, 19.400081634521484, 19.911407470703125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 8.0, 5.0, 15.0, 18.0, 8.0, 13.0, 30.0, 28.0, 27.0, 21.0, 39.0, 18.0, 39.0, 33.0, 37.0, 48.0, 38.0, 38.0, 45.0, 35.0, 29.0, 40.0, 44.0, 41.0, 29.0, 40.0, 20.0, 35.0, 25.0, 17.0, 18.0, 17.0, 13.0, 10.0, 13.0, 8.0, 14.0, 7.0, 4.0, 10.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.93558120727539, -14.427531242370605, -13.919480323791504, -13.411430358886719, -12.903379440307617, -12.395329475402832, -11.887279510498047, -11.379228591918945, -10.87117862701416, -10.363128662109375, -9.855077743530273, -9.347027778625488, -8.838977813720703, -8.330926895141602, -7.822876930236816, -7.314826488494873, -6.80677604675293, -6.298725605010986, -5.790675163269043, -5.282625198364258, -4.7745747566223145, -4.266524314880371, -3.758474111557007, -3.2504239082336426, -2.742373466491699, -2.234323024749756, -1.7262728214263916, -1.2182224988937378, -0.710172176361084, -0.20212173461914062, 0.30592846870422363, 0.8139786720275879, 1.322031021118164, 1.8300813436508179, 2.3381316661834717, 2.846181869506836, 3.3542323112487793, 3.8622827529907227, 4.370332717895508, 4.878383159637451, 5.3864336013793945, 5.894484043121338, 6.402534484863281, 6.910584449768066, 7.41863489151001, 7.926685333251953, 8.434735298156738, 8.942785263061523, 9.450836181640625, 9.95888614654541, 10.466937065124512, 10.974987030029297, 11.483037948608398, 11.991087913513184, 12.499137878417969, 13.00718879699707, 13.515238761901855, 14.02328872680664, 14.531339645385742, 15.039389610290527, 15.547439575195312, 16.055490493774414, 16.563541412353516, 17.071590423583984, 17.579641342163086]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 14.0, 30.0, 53.0, 89.0, 144.0, 211.0, 326.0, 606.0, 977.0, 1583.0, 2780.0, 4868.0, 8486.0, 14804.0, 26570.0, 46978.0, 84637.0, 148337.0, 250288.0, 387903.0, 535200.0, 631990.0, 623229.0, 514339.0, 365917.0, 230262.0, 135542.0, 77418.0, 43173.0, 24368.0, 13660.0, 8053.0, 4642.0, 2764.0, 1478.0, 989.0, 574.0, 369.0, 208.0, 150.0, 78.0, 58.0, 42.0, 24.0, 15.0, 16.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.09375, -8.779296875, -8.46484375, -8.150390625, -7.8359375, -7.521484375, -7.20703125, -6.892578125, -6.578125, -6.263671875, -5.94921875, -5.634765625, -5.3203125, -5.005859375, -4.69140625, -4.376953125, -4.0625, -3.748046875, -3.43359375, -3.119140625, -2.8046875, -2.490234375, -2.17578125, -1.861328125, -1.546875, -1.232421875, -0.91796875, -0.603515625, -0.2890625, 0.025390625, 0.33984375, 0.654296875, 0.96875, 1.283203125, 1.59765625, 1.912109375, 2.2265625, 2.541015625, 2.85546875, 3.169921875, 3.484375, 3.798828125, 4.11328125, 4.427734375, 4.7421875, 5.056640625, 5.37109375, 5.685546875, 6.0, 6.314453125, 6.62890625, 6.943359375, 7.2578125, 7.572265625, 7.88671875, 8.201171875, 8.515625, 8.830078125, 9.14453125, 9.458984375, 9.7734375, 10.087890625, 10.40234375, 10.716796875, 11.03125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 3.0, 8.0, 7.0, 12.0, 8.0, 15.0, 19.0, 17.0, 27.0, 32.0, 24.0, 21.0, 40.0, 27.0, 34.0, 51.0, 36.0, 45.0, 47.0, 32.0, 34.0, 30.0, 30.0, 44.0, 47.0, 32.0, 41.0, 34.0, 29.0, 25.0, 15.0, 14.0, 15.0, 15.0, 16.0, 11.0, 8.0, 10.0, 9.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.34375, -11.9423828125, -11.541015625, -11.1396484375, -10.73828125, -10.3369140625, -9.935546875, -9.5341796875, -9.1328125, -8.7314453125, -8.330078125, -7.9287109375, -7.52734375, -7.1259765625, -6.724609375, -6.3232421875, -5.921875, -5.5205078125, -5.119140625, -4.7177734375, -4.31640625, -3.9150390625, -3.513671875, -3.1123046875, -2.7109375, -2.3095703125, -1.908203125, -1.5068359375, -1.10546875, -0.7041015625, -0.302734375, 0.0986328125, 0.5, 0.9013671875, 1.302734375, 1.7041015625, 2.10546875, 2.5068359375, 2.908203125, 3.3095703125, 3.7109375, 4.1123046875, 4.513671875, 4.9150390625, 5.31640625, 5.7177734375, 6.119140625, 6.5205078125, 6.921875, 7.3232421875, 7.724609375, 8.1259765625, 8.52734375, 8.9287109375, 9.330078125, 9.7314453125, 10.1328125, 10.5341796875, 10.935546875, 11.3369140625, 11.73828125, 12.1396484375, 12.541015625, 12.9423828125, 13.34375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 18.0, 30.0, 39.0, 65.0, 92.0, 147.0, 287.0, 486.0, 827.0, 1433.0, 2551.0, 4685.0, 8627.0, 15705.0, 28783.0, 53383.0, 96054.0, 167413.0, 276733.0, 417162.0, 559127.0, 641100.0, 608113.0, 485752.0, 336154.0, 210566.0, 124247.0, 70068.0, 38590.0, 21075.0, 11248.0, 6139.0, 3382.0, 1760.0, 1027.0, 613.0, 330.0, 192.0, 92.0, 77.0, 44.0, 22.0, 12.0, 11.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.4439697265625, -11.083251953125, -10.7225341796875, -10.36181640625, -10.0010986328125, -9.640380859375, -9.2796630859375, -8.9189453125, -8.5582275390625, -8.197509765625, -7.8367919921875, -7.47607421875, -7.1153564453125, -6.754638671875, -6.3939208984375, -6.033203125, -5.6724853515625, -5.311767578125, -4.9510498046875, -4.59033203125, -4.2296142578125, -3.868896484375, -3.5081787109375, -3.1474609375, -2.7867431640625, -2.426025390625, -2.0653076171875, -1.70458984375, -1.3438720703125, -0.983154296875, -0.6224365234375, -0.26171875, 0.0989990234375, 0.459716796875, 0.8204345703125, 1.18115234375, 1.5418701171875, 1.902587890625, 2.2633056640625, 2.6240234375, 2.9847412109375, 3.345458984375, 3.7061767578125, 4.06689453125, 4.4276123046875, 4.788330078125, 5.1490478515625, 5.509765625, 5.8704833984375, 6.231201171875, 6.5919189453125, 6.95263671875, 7.3133544921875, 7.674072265625, 8.0347900390625, 8.3955078125, 8.7562255859375, 9.116943359375, 9.4776611328125, 9.83837890625, 10.1990966796875, 10.559814453125, 10.9205322265625, 11.28125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 10.0, 11.0, 20.0, 30.0, 23.0, 36.0, 57.0, 72.0, 81.0, 108.0, 114.0, 141.0, 174.0, 187.0, 171.0, 233.0, 250.0, 266.0, 240.0, 237.0, 206.0, 205.0, 193.0, 159.0, 156.0, 113.0, 99.0, 66.0, 75.0, 66.0, 54.0, 46.0, 25.0, 28.0, 23.0, 24.0, 12.0, 14.0, 8.0, 4.0, 4.0, 2.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.69140625, -5.52020263671875, -5.3489990234375, -5.17779541015625, -5.006591796875, -4.83538818359375, -4.6641845703125, -4.49298095703125, -4.32177734375, -4.15057373046875, -3.9793701171875, -3.80816650390625, -3.636962890625, -3.46575927734375, -3.2945556640625, -3.12335205078125, -2.9521484375, -2.78094482421875, -2.6097412109375, -2.43853759765625, -2.267333984375, -2.09613037109375, -1.9249267578125, -1.75372314453125, -1.58251953125, -1.41131591796875, -1.2401123046875, -1.06890869140625, -0.897705078125, -0.72650146484375, -0.5552978515625, -0.38409423828125, -0.212890625, -0.04168701171875, 0.1295166015625, 0.30072021484375, 0.471923828125, 0.64312744140625, 0.8143310546875, 0.98553466796875, 1.15673828125, 1.32794189453125, 1.4991455078125, 1.67034912109375, 1.841552734375, 2.01275634765625, 2.1839599609375, 2.35516357421875, 2.5263671875, 2.69757080078125, 2.8687744140625, 3.03997802734375, 3.211181640625, 3.38238525390625, 3.5535888671875, 3.72479248046875, 3.89599609375, 4.06719970703125, 4.2384033203125, 4.40960693359375, 4.580810546875, 4.75201416015625, 4.9232177734375, 5.09442138671875, 5.265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 8.0, 11.0, 14.0, 18.0, 22.0, 30.0, 27.0, 42.0, 51.0, 52.0, 52.0, 47.0, 51.0, 47.0, 57.0, 55.0, 52.0, 58.0, 48.0, 47.0, 25.0, 23.0, 29.0, 18.0, 15.0, 21.0, 10.0, 17.0, 14.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.007128715515137, -9.556267738342285, -9.105405807495117, -8.654544830322266, -8.203682899475098, -7.752821922302246, -7.301960468292236, -6.851099014282227, -6.400237560272217, -5.949376106262207, -5.498514652252197, -5.0476531982421875, -4.596792221069336, -4.145930290222168, -3.6950693130493164, -3.2442078590393066, -2.793346405029297, -2.342484951019287, -1.891623616218567, -1.4407622814178467, -0.9899008274078369, -0.5390393733978271, -0.08817815780639648, 0.3626832962036133, 0.813544750213623, 1.2644062042236328, 1.715267539024353, 2.1661288738250732, 2.616990327835083, 3.0678517818450928, 3.5187129974365234, 3.969574451446533, 4.420434951782227, 4.871296405792236, 5.322157859802246, 5.773018836975098, 6.223880767822266, 6.674741744995117, 7.125603199005127, 7.576464653015137, 8.027326583862305, 8.478187561035156, 8.929049491882324, 9.379910469055176, 9.830772399902344, 10.281633377075195, 10.732494354248047, 11.183356285095215, 11.634217262268066, 12.085078239440918, 12.535940170288086, 12.986801147460938, 13.437663078308105, 13.888524055480957, 14.339385986328125, 14.790246963500977, 15.241107940673828, 15.69196891784668, 16.14282989501953, 16.593692779541016, 17.044553756713867, 17.49541473388672, 17.94627571105957, 18.397136688232422, 18.847999572753906]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 3.0, 9.0, 7.0, 18.0, 17.0, 15.0, 29.0, 18.0, 34.0, 22.0, 30.0, 27.0, 33.0, 41.0, 36.0, 32.0, 40.0, 36.0, 47.0, 45.0, 51.0, 33.0, 52.0, 30.0, 33.0, 32.0, 31.0, 33.0, 22.0, 19.0, 20.0, 15.0, 14.0, 18.0, 13.0, 7.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.328036308288574, -14.82581901550293, -14.323601722717285, -13.82138442993164, -13.31916618347168, -12.816949844360352, -12.31473159790039, -11.812514305114746, -11.310297012329102, -10.808079719543457, -10.305862426757812, -9.803645133972168, -9.301427841186523, -8.799209594726562, -8.296992301940918, -7.794775009155273, -7.292557716369629, -6.790340423583984, -6.28812313079834, -5.785905361175537, -5.283688068389893, -4.781470775604248, -4.279253005981445, -3.777035713195801, -3.2748184204101562, -2.7726011276245117, -2.270383596420288, -1.768166184425354, -1.26594877243042, -0.7637314796447754, -0.26151394844055176, 0.24070358276367188, 0.742919921875, 1.245137333869934, 1.7473547458648682, 2.249572277069092, 2.7517895698547363, 3.254006862640381, 3.7562243938446045, 4.258441925048828, 4.760659217834473, 5.262876510620117, 5.765093803405762, 6.2673115730285645, 6.769528865814209, 7.2717461585998535, 7.773963928222656, 8.2761812210083, 8.778398513793945, 9.28061580657959, 9.782833099365234, 10.285050392150879, 10.787267684936523, 11.289485931396484, 11.791703224182129, 12.293920516967773, 12.796137809753418, 13.298355102539062, 13.800572395324707, 14.302789688110352, 14.805007934570312, 15.30722427368164, 15.809442520141602, 16.311660766601562, 16.81387710571289]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 10.0, 11.0, 24.0, 31.0, 46.0, 81.0, 134.0, 211.0, 366.0, 600.0, 1030.0, 1816.0, 3257.0, 6316.0, 11882.0, 23167.0, 45639.0, 86648.0, 152423.0, 218237.0, 206859.0, 134373.0, 74618.0, 38708.0, 19737.0, 10355.0, 5373.0, 2834.0, 1541.0, 862.0, 533.0, 346.0, 178.0, 106.0, 86.0, 38.0, 26.0, 17.0, 10.0, 10.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4453125, -13.0235595703125, -12.601806640625, -12.1800537109375, -11.75830078125, -11.3365478515625, -10.914794921875, -10.4930419921875, -10.0712890625, -9.6495361328125, -9.227783203125, -8.8060302734375, -8.38427734375, -7.9625244140625, -7.540771484375, -7.1190185546875, -6.697265625, -6.2755126953125, -5.853759765625, -5.4320068359375, -5.01025390625, -4.5885009765625, -4.166748046875, -3.7449951171875, -3.3232421875, -2.9014892578125, -2.479736328125, -2.0579833984375, -1.63623046875, -1.2144775390625, -0.792724609375, -0.3709716796875, 0.05078125, 0.4725341796875, 0.894287109375, 1.3160400390625, 1.73779296875, 2.1595458984375, 2.581298828125, 3.0030517578125, 3.4248046875, 3.8465576171875, 4.268310546875, 4.6900634765625, 5.11181640625, 5.5335693359375, 5.955322265625, 6.3770751953125, 6.798828125, 7.2205810546875, 7.642333984375, 8.0640869140625, 8.48583984375, 8.9075927734375, 9.329345703125, 9.7510986328125, 10.1728515625, 10.5946044921875, 11.016357421875, 11.4381103515625, 11.85986328125, 12.2816162109375, 12.703369140625, 13.1251220703125, 13.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 7.0, 10.0, 19.0, 25.0, 14.0, 25.0, 19.0, 28.0, 29.0, 40.0, 33.0, 29.0, 31.0, 43.0, 39.0, 40.0, 44.0, 52.0, 46.0, 40.0, 39.0, 44.0, 37.0, 37.0, 29.0, 34.0, 24.0, 17.0, 21.0, 18.0, 15.0, 14.0, 12.0, 10.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.328125, -14.81787109375, -14.3076171875, -13.79736328125, -13.287109375, -12.77685546875, -12.2666015625, -11.75634765625, -11.24609375, -10.73583984375, -10.2255859375, -9.71533203125, -9.205078125, -8.69482421875, -8.1845703125, -7.67431640625, -7.1640625, -6.65380859375, -6.1435546875, -5.63330078125, -5.123046875, -4.61279296875, -4.1025390625, -3.59228515625, -3.08203125, -2.57177734375, -2.0615234375, -1.55126953125, -1.041015625, -0.53076171875, -0.0205078125, 0.48974609375, 1.0, 1.51025390625, 2.0205078125, 2.53076171875, 3.041015625, 3.55126953125, 4.0615234375, 4.57177734375, 5.08203125, 5.59228515625, 6.1025390625, 6.61279296875, 7.123046875, 7.63330078125, 8.1435546875, 8.65380859375, 9.1640625, 9.67431640625, 10.1845703125, 10.69482421875, 11.205078125, 11.71533203125, 12.2255859375, 12.73583984375, 13.24609375, 13.75634765625, 14.2666015625, 14.77685546875, 15.287109375, 15.79736328125, 16.3076171875, 16.81787109375, 17.328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 5.0, 8.0, 18.0, 20.0, 37.0, 30.0, 59.0, 83.0, 123.0, 197.0, 296.0, 429.0, 727.0, 1142.0, 1878.0, 3205.0, 5673.0, 10282.0, 20109.0, 40019.0, 81285.0, 154893.0, 238437.0, 220186.0, 131718.0, 66784.0, 33178.0, 16534.0, 9052.0, 4847.0, 2740.0, 1691.0, 1019.0, 625.0, 423.0, 274.0, 174.0, 124.0, 67.0, 56.0, 36.0, 18.0, 15.0, 15.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.1011962890625, -10.741455078125, -10.3817138671875, -10.02197265625, -9.6622314453125, -9.302490234375, -8.9427490234375, -8.5830078125, -8.2232666015625, -7.863525390625, -7.5037841796875, -7.14404296875, -6.7843017578125, -6.424560546875, -6.0648193359375, -5.705078125, -5.3453369140625, -4.985595703125, -4.6258544921875, -4.26611328125, -3.9063720703125, -3.546630859375, -3.1868896484375, -2.8271484375, -2.4674072265625, -2.107666015625, -1.7479248046875, -1.38818359375, -1.0284423828125, -0.668701171875, -0.3089599609375, 0.05078125, 0.4105224609375, 0.770263671875, 1.1300048828125, 1.48974609375, 1.8494873046875, 2.209228515625, 2.5689697265625, 2.9287109375, 3.2884521484375, 3.648193359375, 4.0079345703125, 4.36767578125, 4.7274169921875, 5.087158203125, 5.4468994140625, 5.806640625, 6.1663818359375, 6.526123046875, 6.8858642578125, 7.24560546875, 7.6053466796875, 7.965087890625, 8.3248291015625, 8.6845703125, 9.0443115234375, 9.404052734375, 9.7637939453125, 10.12353515625, 10.4832763671875, 10.843017578125, 11.2027587890625, 11.5625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 8.0, 15.0, 11.0, 9.0, 17.0, 18.0, 15.0, 25.0, 26.0, 29.0, 34.0, 30.0, 35.0, 36.0, 36.0, 44.0, 34.0, 42.0, 39.0, 28.0, 50.0, 41.0, 38.0, 36.0, 40.0, 35.0, 21.0, 34.0, 31.0, 14.0, 22.0, 14.0, 24.0, 9.0, 16.0, 10.0, 3.0, 7.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.3671875, -13.92041015625, -13.4736328125, -13.02685546875, -12.580078125, -12.13330078125, -11.6865234375, -11.23974609375, -10.79296875, -10.34619140625, -9.8994140625, -9.45263671875, -9.005859375, -8.55908203125, -8.1123046875, -7.66552734375, -7.21875, -6.77197265625, -6.3251953125, -5.87841796875, -5.431640625, -4.98486328125, -4.5380859375, -4.09130859375, -3.64453125, -3.19775390625, -2.7509765625, -2.30419921875, -1.857421875, -1.41064453125, -0.9638671875, -0.51708984375, -0.0703125, 0.37646484375, 0.8232421875, 1.27001953125, 1.716796875, 2.16357421875, 2.6103515625, 3.05712890625, 3.50390625, 3.95068359375, 4.3974609375, 4.84423828125, 5.291015625, 5.73779296875, 6.1845703125, 6.63134765625, 7.078125, 7.52490234375, 7.9716796875, 8.41845703125, 8.865234375, 9.31201171875, 9.7587890625, 10.20556640625, 10.65234375, 11.09912109375, 11.5458984375, 11.99267578125, 12.439453125, 12.88623046875, 13.3330078125, 13.77978515625, 14.2265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 7.0, 14.0, 7.0, 10.0, 12.0, 19.0, 39.0, 40.0, 64.0, 83.0, 107.0, 168.0, 223.0, 349.0, 507.0, 741.0, 1167.0, 1848.0, 3113.0, 5169.0, 9439.0, 17792.0, 37197.0, 85908.0, 229881.0, 389375.0, 146990.0, 59187.0, 26831.0, 13456.0, 7395.0, 4245.0, 2515.0, 1561.0, 1004.0, 620.0, 453.0, 312.0, 181.0, 155.0, 104.0, 84.0, 52.0, 44.0, 30.0, 17.0, 16.0, 10.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.078125, -9.7218017578125, -9.365478515625, -9.0091552734375, -8.65283203125, -8.2965087890625, -7.940185546875, -7.5838623046875, -7.2275390625, -6.8712158203125, -6.514892578125, -6.1585693359375, -5.80224609375, -5.4459228515625, -5.089599609375, -4.7332763671875, -4.376953125, -4.0206298828125, -3.664306640625, -3.3079833984375, -2.95166015625, -2.5953369140625, -2.239013671875, -1.8826904296875, -1.5263671875, -1.1700439453125, -0.813720703125, -0.4573974609375, -0.10107421875, 0.2552490234375, 0.611572265625, 0.9678955078125, 1.32421875, 1.6805419921875, 2.036865234375, 2.3931884765625, 2.74951171875, 3.1058349609375, 3.462158203125, 3.8184814453125, 4.1748046875, 4.5311279296875, 4.887451171875, 5.2437744140625, 5.60009765625, 5.9564208984375, 6.312744140625, 6.6690673828125, 7.025390625, 7.3817138671875, 7.738037109375, 8.0943603515625, 8.45068359375, 8.8070068359375, 9.163330078125, 9.5196533203125, 9.8759765625, 10.2322998046875, 10.588623046875, 10.9449462890625, 11.30126953125, 11.6575927734375, 12.013916015625, 12.3702392578125, 12.7265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 9.0, 7.0, 16.0, 11.0, 28.0, 17.0, 19.0, 42.0, 55.0, 68.0, 96.0, 100.0, 99.0, 101.0, 61.0, 57.0, 44.0, 32.0, 32.0, 14.0, 13.0, 21.0, 9.0, 7.0, 4.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010061264038085938, -0.0009645968675613403, -0.0009230673313140869, -0.0008815377950668335, -0.0008400082588195801, -0.0007984787225723267, -0.0007569491863250732, -0.0007154196500778198, -0.0006738901138305664, -0.000632360577583313, -0.0005908310413360596, -0.0005493015050888062, -0.0005077719688415527, -0.0004662424325942993, -0.0004247128963470459, -0.0003831833600997925, -0.00034165382385253906, -0.00030012428760528564, -0.0002585947513580322, -0.0002170652151107788, -0.0001755356788635254, -0.00013400614261627197, -9.247660636901855e-05, -5.094707012176514e-05, -9.417533874511719e-06, 3.21120023727417e-05, 7.364153861999512e-05, 0.00011517107486724854, 0.00015670061111450195, 0.00019823014736175537, 0.0002397596836090088, 0.0002812892198562622, 0.0003228187561035156, 0.00036434829235076904, 0.00040587782859802246, 0.0004474073648452759, 0.0004889369010925293, 0.0005304664373397827, 0.0005719959735870361, 0.0006135255098342896, 0.000655055046081543, 0.0006965845823287964, 0.0007381141185760498, 0.0007796436548233032, 0.0008211731910705566, 0.0008627027273178101, 0.0009042322635650635, 0.0009457617998123169, 0.0009872913360595703, 0.0010288208723068237, 0.0010703504085540771, 0.0011118799448013306, 0.001153409481048584, 0.0011949390172958374, 0.0012364685535430908, 0.0012779980897903442, 0.0013195276260375977, 0.001361057162284851, 0.0014025866985321045, 0.001444116234779358, 0.0014856457710266113, 0.0015271753072738647, 0.0015687048435211182, 0.0016102343797683716, 0.001651763916015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 11.0, 9.0, 16.0, 13.0, 27.0, 28.0, 55.0, 65.0, 84.0, 108.0, 159.0, 237.0, 343.0, 448.0, 698.0, 1089.0, 1658.0, 2521.0, 3952.0, 6507.0, 10137.0, 16797.0, 27921.0, 47402.0, 81717.0, 145178.0, 248067.0, 193884.0, 106225.0, 60765.0, 36105.0, 21381.0, 12773.0, 7950.0, 4934.0, 3151.0, 2018.0, 1284.0, 950.0, 573.0, 392.0, 288.0, 182.0, 145.0, 90.0, 61.0, 44.0, 41.0, 28.0, 18.0, 13.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-9.5703125, -9.2779541015625, -8.985595703125, -8.6932373046875, -8.40087890625, -8.1085205078125, -7.816162109375, -7.5238037109375, -7.2314453125, -6.9390869140625, -6.646728515625, -6.3543701171875, -6.06201171875, -5.7696533203125, -5.477294921875, -5.1849365234375, -4.892578125, -4.6002197265625, -4.307861328125, -4.0155029296875, -3.72314453125, -3.4307861328125, -3.138427734375, -2.8460693359375, -2.5537109375, -2.2613525390625, -1.968994140625, -1.6766357421875, -1.38427734375, -1.0919189453125, -0.799560546875, -0.5072021484375, -0.21484375, 0.0775146484375, 0.369873046875, 0.6622314453125, 0.95458984375, 1.2469482421875, 1.539306640625, 1.8316650390625, 2.1240234375, 2.4163818359375, 2.708740234375, 3.0010986328125, 3.29345703125, 3.5858154296875, 3.878173828125, 4.1705322265625, 4.462890625, 4.7552490234375, 5.047607421875, 5.3399658203125, 5.63232421875, 5.9246826171875, 6.217041015625, 6.5093994140625, 6.8017578125, 7.0941162109375, 7.386474609375, 7.6788330078125, 7.97119140625, 8.2635498046875, 8.555908203125, 8.8482666015625, 9.140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 4.0, 7.0, 3.0, 9.0, 11.0, 11.0, 17.0, 11.0, 13.0, 23.0, 19.0, 32.0, 28.0, 39.0, 50.0, 49.0, 60.0, 87.0, 85.0, 81.0, 71.0, 39.0, 46.0, 29.0, 33.0, 21.0, 28.0, 18.0, 16.0, 8.0, 9.0, 16.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.230224609375, -4.06982421875, -3.909423828125, -3.7490234375, -3.588623046875, -3.42822265625, -3.267822265625, -3.107421875, -2.947021484375, -2.78662109375, -2.626220703125, -2.4658203125, -2.305419921875, -2.14501953125, -1.984619140625, -1.82421875, -1.663818359375, -1.50341796875, -1.343017578125, -1.1826171875, -1.022216796875, -0.86181640625, -0.701416015625, -0.541015625, -0.380615234375, -0.22021484375, -0.059814453125, 0.1005859375, 0.260986328125, 0.42138671875, 0.581787109375, 0.7421875, 0.902587890625, 1.06298828125, 1.223388671875, 1.3837890625, 1.544189453125, 1.70458984375, 1.864990234375, 2.025390625, 2.185791015625, 2.34619140625, 2.506591796875, 2.6669921875, 2.827392578125, 2.98779296875, 3.148193359375, 3.30859375, 3.468994140625, 3.62939453125, 3.789794921875, 3.9501953125, 4.110595703125, 4.27099609375, 4.431396484375, 4.591796875, 4.752197265625, 4.91259765625, 5.072998046875, 5.2333984375, 5.393798828125, 5.55419921875, 5.714599609375, 5.875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 17.0, 13.0, 19.0, 20.0, 28.0, 32.0, 24.0, 50.0, 44.0, 61.0, 50.0, 53.0, 40.0, 49.0, 74.0, 45.0, 58.0, 39.0, 37.0, 31.0, 39.0, 34.0, 23.0, 17.0, 17.0, 10.0, 15.0, 8.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.294434547424316, -13.847912788391113, -13.40139102935791, -12.954869270324707, -12.508347511291504, -12.0618257522583, -11.615303993225098, -11.168782234191895, -10.722260475158691, -10.275738716125488, -9.829216957092285, -9.382695198059082, -8.936173439025879, -8.489651679992676, -8.043129920959473, -7.5966081619262695, -7.150086402893066, -6.703564643859863, -6.25704288482666, -5.810521125793457, -5.363999366760254, -4.917477607727051, -4.470955848693848, -4.0244340896606445, -3.5779123306274414, -3.1313905715942383, -2.684868812561035, -2.238347053527832, -1.791825294494629, -1.3453035354614258, -0.8987817764282227, -0.45226001739501953, -0.0057392120361328125, 0.4407825469970703, 0.8873043060302734, 1.3338260650634766, 1.7803478240966797, 2.226869583129883, 2.673391342163086, 3.119913101196289, 3.566434860229492, 4.012956619262695, 4.459478378295898, 4.906000137329102, 5.352521896362305, 5.799043655395508, 6.245565414428711, 6.692087173461914, 7.138608932495117, 7.58513069152832, 8.031652450561523, 8.478174209594727, 8.92469596862793, 9.371217727661133, 9.817739486694336, 10.264261245727539, 10.710783004760742, 11.157304763793945, 11.603826522827148, 12.050348281860352, 12.496870040893555, 12.943391799926758, 13.389913558959961, 13.836435317993164, 14.282957077026367]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 10.0, 8.0, 10.0, 13.0, 16.0, 15.0, 25.0, 28.0, 24.0, 21.0, 34.0, 32.0, 34.0, 25.0, 35.0, 43.0, 39.0, 21.0, 31.0, 39.0, 36.0, 41.0, 36.0, 33.0, 24.0, 27.0, 41.0, 27.0, 22.0, 30.0, 23.0, 20.0, 19.0, 15.0, 15.0, 7.0, 13.0, 13.0, 7.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.888408660888672, -13.430651664733887, -12.972894668579102, -12.515137672424316, -12.057380676269531, -11.599623680114746, -11.141866683959961, -10.68410873413086, -10.22635269165039, -9.768595695495605, -9.31083869934082, -8.853081703186035, -8.39532470703125, -7.937567710876465, -7.4798102378845215, -7.022053241729736, -6.564295768737793, -6.106538772583008, -5.648781776428223, -5.1910247802734375, -4.733267784118652, -4.275510787963867, -3.817753314971924, -3.3599963188171387, -2.9022393226623535, -2.4444823265075684, -1.9867252111434937, -1.528968095779419, -1.0712110996246338, -0.6134541034698486, -0.15569686889648438, 0.3020601272583008, 0.7598171234130859, 1.217574119567871, 1.6753312349319458, 2.1330883502960205, 2.5908453464508057, 3.048602342605591, 3.506359577178955, 3.9641165733337402, 4.421873569488525, 4.8796305656433105, 5.337387561798096, 5.795145034790039, 6.252902030944824, 6.710659027099609, 7.1684160232543945, 7.62617301940918, 8.083930015563965, 8.54168701171875, 8.999444007873535, 9.45720100402832, 9.914958000183105, 10.37271499633789, 10.830472946166992, 11.288228988647461, 11.745986938476562, 12.203743934631348, 12.661500930786133, 13.119257926940918, 13.577014923095703, 14.034771919250488, 14.492528915405273, 14.950286865234375, 15.408042907714844]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 8.0, 11.0, 28.0, 31.0, 44.0, 65.0, 99.0, 153.0, 244.0, 403.0, 626.0, 955.0, 1591.0, 2487.0, 3809.0, 5874.0, 9202.0, 14116.0, 21505.0, 31765.0, 45675.0, 62422.0, 82257.0, 99120.0, 111704.0, 114352.0, 106645.0, 91821.0, 72586.0, 54293.0, 38420.0, 26212.0, 17524.0, 11764.0, 7405.0, 4825.0, 3056.0, 1957.0, 1171.0, 822.0, 531.0, 350.0, 215.0, 153.0, 100.0, 54.0, 34.0, 23.0, 16.0, 11.0, 8.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8104248046875, -8.519287109375, -8.2281494140625, -7.93701171875, -7.6458740234375, -7.354736328125, -7.0635986328125, -6.7724609375, -6.4813232421875, -6.190185546875, -5.8990478515625, -5.60791015625, -5.3167724609375, -5.025634765625, -4.7344970703125, -4.443359375, -4.1522216796875, -3.861083984375, -3.5699462890625, -3.27880859375, -2.9876708984375, -2.696533203125, -2.4053955078125, -2.1142578125, -1.8231201171875, -1.531982421875, -1.2408447265625, -0.94970703125, -0.6585693359375, -0.367431640625, -0.0762939453125, 0.21484375, 0.5059814453125, 0.797119140625, 1.0882568359375, 1.37939453125, 1.6705322265625, 1.961669921875, 2.2528076171875, 2.5439453125, 2.8350830078125, 3.126220703125, 3.4173583984375, 3.70849609375, 3.9996337890625, 4.290771484375, 4.5819091796875, 4.873046875, 5.1641845703125, 5.455322265625, 5.7464599609375, 6.03759765625, 6.3287353515625, 6.619873046875, 6.9110107421875, 7.2021484375, 7.4932861328125, 7.784423828125, 8.0755615234375, 8.36669921875, 8.6578369140625, 8.948974609375, 9.2401123046875, 9.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 11.0, 15.0, 14.0, 13.0, 28.0, 29.0, 28.0, 30.0, 32.0, 23.0, 38.0, 38.0, 32.0, 44.0, 38.0, 32.0, 30.0, 38.0, 45.0, 33.0, 47.0, 23.0, 35.0, 31.0, 34.0, 32.0, 33.0, 16.0, 24.0, 10.0, 20.0, 17.0, 16.0, 12.0, 8.0, 3.0, 7.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.6634521484375, -14.186279296875, -13.7091064453125, -13.23193359375, -12.7547607421875, -12.277587890625, -11.8004150390625, -11.3232421875, -10.8460693359375, -10.368896484375, -9.8917236328125, -9.41455078125, -8.9373779296875, -8.460205078125, -7.9830322265625, -7.505859375, -7.0286865234375, -6.551513671875, -6.0743408203125, -5.59716796875, -5.1199951171875, -4.642822265625, -4.1656494140625, -3.6884765625, -3.2113037109375, -2.734130859375, -2.2569580078125, -1.77978515625, -1.3026123046875, -0.825439453125, -0.3482666015625, 0.12890625, 0.6060791015625, 1.083251953125, 1.5604248046875, 2.03759765625, 2.5147705078125, 2.991943359375, 3.4691162109375, 3.9462890625, 4.4234619140625, 4.900634765625, 5.3778076171875, 5.85498046875, 6.3321533203125, 6.809326171875, 7.2864990234375, 7.763671875, 8.2408447265625, 8.718017578125, 9.1951904296875, 9.67236328125, 10.1495361328125, 10.626708984375, 11.1038818359375, 11.5810546875, 12.0582275390625, 12.535400390625, 13.0125732421875, 13.48974609375, 13.9669189453125, 14.444091796875, 14.9212646484375, 15.3984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 12.0, 10.0, 22.0, 37.0, 35.0, 60.0, 101.0, 145.0, 189.0, 306.0, 442.0, 613.0, 836.0, 1307.0, 1792.0, 2686.0, 3826.0, 5534.0, 8214.0, 11881.0, 17173.0, 24346.0, 34597.0, 47521.0, 63298.0, 79223.0, 94846.0, 104451.0, 106481.0, 99190.0, 85492.0, 69703.0, 54036.0, 39146.0, 27973.0, 19770.0, 13369.0, 9398.0, 6406.0, 4276.0, 3033.0, 2079.0, 1461.0, 975.0, 727.0, 482.0, 341.0, 236.0, 151.0, 122.0, 78.0, 52.0, 31.0, 25.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.0040283203125, -8.695556640625, -8.3870849609375, -8.07861328125, -7.7701416015625, -7.461669921875, -7.1531982421875, -6.8447265625, -6.5362548828125, -6.227783203125, -5.9193115234375, -5.61083984375, -5.3023681640625, -4.993896484375, -4.6854248046875, -4.376953125, -4.0684814453125, -3.760009765625, -3.4515380859375, -3.14306640625, -2.8345947265625, -2.526123046875, -2.2176513671875, -1.9091796875, -1.6007080078125, -1.292236328125, -0.9837646484375, -0.67529296875, -0.3668212890625, -0.058349609375, 0.2501220703125, 0.55859375, 0.8670654296875, 1.175537109375, 1.4840087890625, 1.79248046875, 2.1009521484375, 2.409423828125, 2.7178955078125, 3.0263671875, 3.3348388671875, 3.643310546875, 3.9517822265625, 4.26025390625, 4.5687255859375, 4.877197265625, 5.1856689453125, 5.494140625, 5.8026123046875, 6.111083984375, 6.4195556640625, 6.72802734375, 7.0364990234375, 7.344970703125, 7.6534423828125, 7.9619140625, 8.2703857421875, 8.578857421875, 8.8873291015625, 9.19580078125, 9.5042724609375, 9.812744140625, 10.1212158203125, 10.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 3.0, 8.0, 4.0, 6.0, 8.0, 11.0, 9.0, 11.0, 18.0, 20.0, 15.0, 27.0, 30.0, 30.0, 27.0, 28.0, 36.0, 38.0, 32.0, 40.0, 26.0, 38.0, 48.0, 37.0, 51.0, 37.0, 23.0, 29.0, 26.0, 35.0, 32.0, 27.0, 36.0, 18.0, 20.0, 17.0, 19.0, 13.0, 10.0, 13.0, 6.0, 9.0, 4.0, 2.0, 4.0, 6.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.909912109375, -8.60107421875, -8.292236328125, -7.9833984375, -7.674560546875, -7.36572265625, -7.056884765625, -6.748046875, -6.439208984375, -6.13037109375, -5.821533203125, -5.5126953125, -5.203857421875, -4.89501953125, -4.586181640625, -4.27734375, -3.968505859375, -3.65966796875, -3.350830078125, -3.0419921875, -2.733154296875, -2.42431640625, -2.115478515625, -1.806640625, -1.497802734375, -1.18896484375, -0.880126953125, -0.5712890625, -0.262451171875, 0.04638671875, 0.355224609375, 0.6640625, 0.972900390625, 1.28173828125, 1.590576171875, 1.8994140625, 2.208251953125, 2.51708984375, 2.825927734375, 3.134765625, 3.443603515625, 3.75244140625, 4.061279296875, 4.3701171875, 4.678955078125, 4.98779296875, 5.296630859375, 5.60546875, 5.914306640625, 6.22314453125, 6.531982421875, 6.8408203125, 7.149658203125, 7.45849609375, 7.767333984375, 8.076171875, 8.385009765625, 8.69384765625, 9.002685546875, 9.3115234375, 9.620361328125, 9.92919921875, 10.238037109375, 10.546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 12.0, 8.0, 13.0, 20.0, 14.0, 33.0, 39.0, 63.0, 89.0, 115.0, 141.0, 209.0, 281.0, 441.0, 649.0, 1001.0, 1596.0, 2454.0, 3992.0, 7113.0, 13244.0, 25454.0, 52722.0, 107965.0, 192704.0, 239373.0, 188256.0, 104154.0, 50630.0, 24571.0, 12970.0, 6993.0, 4095.0, 2477.0, 1517.0, 988.0, 700.0, 423.0, 303.0, 192.0, 134.0, 97.0, 86.0, 60.0, 35.0, 32.0, 25.0, 20.0, 12.0, 12.0, 7.0, 3.0, 7.0, 1.0, 1.0, 4.0], "bins": [-7.4375, -7.21533203125, -6.9931640625, -6.77099609375, -6.548828125, -6.32666015625, -6.1044921875, -5.88232421875, -5.66015625, -5.43798828125, -5.2158203125, -4.99365234375, -4.771484375, -4.54931640625, -4.3271484375, -4.10498046875, -3.8828125, -3.66064453125, -3.4384765625, -3.21630859375, -2.994140625, -2.77197265625, -2.5498046875, -2.32763671875, -2.10546875, -1.88330078125, -1.6611328125, -1.43896484375, -1.216796875, -0.99462890625, -0.7724609375, -0.55029296875, -0.328125, -0.10595703125, 0.1162109375, 0.33837890625, 0.560546875, 0.78271484375, 1.0048828125, 1.22705078125, 1.44921875, 1.67138671875, 1.8935546875, 2.11572265625, 2.337890625, 2.56005859375, 2.7822265625, 3.00439453125, 3.2265625, 3.44873046875, 3.6708984375, 3.89306640625, 4.115234375, 4.33740234375, 4.5595703125, 4.78173828125, 5.00390625, 5.22607421875, 5.4482421875, 5.67041015625, 5.892578125, 6.11474609375, 6.3369140625, 6.55908203125, 6.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 12.0, 12.0, 10.0, 19.0, 27.0, 42.0, 37.0, 45.0, 44.0, 39.0, 58.0, 47.0, 85.0, 60.0, 70.0, 63.0, 68.0, 45.0, 33.0, 31.0, 42.0, 24.0, 15.0, 13.0, 13.0, 13.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.0005960464477539062, -0.0005795508623123169, -0.0005630552768707275, -0.0005465596914291382, -0.0005300641059875488, -0.0005135685205459595, -0.0004970729351043701, -0.00048057734966278076, -0.0004640817642211914, -0.00044758617877960205, -0.0004310905933380127, -0.00041459500789642334, -0.000398099422454834, -0.00038160383701324463, -0.0003651082515716553, -0.0003486126661300659, -0.00033211708068847656, -0.0003156214952468872, -0.00029912590980529785, -0.0002826303243637085, -0.00026613473892211914, -0.0002496391534805298, -0.00023314356803894043, -0.00021664798259735107, -0.00020015239715576172, -0.00018365681171417236, -0.000167161226272583, -0.00015066564083099365, -0.0001341700553894043, -0.00011767446994781494, -0.00010117888450622559, -8.468329906463623e-05, -6.818771362304688e-05, -5.169212818145752e-05, -3.5196542739868164e-05, -1.870095729827881e-05, -2.205371856689453e-06, 1.4290213584899902e-05, 3.078579902648926e-05, 4.728138446807861e-05, 6.377696990966797e-05, 8.027255535125732e-05, 9.676814079284668e-05, 0.00011326372623443604, 0.0001297593116760254, 0.00014625489711761475, 0.0001627504825592041, 0.00017924606800079346, 0.0001957416534423828, 0.00021223723888397217, 0.00022873282432556152, 0.0002452284097671509, 0.00026172399520874023, 0.0002782195806503296, 0.00029471516609191895, 0.0003112107515335083, 0.00032770633697509766, 0.000344201922416687, 0.00036069750785827637, 0.0003771930932998657, 0.0003936886787414551, 0.00041018426418304443, 0.0004266798496246338, 0.00044317543506622314, 0.0004596710205078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 12.0, 21.0, 25.0, 51.0, 68.0, 116.0, 147.0, 216.0, 316.0, 472.0, 664.0, 1070.0, 1602.0, 2298.0, 3554.0, 5542.0, 8221.0, 13110.0, 20568.0, 31489.0, 47804.0, 69844.0, 96352.0, 120104.0, 133303.0, 128869.0, 110145.0, 83013.0, 58501.0, 38911.0, 25338.0, 16338.0, 10507.0, 6645.0, 4481.0, 2889.0, 1914.0, 1327.0, 904.0, 589.0, 364.0, 264.0, 190.0, 133.0, 87.0, 65.0, 34.0, 24.0, 12.0, 10.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.4976806640625, -3.380126953125, -3.2625732421875, -3.14501953125, -3.0274658203125, -2.909912109375, -2.7923583984375, -2.6748046875, -2.5572509765625, -2.439697265625, -2.3221435546875, -2.20458984375, -2.0870361328125, -1.969482421875, -1.8519287109375, -1.734375, -1.6168212890625, -1.499267578125, -1.3817138671875, -1.26416015625, -1.1466064453125, -1.029052734375, -0.9114990234375, -0.7939453125, -0.6763916015625, -0.558837890625, -0.4412841796875, -0.32373046875, -0.2061767578125, -0.088623046875, 0.0289306640625, 0.146484375, 0.2640380859375, 0.381591796875, 0.4991455078125, 0.61669921875, 0.7342529296875, 0.851806640625, 0.9693603515625, 1.0869140625, 1.2044677734375, 1.322021484375, 1.4395751953125, 1.55712890625, 1.6746826171875, 1.792236328125, 1.9097900390625, 2.02734375, 2.1448974609375, 2.262451171875, 2.3800048828125, 2.49755859375, 2.6151123046875, 2.732666015625, 2.8502197265625, 2.9677734375, 3.0853271484375, 3.202880859375, 3.3204345703125, 3.43798828125, 3.5555419921875, 3.673095703125, 3.7906494140625, 3.908203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 7.0, 1.0, 3.0, 5.0, 8.0, 6.0, 9.0, 3.0, 16.0, 10.0, 11.0, 11.0, 10.0, 20.0, 22.0, 18.0, 33.0, 27.0, 42.0, 33.0, 49.0, 46.0, 42.0, 37.0, 41.0, 44.0, 47.0, 41.0, 44.0, 44.0, 35.0, 32.0, 34.0, 25.0, 16.0, 20.0, 11.0, 22.0, 15.0, 10.0, 8.0, 7.0, 8.0, 7.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.04296875, -1.97589111328125, -1.9088134765625, -1.84173583984375, -1.774658203125, -1.70758056640625, -1.6405029296875, -1.57342529296875, -1.50634765625, -1.43927001953125, -1.3721923828125, -1.30511474609375, -1.238037109375, -1.17095947265625, -1.1038818359375, -1.03680419921875, -0.9697265625, -0.90264892578125, -0.8355712890625, -0.76849365234375, -0.701416015625, -0.63433837890625, -0.5672607421875, -0.50018310546875, -0.43310546875, -0.36602783203125, -0.2989501953125, -0.23187255859375, -0.164794921875, -0.09771728515625, -0.0306396484375, 0.03643798828125, 0.103515625, 0.17059326171875, 0.2376708984375, 0.30474853515625, 0.371826171875, 0.43890380859375, 0.5059814453125, 0.57305908203125, 0.64013671875, 0.70721435546875, 0.7742919921875, 0.84136962890625, 0.908447265625, 0.97552490234375, 1.0426025390625, 1.10968017578125, 1.1767578125, 1.24383544921875, 1.3109130859375, 1.37799072265625, 1.445068359375, 1.51214599609375, 1.5792236328125, 1.64630126953125, 1.71337890625, 1.78045654296875, 1.8475341796875, 1.91461181640625, 1.981689453125, 2.04876708984375, 2.1158447265625, 2.18292236328125, 2.25]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 14.0, 9.0, 15.0, 16.0, 23.0, 32.0, 33.0, 28.0, 34.0, 44.0, 49.0, 41.0, 54.0, 58.0, 54.0, 44.0, 45.0, 50.0, 37.0, 51.0, 44.0, 26.0, 31.0, 31.0, 16.0, 19.0, 18.0, 8.0, 13.0, 6.0, 10.0, 6.0, 7.0, 3.0, 5.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.811851501464844, -10.398238182067871, -9.984625816345215, -9.571012496948242, -9.157400131225586, -8.743786811828613, -8.33017349243164, -7.916560649871826, -7.502947807312012, -7.089334964752197, -6.675722122192383, -6.26210880279541, -5.848495960235596, -5.434883117675781, -5.021269798278809, -4.607656955718994, -4.19404411315918, -3.7804312705993652, -3.3668181896209717, -2.953205108642578, -2.5395922660827637, -2.125979423522949, -1.7123663425445557, -1.298753261566162, -0.8851404190063477, -0.47152745723724365, -0.05791449546813965, 0.35569846630096436, 0.7693114280700684, 1.1829242706298828, 1.5965373516082764, 2.01015043258667, 2.4237632751464844, 2.837376117706299, 3.2509891986846924, 3.664602279663086, 4.0782151222229, 4.491827964782715, 4.9054412841796875, 5.319054126739502, 5.732666969299316, 6.146279811859131, 6.559892654418945, 6.973505973815918, 7.387118816375732, 7.800731658935547, 8.21434497833252, 8.627958297729492, 9.041570663452148, 9.455183982849121, 9.868796348571777, 10.28240966796875, 10.696022033691406, 11.109635353088379, 11.523248672485352, 11.936861038208008, 12.35047435760498, 12.764087677001953, 13.17770004272461, 13.591313362121582, 14.004926681518555, 14.418539047241211, 14.832152366638184, 15.245765686035156, 15.659378051757812]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 10.0, 15.0, 28.0, 14.0, 15.0, 15.0, 29.0, 37.0, 21.0, 33.0, 30.0, 41.0, 43.0, 44.0, 34.0, 40.0, 28.0, 38.0, 47.0, 35.0, 34.0, 34.0, 40.0, 34.0, 28.0, 36.0, 16.0, 25.0, 26.0, 17.0, 17.0, 15.0, 14.0, 5.0, 6.0, 8.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.490605354309082, -13.988265991210938, -13.485925674438477, -12.983586311340332, -12.481246948242188, -11.978906631469727, -11.476567268371582, -10.974227905273438, -10.471887588500977, -9.969548225402832, -9.467207908630371, -8.964868545532227, -8.462528228759766, -7.960188865661621, -7.457849502563477, -6.955509662628174, -6.453169822692871, -5.950829982757568, -5.448490142822266, -4.946150779724121, -4.443810939788818, -3.9414710998535156, -3.439131498336792, -2.9367918968200684, -2.4344520568847656, -1.9321123361587524, -1.4297726154327393, -0.9274328947067261, -0.4250931739807129, 0.07724666595458984, 0.5795862674713135, 1.081925868988037, 1.5842647552490234, 2.086604595184326, 2.58894419670105, 3.0912837982177734, 3.593623638153076, 4.095963478088379, 4.598302841186523, 5.100642681121826, 5.602982521057129, 6.105322360992432, 6.607662200927734, 7.110001564025879, 7.612341403961182, 8.114681243896484, 8.617020606994629, 9.119359970092773, 9.621700286865234, 10.124039649963379, 10.62637996673584, 11.128719329833984, 11.631059646606445, 12.13339900970459, 12.635738372802734, 13.138078689575195, 13.64041805267334, 14.142757415771484, 14.645097732543945, 15.14743709564209, 15.649776458740234, 16.152116775512695, 16.654457092285156, 17.156795501708984, 17.659135818481445]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 14.0, 14.0, 20.0, 46.0, 61.0, 78.0, 108.0, 219.0, 276.0, 444.0, 613.0, 971.0, 1440.0, 2094.0, 3293.0, 5153.0, 7858.0, 12364.0, 19598.0, 31483.0, 50663.0, 82289.0, 131702.0, 207337.0, 305804.0, 418320.0, 515781.0, 553286.0, 519474.0, 427737.0, 315580.0, 214322.0, 137435.0, 85495.0, 52963.0, 32919.0, 20589.0, 12930.0, 8239.0, 5247.0, 3461.0, 2273.0, 1451.0, 961.0, 684.0, 394.0, 290.0, 173.0, 102.0, 78.0, 61.0, 27.0, 31.0, 10.0, 13.0, 5.0, 5.0, 3.0], "bins": [-8.6484375, -8.390625, -8.1328125, -7.875, -7.6171875, -7.359375, -7.1015625, -6.84375, -6.5859375, -6.328125, -6.0703125, -5.8125, -5.5546875, -5.296875, -5.0390625, -4.78125, -4.5234375, -4.265625, -4.0078125, -3.75, -3.4921875, -3.234375, -2.9765625, -2.71875, -2.4609375, -2.203125, -1.9453125, -1.6875, -1.4296875, -1.171875, -0.9140625, -0.65625, -0.3984375, -0.140625, 0.1171875, 0.375, 0.6328125, 0.890625, 1.1484375, 1.40625, 1.6640625, 1.921875, 2.1796875, 2.4375, 2.6953125, 2.953125, 3.2109375, 3.46875, 3.7265625, 3.984375, 4.2421875, 4.5, 4.7578125, 5.015625, 5.2734375, 5.53125, 5.7890625, 6.046875, 6.3046875, 6.5625, 6.8203125, 7.078125, 7.3359375, 7.59375, 7.8515625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 3.0, 7.0, 10.0, 17.0, 13.0, 14.0, 20.0, 22.0, 25.0, 26.0, 25.0, 36.0, 41.0, 32.0, 41.0, 41.0, 39.0, 42.0, 40.0, 33.0, 44.0, 38.0, 35.0, 37.0, 39.0, 32.0, 28.0, 32.0, 30.0, 28.0, 26.0, 19.0, 14.0, 8.0, 6.0, 12.0, 5.0, 12.0, 7.0, 8.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4140625, -12.01318359375, -11.6123046875, -11.21142578125, -10.810546875, -10.40966796875, -10.0087890625, -9.60791015625, -9.20703125, -8.80615234375, -8.4052734375, -8.00439453125, -7.603515625, -7.20263671875, -6.8017578125, -6.40087890625, -6.0, -5.59912109375, -5.1982421875, -4.79736328125, -4.396484375, -3.99560546875, -3.5947265625, -3.19384765625, -2.79296875, -2.39208984375, -1.9912109375, -1.59033203125, -1.189453125, -0.78857421875, -0.3876953125, 0.01318359375, 0.4140625, 0.81494140625, 1.2158203125, 1.61669921875, 2.017578125, 2.41845703125, 2.8193359375, 3.22021484375, 3.62109375, 4.02197265625, 4.4228515625, 4.82373046875, 5.224609375, 5.62548828125, 6.0263671875, 6.42724609375, 6.828125, 7.22900390625, 7.6298828125, 8.03076171875, 8.431640625, 8.83251953125, 9.2333984375, 9.63427734375, 10.03515625, 10.43603515625, 10.8369140625, 11.23779296875, 11.638671875, 12.03955078125, 12.4404296875, 12.84130859375, 13.2421875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 8.0, 8.0, 23.0, 36.0, 32.0, 74.0, 136.0, 210.0, 354.0, 566.0, 912.0, 1638.0, 2755.0, 4820.0, 8719.0, 16124.0, 28492.0, 50508.0, 88833.0, 151479.0, 245287.0, 370160.0, 502563.0, 597817.0, 602021.0, 514072.0, 380864.0, 254074.0, 157611.0, 92589.0, 53244.0, 29703.0, 16780.0, 9377.0, 5228.0, 2989.0, 1741.0, 994.0, 539.0, 377.0, 192.0, 127.0, 93.0, 39.0, 21.0, 22.0, 9.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.380126953125, -9.05712890625, -8.734130859375, -8.4111328125, -8.088134765625, -7.76513671875, -7.442138671875, -7.119140625, -6.796142578125, -6.47314453125, -6.150146484375, -5.8271484375, -5.504150390625, -5.18115234375, -4.858154296875, -4.53515625, -4.212158203125, -3.88916015625, -3.566162109375, -3.2431640625, -2.920166015625, -2.59716796875, -2.274169921875, -1.951171875, -1.628173828125, -1.30517578125, -0.982177734375, -0.6591796875, -0.336181640625, -0.01318359375, 0.309814453125, 0.6328125, 0.955810546875, 1.27880859375, 1.601806640625, 1.9248046875, 2.247802734375, 2.57080078125, 2.893798828125, 3.216796875, 3.539794921875, 3.86279296875, 4.185791015625, 4.5087890625, 4.831787109375, 5.15478515625, 5.477783203125, 5.80078125, 6.123779296875, 6.44677734375, 6.769775390625, 7.0927734375, 7.415771484375, 7.73876953125, 8.061767578125, 8.384765625, 8.707763671875, 9.03076171875, 9.353759765625, 9.6767578125, 9.999755859375, 10.32275390625, 10.645751953125, 10.96875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 14.0, 11.0, 26.0, 30.0, 49.0, 52.0, 72.0, 93.0, 105.0, 111.0, 150.0, 183.0, 228.0, 232.0, 244.0, 267.0, 239.0, 242.0, 255.0, 239.0, 200.0, 185.0, 163.0, 145.0, 113.0, 83.0, 81.0, 68.0, 42.0, 30.0, 23.0, 13.0, 25.0, 16.0, 16.0, 8.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.79742431640625, -4.6104736328125, -4.42352294921875, -4.236572265625, -4.04962158203125, -3.8626708984375, -3.67572021484375, -3.48876953125, -3.30181884765625, -3.1148681640625, -2.92791748046875, -2.740966796875, -2.55401611328125, -2.3670654296875, -2.18011474609375, -1.9931640625, -1.80621337890625, -1.6192626953125, -1.43231201171875, -1.245361328125, -1.05841064453125, -0.8714599609375, -0.68450927734375, -0.49755859375, -0.31060791015625, -0.1236572265625, 0.06329345703125, 0.250244140625, 0.43719482421875, 0.6241455078125, 0.81109619140625, 0.998046875, 1.18499755859375, 1.3719482421875, 1.55889892578125, 1.745849609375, 1.93280029296875, 2.1197509765625, 2.30670166015625, 2.49365234375, 2.68060302734375, 2.8675537109375, 3.05450439453125, 3.241455078125, 3.42840576171875, 3.6153564453125, 3.80230712890625, 3.9892578125, 4.17620849609375, 4.3631591796875, 4.55010986328125, 4.737060546875, 4.92401123046875, 5.1109619140625, 5.29791259765625, 5.48486328125, 5.67181396484375, 5.8587646484375, 6.04571533203125, 6.232666015625, 6.41961669921875, 6.6065673828125, 6.79351806640625, 6.98046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 12.0, 10.0, 18.0, 28.0, 26.0, 17.0, 37.0, 43.0, 59.0, 46.0, 51.0, 53.0, 59.0, 53.0, 52.0, 51.0, 52.0, 41.0, 47.0, 32.0, 28.0, 23.0, 34.0, 20.0, 15.0, 17.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953963279724121, -10.547334671020508, -10.140706062316895, -9.734077453613281, -9.327449798583984, -8.920821189880371, -8.514192581176758, -8.107563972473145, -7.700935363769531, -7.294306755065918, -6.887678623199463, -6.48105001449585, -6.074421405792236, -5.667793273925781, -5.261164665222168, -4.854536056518555, -4.4479079246521, -4.041279315948486, -3.634650945663452, -3.228022575378418, -2.8213939666748047, -2.4147655963897705, -2.0081372261047363, -1.601508617401123, -1.1948802471160889, -0.7882517576217651, -0.3816233277320862, 0.025005102157592773, 0.4316335916519165, 0.8382620811462402, 1.2448904514312744, 1.6515190601348877, 2.058147430419922, 2.464775800704956, 2.8714044094085693, 3.2780327796936035, 3.684661388397217, 4.091289520263672, 4.497918128967285, 4.904546737670898, 5.311175346374512, 5.717803955078125, 6.12443208694458, 6.531060695648193, 6.937689304351807, 7.344317436218262, 7.750946044921875, 8.157574653625488, 8.564203262329102, 8.970831871032715, 9.377460479736328, 9.784088134765625, 10.190716743469238, 10.597345352172852, 11.003973960876465, 11.410602569580078, 11.817230224609375, 12.223858833312988, 12.630487442016602, 13.037115097045898, 13.443743705749512, 13.850372314453125, 14.257000923156738, 14.663629531860352, 15.070258140563965]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 6.0, 14.0, 10.0, 17.0, 19.0, 22.0, 25.0, 23.0, 18.0, 24.0, 32.0, 24.0, 39.0, 29.0, 29.0, 38.0, 44.0, 40.0, 36.0, 41.0, 45.0, 40.0, 45.0, 43.0, 27.0, 25.0, 39.0, 24.0, 22.0, 15.0, 22.0, 7.0, 19.0, 23.0, 17.0, 8.0, 15.0, 9.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.626860618591309, -13.16612720489502, -12.70539379119873, -12.244660377502441, -11.783927917480469, -11.32319450378418, -10.86246109008789, -10.401727676391602, -9.940994262695312, -9.480260848999023, -9.019527435302734, -8.558794021606445, -8.098060607910156, -7.637327671051025, -7.1765947341918945, -6.7158613204956055, -6.255127906799316, -5.794394493103027, -5.333661079406738, -4.872928142547607, -4.412194728851318, -3.9514613151550293, -3.4907281398773193, -3.0299949645996094, -2.5692615509033203, -2.1085281372070312, -1.6477949619293213, -1.1870616674423218, -0.7263283729553223, -0.2655949592590332, 0.19513821601867676, 0.6558713912963867, 1.1166038513183594, 1.5773371458053589, 2.0380704402923584, 2.4988036155700684, 2.9595370292663574, 3.4202704429626465, 3.8810036182403564, 4.341736793518066, 4.8024702072143555, 5.2632036209106445, 5.723937034606934, 6.1846699714660645, 6.6454033851623535, 7.106136798858643, 7.566869735717773, 8.027603149414062, 8.488336563110352, 8.94906997680664, 9.40980339050293, 9.870536804199219, 10.331270217895508, 10.792003631591797, 11.25273609161377, 11.713469505310059, 12.174202919006348, 12.634936332702637, 13.095669746398926, 13.556403160095215, 14.017135620117188, 14.477869033813477, 14.938602447509766, 15.399335861206055, 15.860069274902344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 15.0, 13.0, 26.0, 33.0, 30.0, 57.0, 84.0, 135.0, 190.0, 243.0, 386.0, 567.0, 829.0, 1332.0, 2097.0, 3232.0, 5067.0, 7947.0, 12123.0, 18597.0, 28522.0, 42054.0, 61377.0, 84995.0, 111009.0, 129466.0, 131809.0, 115328.0, 90620.0, 66390.0, 45525.0, 31083.0, 20318.0, 13044.0, 8449.0, 5316.0, 3509.0, 2210.0, 1543.0, 973.0, 639.0, 441.0, 295.0, 189.0, 146.0, 83.0, 62.0, 49.0, 38.0, 22.0, 12.0, 12.0, 9.0, 6.0, 6.0, 4.0, 0.0, 1.0], "bins": [-6.86328125, -6.64947509765625, -6.4356689453125, -6.22186279296875, -6.008056640625, -5.79425048828125, -5.5804443359375, -5.36663818359375, -5.15283203125, -4.93902587890625, -4.7252197265625, -4.51141357421875, -4.297607421875, -4.08380126953125, -3.8699951171875, -3.65618896484375, -3.4423828125, -3.22857666015625, -3.0147705078125, -2.80096435546875, -2.587158203125, -2.37335205078125, -2.1595458984375, -1.94573974609375, -1.73193359375, -1.51812744140625, -1.3043212890625, -1.09051513671875, -0.876708984375, -0.66290283203125, -0.4490966796875, -0.23529052734375, -0.021484375, 0.19232177734375, 0.4061279296875, 0.61993408203125, 0.833740234375, 1.04754638671875, 1.2613525390625, 1.47515869140625, 1.68896484375, 1.90277099609375, 2.1165771484375, 2.33038330078125, 2.544189453125, 2.75799560546875, 2.9718017578125, 3.18560791015625, 3.3994140625, 3.61322021484375, 3.8270263671875, 4.04083251953125, 4.254638671875, 4.46844482421875, 4.6822509765625, 4.89605712890625, 5.10986328125, 5.32366943359375, 5.5374755859375, 5.75128173828125, 5.965087890625, 6.17889404296875, 6.3927001953125, 6.60650634765625, 6.8203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 7.0, 12.0, 11.0, 22.0, 14.0, 28.0, 28.0, 17.0, 20.0, 29.0, 32.0, 42.0, 41.0, 36.0, 28.0, 40.0, 52.0, 51.0, 46.0, 38.0, 42.0, 47.0, 37.0, 35.0, 25.0, 28.0, 26.0, 17.0, 25.0, 32.0, 13.0, 11.0, 25.0, 10.0, 10.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -14.065185546875, -13.56787109375, -13.070556640625, -12.5732421875, -12.075927734375, -11.57861328125, -11.081298828125, -10.583984375, -10.086669921875, -9.58935546875, -9.092041015625, -8.5947265625, -8.097412109375, -7.60009765625, -7.102783203125, -6.60546875, -6.108154296875, -5.61083984375, -5.113525390625, -4.6162109375, -4.118896484375, -3.62158203125, -3.124267578125, -2.626953125, -2.129638671875, -1.63232421875, -1.135009765625, -0.6376953125, -0.140380859375, 0.35693359375, 0.854248046875, 1.3515625, 1.848876953125, 2.34619140625, 2.843505859375, 3.3408203125, 3.838134765625, 4.33544921875, 4.832763671875, 5.330078125, 5.827392578125, 6.32470703125, 6.822021484375, 7.3193359375, 7.816650390625, 8.31396484375, 8.811279296875, 9.30859375, 9.805908203125, 10.30322265625, 10.800537109375, 11.2978515625, 11.795166015625, 12.29248046875, 12.789794921875, 13.287109375, 13.784423828125, 14.28173828125, 14.779052734375, 15.2763671875, 15.773681640625, 16.27099609375, 16.768310546875, 17.265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 4.0, 7.0, 5.0, 13.0, 19.0, 27.0, 44.0, 67.0, 116.0, 169.0, 224.0, 365.0, 543.0, 791.0, 1313.0, 2125.0, 3412.0, 5652.0, 9615.0, 16691.0, 29552.0, 52402.0, 88788.0, 143284.0, 189563.0, 182927.0, 131351.0, 80300.0, 45827.0, 26258.0, 14923.0, 8775.0, 4935.0, 3141.0, 1959.0, 1190.0, 720.0, 487.0, 325.0, 207.0, 157.0, 99.0, 63.0, 35.0, 29.0, 24.0, 21.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.1805419921875, -7.915771484375, -7.6510009765625, -7.38623046875, -7.1214599609375, -6.856689453125, -6.5919189453125, -6.3271484375, -6.0623779296875, -5.797607421875, -5.5328369140625, -5.26806640625, -5.0032958984375, -4.738525390625, -4.4737548828125, -4.208984375, -3.9442138671875, -3.679443359375, -3.4146728515625, -3.14990234375, -2.8851318359375, -2.620361328125, -2.3555908203125, -2.0908203125, -1.8260498046875, -1.561279296875, -1.2965087890625, -1.03173828125, -0.7669677734375, -0.502197265625, -0.2374267578125, 0.02734375, 0.2921142578125, 0.556884765625, 0.8216552734375, 1.08642578125, 1.3511962890625, 1.615966796875, 1.8807373046875, 2.1455078125, 2.4102783203125, 2.675048828125, 2.9398193359375, 3.20458984375, 3.4693603515625, 3.734130859375, 3.9989013671875, 4.263671875, 4.5284423828125, 4.793212890625, 5.0579833984375, 5.32275390625, 5.5875244140625, 5.852294921875, 6.1170654296875, 6.3818359375, 6.6466064453125, 6.911376953125, 7.1761474609375, 7.44091796875, 7.7056884765625, 7.970458984375, 8.2352294921875, 8.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 17.0, 20.0, 21.0, 24.0, 23.0, 30.0, 31.0, 24.0, 21.0, 27.0, 32.0, 44.0, 46.0, 32.0, 32.0, 42.0, 30.0, 31.0, 35.0, 49.0, 35.0, 33.0, 33.0, 28.0, 27.0, 26.0, 27.0, 24.0, 20.0, 27.0, 12.0, 12.0, 5.0, 7.0, 5.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.6209716796875, -12.218505859375, -11.8160400390625, -11.41357421875, -11.0111083984375, -10.608642578125, -10.2061767578125, -9.8037109375, -9.4012451171875, -8.998779296875, -8.5963134765625, -8.19384765625, -7.7913818359375, -7.388916015625, -6.9864501953125, -6.583984375, -6.1815185546875, -5.779052734375, -5.3765869140625, -4.97412109375, -4.5716552734375, -4.169189453125, -3.7667236328125, -3.3642578125, -2.9617919921875, -2.559326171875, -2.1568603515625, -1.75439453125, -1.3519287109375, -0.949462890625, -0.5469970703125, -0.14453125, 0.2579345703125, 0.660400390625, 1.0628662109375, 1.46533203125, 1.8677978515625, 2.270263671875, 2.6727294921875, 3.0751953125, 3.4776611328125, 3.880126953125, 4.2825927734375, 4.68505859375, 5.0875244140625, 5.489990234375, 5.8924560546875, 6.294921875, 6.6973876953125, 7.099853515625, 7.5023193359375, 7.90478515625, 8.3072509765625, 8.709716796875, 9.1121826171875, 9.5146484375, 9.9171142578125, 10.319580078125, 10.7220458984375, 11.12451171875, 11.5269775390625, 11.929443359375, 12.3319091796875, 12.734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 19.0, 33.0, 54.0, 59.0, 88.0, 123.0, 207.0, 282.0, 400.0, 638.0, 990.0, 1533.0, 2418.0, 3712.0, 6104.0, 9904.0, 17089.0, 30545.0, 55084.0, 104423.0, 201206.0, 263332.0, 161061.0, 83527.0, 44470.0, 24781.0, 14062.0, 8380.0, 5078.0, 3176.0, 2024.0, 1250.0, 798.0, 546.0, 383.0, 217.0, 183.0, 108.0, 74.0, 57.0, 28.0, 21.0, 24.0, 16.0, 9.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.390625, -5.223876953125, -5.05712890625, -4.890380859375, -4.7236328125, -4.556884765625, -4.39013671875, -4.223388671875, -4.056640625, -3.889892578125, -3.72314453125, -3.556396484375, -3.3896484375, -3.222900390625, -3.05615234375, -2.889404296875, -2.72265625, -2.555908203125, -2.38916015625, -2.222412109375, -2.0556640625, -1.888916015625, -1.72216796875, -1.555419921875, -1.388671875, -1.221923828125, -1.05517578125, -0.888427734375, -0.7216796875, -0.554931640625, -0.38818359375, -0.221435546875, -0.0546875, 0.112060546875, 0.27880859375, 0.445556640625, 0.6123046875, 0.779052734375, 0.94580078125, 1.112548828125, 1.279296875, 1.446044921875, 1.61279296875, 1.779541015625, 1.9462890625, 2.113037109375, 2.27978515625, 2.446533203125, 2.61328125, 2.780029296875, 2.94677734375, 3.113525390625, 3.2802734375, 3.447021484375, 3.61376953125, 3.780517578125, 3.947265625, 4.114013671875, 4.28076171875, 4.447509765625, 4.6142578125, 4.781005859375, 4.94775390625, 5.114501953125, 5.28125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 6.0, 11.0, 8.0, 11.0, 20.0, 26.0, 35.0, 32.0, 38.0, 56.0, 58.0, 69.0, 78.0, 79.0, 80.0, 71.0, 59.0, 51.0, 41.0, 27.0, 24.0, 22.0, 19.0, 16.0, 11.0, 6.0, 5.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000885009765625, -0.0008589848875999451, -0.0008329600095748901, -0.0008069351315498352, -0.0007809102535247803, -0.0007548853754997253, -0.0007288604974746704, -0.0007028356194496155, -0.0006768107414245605, -0.0006507858633995056, -0.0006247609853744507, -0.0005987361073493958, -0.0005727112293243408, -0.0005466863512992859, -0.000520661473274231, -0.000494636595249176, -0.0004686117172241211, -0.00044258683919906616, -0.00041656196117401123, -0.0003905370831489563, -0.00036451220512390137, -0.00033848732709884644, -0.0003124624490737915, -0.00028643757104873657, -0.00026041269302368164, -0.0002343878149986267, -0.00020836293697357178, -0.00018233805894851685, -0.00015631318092346191, -0.00013028830289840698, -0.00010426342487335205, -7.823854684829712e-05, -5.221366882324219e-05, -2.6188790798187256e-05, -1.6391277313232422e-07, 2.5860965251922607e-05, 5.188584327697754e-05, 7.791072130203247e-05, 0.0001039355993270874, 0.00012996047735214233, 0.00015598535537719727, 0.0001820102334022522, 0.00020803511142730713, 0.00023405998945236206, 0.000260084867477417, 0.0002861097455024719, 0.00031213462352752686, 0.0003381595015525818, 0.0003641843795776367, 0.00039020925760269165, 0.0004162341356277466, 0.0004422590136528015, 0.00046828389167785645, 0.0004943087697029114, 0.0005203336477279663, 0.0005463585257530212, 0.0005723834037780762, 0.0005984082818031311, 0.000624433159828186, 0.000650458037853241, 0.0006764829158782959, 0.0007025077939033508, 0.0007285326719284058, 0.0007545575499534607, 0.0007805824279785156]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 7.0, 13.0, 17.0, 26.0, 45.0, 72.0, 126.0, 174.0, 315.0, 442.0, 684.0, 1063.0, 1721.0, 2757.0, 4420.0, 7038.0, 11442.0, 18302.0, 30210.0, 49338.0, 80662.0, 126558.0, 177962.0, 182233.0, 133191.0, 85105.0, 52068.0, 31639.0, 19436.0, 11818.0, 7175.0, 4593.0, 2846.0, 1789.0, 1221.0, 699.0, 472.0, 301.0, 205.0, 125.0, 89.0, 44.0, 33.0, 25.0, 25.0, 9.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.34765625, -5.19061279296875, -5.0335693359375, -4.87652587890625, -4.719482421875, -4.56243896484375, -4.4053955078125, -4.24835205078125, -4.09130859375, -3.93426513671875, -3.7772216796875, -3.62017822265625, -3.463134765625, -3.30609130859375, -3.1490478515625, -2.99200439453125, -2.8349609375, -2.67791748046875, -2.5208740234375, -2.36383056640625, -2.206787109375, -2.04974365234375, -1.8927001953125, -1.73565673828125, -1.57861328125, -1.42156982421875, -1.2645263671875, -1.10748291015625, -0.950439453125, -0.79339599609375, -0.6363525390625, -0.47930908203125, -0.322265625, -0.16522216796875, -0.0081787109375, 0.14886474609375, 0.305908203125, 0.46295166015625, 0.6199951171875, 0.77703857421875, 0.93408203125, 1.09112548828125, 1.2481689453125, 1.40521240234375, 1.562255859375, 1.71929931640625, 1.8763427734375, 2.03338623046875, 2.1904296875, 2.34747314453125, 2.5045166015625, 2.66156005859375, 2.818603515625, 2.97564697265625, 3.1326904296875, 3.28973388671875, 3.44677734375, 3.60382080078125, 3.7608642578125, 3.91790771484375, 4.074951171875, 4.23199462890625, 4.3890380859375, 4.54608154296875, 4.703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 6.0, 6.0, 7.0, 15.0, 14.0, 24.0, 19.0, 23.0, 36.0, 39.0, 42.0, 58.0, 52.0, 51.0, 77.0, 64.0, 65.0, 57.0, 52.0, 47.0, 40.0, 37.0, 28.0, 27.0, 17.0, 14.0, 16.0, 13.0, 8.0, 4.0, 12.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.486328125, -2.39752197265625, -2.3087158203125, -2.21990966796875, -2.131103515625, -2.04229736328125, -1.9534912109375, -1.86468505859375, -1.77587890625, -1.68707275390625, -1.5982666015625, -1.50946044921875, -1.420654296875, -1.33184814453125, -1.2430419921875, -1.15423583984375, -1.0654296875, -0.97662353515625, -0.8878173828125, -0.79901123046875, -0.710205078125, -0.62139892578125, -0.5325927734375, -0.44378662109375, -0.35498046875, -0.26617431640625, -0.1773681640625, -0.08856201171875, 0.000244140625, 0.08905029296875, 0.1778564453125, 0.26666259765625, 0.35546875, 0.44427490234375, 0.5330810546875, 0.62188720703125, 0.710693359375, 0.79949951171875, 0.8883056640625, 0.97711181640625, 1.06591796875, 1.15472412109375, 1.2435302734375, 1.33233642578125, 1.421142578125, 1.50994873046875, 1.5987548828125, 1.68756103515625, 1.7763671875, 1.86517333984375, 1.9539794921875, 2.04278564453125, 2.131591796875, 2.22039794921875, 2.3092041015625, 2.39801025390625, 2.48681640625, 2.57562255859375, 2.6644287109375, 2.75323486328125, 2.842041015625, 2.93084716796875, 3.0196533203125, 3.10845947265625, 3.197265625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 1.0, 11.0, 8.0, 9.0, 14.0, 16.0, 21.0, 36.0, 32.0, 38.0, 48.0, 45.0, 46.0, 54.0, 61.0, 48.0, 64.0, 48.0, 44.0, 47.0, 54.0, 37.0, 18.0, 23.0, 30.0, 21.0, 30.0, 11.0, 16.0, 7.0, 16.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.770179748535156, -13.36972713470459, -12.969274520874023, -12.568821907043457, -12.16836929321289, -11.76791763305664, -11.367464065551758, -10.967012405395508, -10.566559791564941, -10.166107177734375, -9.765654563903809, -9.365201950073242, -8.964749336242676, -8.56429672241211, -8.16384506225586, -7.763392448425293, -7.362939357757568, -6.962486743927002, -6.5620341300964355, -6.161581993103027, -5.761129379272461, -5.3606767654418945, -4.960224151611328, -4.559771537780762, -4.159318923950195, -3.758866310119629, -3.3584139347076416, -2.957961320877075, -2.557508945465088, -2.1570563316345215, -1.756603717803955, -1.3561513423919678, -0.9556989669799805, -0.5552464723587036, -0.15479391813278198, 0.24565863609313965, 0.6461111307144165, 1.0465636253356934, 1.4470162391662598, 1.847468614578247, 2.2479212284088135, 2.64837384223938, 3.048826217651367, 3.4492788314819336, 3.8497314453125, 4.250184059143066, 4.650636672973633, 5.051088809967041, 5.451541423797607, 5.851994037628174, 6.25244665145874, 6.652898788452148, 7.053351402282715, 7.453804016113281, 7.854256629943848, 8.254709243774414, 8.65516185760498, 9.055614471435547, 9.456067085266113, 9.85651969909668, 10.256972312927246, 10.657424926757812, 11.057876586914062, 11.458329200744629, 11.858781814575195]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 6.0, 16.0, 17.0, 20.0, 16.0, 24.0, 24.0, 22.0, 29.0, 37.0, 31.0, 37.0, 32.0, 40.0, 33.0, 39.0, 39.0, 40.0, 43.0, 49.0, 32.0, 48.0, 41.0, 37.0, 26.0, 27.0, 27.0, 17.0, 17.0, 15.0, 13.0, 13.0, 15.0, 14.0, 13.0, 12.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.615378379821777, -15.127413749694824, -14.639449119567871, -14.151484489440918, -13.663519859313965, -13.175555229187012, -12.687590599060059, -12.199625968933105, -11.711661338806152, -11.2236967086792, -10.735732078552246, -10.247767448425293, -9.75980281829834, -9.271838188171387, -8.783873558044434, -8.29590892791748, -7.8079447746276855, -7.319980144500732, -6.832015514373779, -6.344050884246826, -5.856086254119873, -5.368122100830078, -4.880157470703125, -4.392192840576172, -3.9042279720306396, -3.4162633419036865, -2.9282987117767334, -2.4403343200683594, -1.9523695707321167, -1.4644050598144531, -0.9764404296875, -0.4884757995605469, -0.00051116943359375, 0.487453430891037, 0.9754180312156677, 1.463382601737976, 1.9513472318649292, 2.4393117427825928, 2.927276372909546, 3.415241003036499, 3.903205633163452, 4.391170024871826, 4.879134654998779, 5.367099285125732, 5.8550639152526855, 6.343028545379639, 6.830993175506592, 7.318957805633545, 7.806922435760498, 8.294886589050293, 8.782851219177246, 9.2708158493042, 9.758780479431152, 10.246745109558105, 10.734709739685059, 11.222674369812012, 11.710638999938965, 12.198603630065918, 12.686568260192871, 13.174532890319824, 13.662497520446777, 14.15046215057373, 14.638426780700684, 15.126391410827637, 15.61435604095459]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 9.0, 15.0, 23.0, 48.0, 53.0, 92.0, 137.0, 228.0, 365.0, 562.0, 925.0, 1371.0, 2174.0, 3518.0, 5372.0, 8637.0, 13460.0, 21068.0, 31744.0, 46213.0, 64865.0, 86154.0, 105441.0, 117915.0, 119222.0, 108889.0, 90701.0, 69309.0, 50549.0, 34818.0, 23104.0, 15227.0, 9716.0, 6183.0, 3798.0, 2477.0, 1530.0, 937.0, 637.0, 371.0, 250.0, 163.0, 103.0, 58.0, 49.0, 29.0, 14.0, 15.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.6171875, -9.30810546875, -8.9990234375, -8.68994140625, -8.380859375, -8.07177734375, -7.7626953125, -7.45361328125, -7.14453125, -6.83544921875, -6.5263671875, -6.21728515625, -5.908203125, -5.59912109375, -5.2900390625, -4.98095703125, -4.671875, -4.36279296875, -4.0537109375, -3.74462890625, -3.435546875, -3.12646484375, -2.8173828125, -2.50830078125, -2.19921875, -1.89013671875, -1.5810546875, -1.27197265625, -0.962890625, -0.65380859375, -0.3447265625, -0.03564453125, 0.2734375, 0.58251953125, 0.8916015625, 1.20068359375, 1.509765625, 1.81884765625, 2.1279296875, 2.43701171875, 2.74609375, 3.05517578125, 3.3642578125, 3.67333984375, 3.982421875, 4.29150390625, 4.6005859375, 4.90966796875, 5.21875, 5.52783203125, 5.8369140625, 6.14599609375, 6.455078125, 6.76416015625, 7.0732421875, 7.38232421875, 7.69140625, 8.00048828125, 8.3095703125, 8.61865234375, 8.927734375, 9.23681640625, 9.5458984375, 9.85498046875, 10.1640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 7.0, 6.0, 14.0, 9.0, 15.0, 21.0, 14.0, 21.0, 24.0, 35.0, 25.0, 37.0, 26.0, 28.0, 41.0, 46.0, 35.0, 37.0, 27.0, 35.0, 55.0, 43.0, 45.0, 48.0, 35.0, 34.0, 26.0, 27.0, 32.0, 19.0, 21.0, 15.0, 13.0, 15.0, 12.0, 14.0, 9.0, 9.0, 11.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.98583984375, -13.5185546875, -13.05126953125, -12.583984375, -12.11669921875, -11.6494140625, -11.18212890625, -10.71484375, -10.24755859375, -9.7802734375, -9.31298828125, -8.845703125, -8.37841796875, -7.9111328125, -7.44384765625, -6.9765625, -6.50927734375, -6.0419921875, -5.57470703125, -5.107421875, -4.64013671875, -4.1728515625, -3.70556640625, -3.23828125, -2.77099609375, -2.3037109375, -1.83642578125, -1.369140625, -0.90185546875, -0.4345703125, 0.03271484375, 0.5, 0.96728515625, 1.4345703125, 1.90185546875, 2.369140625, 2.83642578125, 3.3037109375, 3.77099609375, 4.23828125, 4.70556640625, 5.1728515625, 5.64013671875, 6.107421875, 6.57470703125, 7.0419921875, 7.50927734375, 7.9765625, 8.44384765625, 8.9111328125, 9.37841796875, 9.845703125, 10.31298828125, 10.7802734375, 11.24755859375, 11.71484375, 12.18212890625, 12.6494140625, 13.11669921875, 13.583984375, 14.05126953125, 14.5185546875, 14.98583984375, 15.453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 1.0, 7.0, 4.0, 4.0, 1.0, 15.0, 15.0, 26.0, 33.0, 64.0, 110.0, 191.0, 314.0, 533.0, 911.0, 1547.0, 2396.0, 4019.0, 6790.0, 11085.0, 18416.0, 29557.0, 47088.0, 70328.0, 98551.0, 126387.0, 140348.0, 135417.0, 113952.0, 84992.0, 58537.0, 37188.0, 23259.0, 14508.0, 8607.0, 5350.0, 3159.0, 1915.0, 1156.0, 689.0, 428.0, 233.0, 158.0, 96.0, 71.0, 33.0, 28.0, 15.0, 12.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.359375, -11.95751953125, -11.5556640625, -11.15380859375, -10.751953125, -10.35009765625, -9.9482421875, -9.54638671875, -9.14453125, -8.74267578125, -8.3408203125, -7.93896484375, -7.537109375, -7.13525390625, -6.7333984375, -6.33154296875, -5.9296875, -5.52783203125, -5.1259765625, -4.72412109375, -4.322265625, -3.92041015625, -3.5185546875, -3.11669921875, -2.71484375, -2.31298828125, -1.9111328125, -1.50927734375, -1.107421875, -0.70556640625, -0.3037109375, 0.09814453125, 0.5, 0.90185546875, 1.3037109375, 1.70556640625, 2.107421875, 2.50927734375, 2.9111328125, 3.31298828125, 3.71484375, 4.11669921875, 4.5185546875, 4.92041015625, 5.322265625, 5.72412109375, 6.1259765625, 6.52783203125, 6.9296875, 7.33154296875, 7.7333984375, 8.13525390625, 8.537109375, 8.93896484375, 9.3408203125, 9.74267578125, 10.14453125, 10.54638671875, 10.9482421875, 11.35009765625, 11.751953125, 12.15380859375, 12.5556640625, 12.95751953125, 13.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 13.0, 12.0, 15.0, 14.0, 12.0, 28.0, 25.0, 17.0, 28.0, 22.0, 26.0, 39.0, 34.0, 39.0, 28.0, 35.0, 32.0, 47.0, 64.0, 43.0, 48.0, 34.0, 40.0, 28.0, 41.0, 36.0, 26.0, 25.0, 17.0, 26.0, 21.0, 19.0, 8.0, 14.0, 5.0, 10.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.760009765625, -9.41845703125, -9.076904296875, -8.7353515625, -8.393798828125, -8.05224609375, -7.710693359375, -7.369140625, -7.027587890625, -6.68603515625, -6.344482421875, -6.0029296875, -5.661376953125, -5.31982421875, -4.978271484375, -4.63671875, -4.295166015625, -3.95361328125, -3.612060546875, -3.2705078125, -2.928955078125, -2.58740234375, -2.245849609375, -1.904296875, -1.562744140625, -1.22119140625, -0.879638671875, -0.5380859375, -0.196533203125, 0.14501953125, 0.486572265625, 0.828125, 1.169677734375, 1.51123046875, 1.852783203125, 2.1943359375, 2.535888671875, 2.87744140625, 3.218994140625, 3.560546875, 3.902099609375, 4.24365234375, 4.585205078125, 4.9267578125, 5.268310546875, 5.60986328125, 5.951416015625, 6.29296875, 6.634521484375, 6.97607421875, 7.317626953125, 7.6591796875, 8.000732421875, 8.34228515625, 8.683837890625, 9.025390625, 9.366943359375, 9.70849609375, 10.050048828125, 10.3916015625, 10.733154296875, 11.07470703125, 11.416259765625, 11.7578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 3.0, 5.0, 8.0, 14.0, 29.0, 28.0, 27.0, 76.0, 97.0, 105.0, 183.0, 256.0, 381.0, 557.0, 880.0, 1349.0, 2102.0, 3440.0, 5657.0, 9387.0, 16315.0, 29674.0, 56475.0, 107841.0, 182880.0, 224799.0, 178509.0, 104212.0, 54827.0, 28664.0, 15834.0, 9106.0, 5478.0, 3299.0, 2080.0, 1364.0, 859.0, 552.0, 394.0, 245.0, 183.0, 104.0, 91.0, 46.0, 46.0, 29.0, 19.0, 11.0, 13.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.296875, -8.04901123046875, -7.8011474609375, -7.55328369140625, -7.305419921875, -7.05755615234375, -6.8096923828125, -6.56182861328125, -6.31396484375, -6.06610107421875, -5.8182373046875, -5.57037353515625, -5.322509765625, -5.07464599609375, -4.8267822265625, -4.57891845703125, -4.3310546875, -4.08319091796875, -3.8353271484375, -3.58746337890625, -3.339599609375, -3.09173583984375, -2.8438720703125, -2.59600830078125, -2.34814453125, -2.10028076171875, -1.8524169921875, -1.60455322265625, -1.356689453125, -1.10882568359375, -0.8609619140625, -0.61309814453125, -0.365234375, -0.11737060546875, 0.1304931640625, 0.37835693359375, 0.626220703125, 0.87408447265625, 1.1219482421875, 1.36981201171875, 1.61767578125, 1.86553955078125, 2.1134033203125, 2.36126708984375, 2.609130859375, 2.85699462890625, 3.1048583984375, 3.35272216796875, 3.6005859375, 3.84844970703125, 4.0963134765625, 4.34417724609375, 4.592041015625, 4.83990478515625, 5.0877685546875, 5.33563232421875, 5.58349609375, 5.83135986328125, 6.0792236328125, 6.32708740234375, 6.574951171875, 6.82281494140625, 7.0706787109375, 7.31854248046875, 7.56640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 9.0, 15.0, 20.0, 24.0, 35.0, 43.0, 54.0, 62.0, 63.0, 71.0, 91.0, 80.0, 68.0, 61.0, 61.0, 48.0, 32.0, 39.0, 24.0, 19.0, 12.0, 10.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006737709045410156, -0.0006503835320472717, -0.0006269961595535278, -0.0006036087870597839, -0.00058022141456604, -0.0005568340420722961, -0.0005334466695785522, -0.0005100592970848083, -0.00048667192459106445, -0.00046328455209732056, -0.00043989717960357666, -0.00041650980710983276, -0.00039312243461608887, -0.00036973506212234497, -0.0003463476896286011, -0.0003229603171348572, -0.0002995729446411133, -0.0002761855721473694, -0.0002527981996536255, -0.0002294108271598816, -0.0002060234546661377, -0.0001826360821723938, -0.0001592487096786499, -0.000135861337184906, -0.00011247396469116211, -8.908659219741821e-05, -6.569921970367432e-05, -4.231184720993042e-05, -1.8924474716186523e-05, 4.462897777557373e-06, 2.785027027130127e-05, 5.1237642765045166e-05, 7.462501525878906e-05, 9.801238775253296e-05, 0.00012139976024627686, 0.00014478713274002075, 0.00016817450523376465, 0.00019156187772750854, 0.00021494925022125244, 0.00023833662271499634, 0.00026172399520874023, 0.00028511136770248413, 0.00030849874019622803, 0.0003318861126899719, 0.0003552734851837158, 0.0003786608576774597, 0.0004020482301712036, 0.0004254356026649475, 0.0004488229751586914, 0.0004722103476524353, 0.0004955977201461792, 0.0005189850926399231, 0.000542372465133667, 0.0005657598376274109, 0.0005891472101211548, 0.0006125345826148987, 0.0006359219551086426, 0.0006593093276023865, 0.0006826967000961304, 0.0007060840725898743, 0.0007294714450836182, 0.0007528588175773621, 0.000776246190071106, 0.0007996335625648499, 0.0008230209350585938]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 14.0, 28.0, 40.0, 47.0, 102.0, 130.0, 191.0, 267.0, 472.0, 703.0, 1081.0, 1772.0, 2832.0, 4785.0, 8594.0, 15533.0, 28378.0, 51362.0, 89299.0, 138886.0, 179785.0, 179508.0, 138725.0, 89618.0, 51310.0, 28591.0, 15168.0, 8790.0, 4865.0, 2896.0, 1711.0, 1084.0, 720.0, 449.0, 261.0, 208.0, 110.0, 86.0, 56.0, 27.0, 22.0, 18.0, 6.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.729248046875, -5.54443359375, -5.359619140625, -5.1748046875, -4.989990234375, -4.80517578125, -4.620361328125, -4.435546875, -4.250732421875, -4.06591796875, -3.881103515625, -3.6962890625, -3.511474609375, -3.32666015625, -3.141845703125, -2.95703125, -2.772216796875, -2.58740234375, -2.402587890625, -2.2177734375, -2.032958984375, -1.84814453125, -1.663330078125, -1.478515625, -1.293701171875, -1.10888671875, -0.924072265625, -0.7392578125, -0.554443359375, -0.36962890625, -0.184814453125, 0.0, 0.184814453125, 0.36962890625, 0.554443359375, 0.7392578125, 0.924072265625, 1.10888671875, 1.293701171875, 1.478515625, 1.663330078125, 1.84814453125, 2.032958984375, 2.2177734375, 2.402587890625, 2.58740234375, 2.772216796875, 2.95703125, 3.141845703125, 3.32666015625, 3.511474609375, 3.6962890625, 3.881103515625, 4.06591796875, 4.250732421875, 4.435546875, 4.620361328125, 4.80517578125, 4.989990234375, 5.1748046875, 5.359619140625, 5.54443359375, 5.729248046875, 5.9140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 6.0, 13.0, 9.0, 15.0, 11.0, 20.0, 16.0, 31.0, 32.0, 26.0, 41.0, 40.0, 33.0, 46.0, 53.0, 61.0, 65.0, 68.0, 70.0, 52.0, 42.0, 41.0, 39.0, 23.0, 23.0, 29.0, 23.0, 11.0, 15.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.681640625, -2.574188232421875, -2.46673583984375, -2.359283447265625, -2.2518310546875, -2.144378662109375, -2.03692626953125, -1.929473876953125, -1.822021484375, -1.714569091796875, -1.60711669921875, -1.499664306640625, -1.3922119140625, -1.284759521484375, -1.17730712890625, -1.069854736328125, -0.96240234375, -0.854949951171875, -0.74749755859375, -0.640045166015625, -0.5325927734375, -0.425140380859375, -0.31768798828125, -0.210235595703125, -0.102783203125, 0.004669189453125, 0.11212158203125, 0.219573974609375, 0.3270263671875, 0.434478759765625, 0.54193115234375, 0.649383544921875, 0.7568359375, 0.864288330078125, 0.97174072265625, 1.079193115234375, 1.1866455078125, 1.294097900390625, 1.40155029296875, 1.509002685546875, 1.616455078125, 1.723907470703125, 1.83135986328125, 1.938812255859375, 2.0462646484375, 2.153717041015625, 2.26116943359375, 2.368621826171875, 2.47607421875, 2.583526611328125, 2.69097900390625, 2.798431396484375, 2.9058837890625, 3.013336181640625, 3.12078857421875, 3.228240966796875, 3.335693359375, 3.443145751953125, 3.55059814453125, 3.658050537109375, 3.7655029296875, 3.872955322265625, 3.98040771484375, 4.087860107421875, 4.1953125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 6.0, 16.0, 10.0, 13.0, 29.0, 25.0, 31.0, 38.0, 46.0, 43.0, 51.0, 57.0, 50.0, 58.0, 56.0, 50.0, 43.0, 50.0, 56.0, 31.0, 37.0, 36.0, 24.0, 23.0, 19.0, 17.0, 12.0, 12.0, 13.0, 10.0, 7.0, 8.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.619549751281738, -12.207066535949707, -11.794584274291992, -11.382101058959961, -10.96961784362793, -10.557134628295898, -10.144651412963867, -9.732169151306152, -9.319685935974121, -8.90720272064209, -8.494720458984375, -8.082237243652344, -7.6697540283203125, -7.257270812988281, -6.844788074493408, -6.432305335998535, -6.019822120666504, -5.607338905334473, -5.1948561668396, -4.782373428344727, -4.369890213012695, -3.957407236099243, -3.544924259185791, -3.132441282272339, -2.7199583053588867, -2.3074753284454346, -1.8949923515319824, -1.4825093746185303, -1.0700263977050781, -0.657543420791626, -0.24506044387817383, 0.16742253303527832, 0.5799055099487305, 0.9923884868621826, 1.4048714637756348, 1.817354440689087, 2.229837417602539, 2.642320394515991, 3.0548033714294434, 3.4672863483428955, 3.8797693252563477, 4.292252540588379, 4.704735279083252, 5.117218017578125, 5.529701232910156, 5.9421844482421875, 6.3546671867370605, 6.767149925231934, 7.179633140563965, 7.592116355895996, 8.004598617553711, 8.417081832885742, 8.829565048217773, 9.242048263549805, 9.654531478881836, 10.06701374053955, 10.479496955871582, 10.891980171203613, 11.304462432861328, 11.71694564819336, 12.12942886352539, 12.541912078857422, 12.954395294189453, 13.366877555847168, 13.7793607711792]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 10.0, 9.0, 11.0, 16.0, 12.0, 23.0, 23.0, 22.0, 21.0, 28.0, 34.0, 35.0, 34.0, 33.0, 36.0, 40.0, 30.0, 30.0, 36.0, 39.0, 35.0, 40.0, 54.0, 34.0, 32.0, 30.0, 40.0, 25.0, 22.0, 27.0, 28.0, 14.0, 14.0, 16.0, 8.0, 13.0, 9.0, 10.0, 3.0, 3.0, 10.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.739502906799316, -14.261563301086426, -13.783624649047852, -13.305685043334961, -12.82774543762207, -12.34980583190918, -11.871867179870605, -11.393927574157715, -10.91598892211914, -10.43804931640625, -9.960110664367676, -9.482171058654785, -9.004231452941895, -8.52629280090332, -8.04835319519043, -7.570413589477539, -7.092473983764648, -6.614534854888916, -6.136595249176025, -5.658656120300293, -5.180716514587402, -4.70277738571167, -4.2248382568359375, -3.746898889541626, -3.2689595222473145, -2.791020154953003, -2.3130807876586914, -1.835141658782959, -1.3572022914886475, -0.8792629241943359, -0.4013237953186035, 0.07661557197570801, 0.5545539855957031, 1.0324933528900146, 1.5104326009750366, 1.9883718490600586, 2.46631121635437, 2.9442505836486816, 3.422189712524414, 3.9001290798187256, 4.378068447113037, 4.8560075759887695, 5.33394718170166, 5.811886310577393, 6.289825439453125, 6.767765045166016, 7.245704174041748, 7.7236433029174805, 8.201582908630371, 8.679522514343262, 9.157461166381836, 9.635400772094727, 10.113340377807617, 10.591279983520508, 11.069218635559082, 11.547158241271973, 12.025096893310547, 12.503036499023438, 12.980975151062012, 13.458914756774902, 13.936854362487793, 14.414793014526367, 14.892732620239258, 15.370672225952148, 15.848611831665039]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 10.0, 4.0, 11.0, 16.0, 29.0, 36.0, 58.0, 80.0, 140.0, 221.0, 378.0, 583.0, 989.0, 1694.0, 2919.0, 5056.0, 8992.0, 15746.0, 28453.0, 51496.0, 92786.0, 167414.0, 289537.0, 461461.0, 631727.0, 704086.0, 625381.0, 455063.0, 283713.0, 163728.0, 90448.0, 50056.0, 27294.0, 15026.0, 8554.0, 4782.0, 2707.0, 1526.0, 821.0, 501.0, 311.0, 169.0, 100.0, 74.0, 40.0, 29.0, 15.0, 14.0, 16.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4296875, -9.1097412109375, -8.789794921875, -8.4698486328125, -8.14990234375, -7.8299560546875, -7.510009765625, -7.1900634765625, -6.8701171875, -6.5501708984375, -6.230224609375, -5.9102783203125, -5.59033203125, -5.2703857421875, -4.950439453125, -4.6304931640625, -4.310546875, -3.9906005859375, -3.670654296875, -3.3507080078125, -3.03076171875, -2.7108154296875, -2.390869140625, -2.0709228515625, -1.7509765625, -1.4310302734375, -1.111083984375, -0.7911376953125, -0.47119140625, -0.1512451171875, 0.168701171875, 0.4886474609375, 0.80859375, 1.1285400390625, 1.448486328125, 1.7684326171875, 2.08837890625, 2.4083251953125, 2.728271484375, 3.0482177734375, 3.3681640625, 3.6881103515625, 4.008056640625, 4.3280029296875, 4.64794921875, 4.9678955078125, 5.287841796875, 5.6077880859375, 5.927734375, 6.2476806640625, 6.567626953125, 6.8875732421875, 7.20751953125, 7.5274658203125, 7.847412109375, 8.1673583984375, 8.4873046875, 8.8072509765625, 9.127197265625, 9.4471435546875, 9.76708984375, 10.0870361328125, 10.406982421875, 10.7269287109375, 11.046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 3.0, 12.0, 18.0, 20.0, 19.0, 32.0, 23.0, 18.0, 25.0, 31.0, 43.0, 37.0, 40.0, 32.0, 22.0, 36.0, 44.0, 36.0, 31.0, 35.0, 45.0, 37.0, 39.0, 27.0, 36.0, 32.0, 32.0, 32.0, 14.0, 19.0, 15.0, 14.0, 14.0, 14.0, 12.0, 8.0, 6.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.6875, -10.3233642578125, -9.959228515625, -9.5950927734375, -9.23095703125, -8.8668212890625, -8.502685546875, -8.1385498046875, -7.7744140625, -7.4102783203125, -7.046142578125, -6.6820068359375, -6.31787109375, -5.9537353515625, -5.589599609375, -5.2254638671875, -4.861328125, -4.4971923828125, -4.133056640625, -3.7689208984375, -3.40478515625, -3.0406494140625, -2.676513671875, -2.3123779296875, -1.9482421875, -1.5841064453125, -1.219970703125, -0.8558349609375, -0.49169921875, -0.1275634765625, 0.236572265625, 0.6007080078125, 0.96484375, 1.3289794921875, 1.693115234375, 2.0572509765625, 2.42138671875, 2.7855224609375, 3.149658203125, 3.5137939453125, 3.8779296875, 4.2420654296875, 4.606201171875, 4.9703369140625, 5.33447265625, 5.6986083984375, 6.062744140625, 6.4268798828125, 6.791015625, 7.1551513671875, 7.519287109375, 7.8834228515625, 8.24755859375, 8.6116943359375, 8.975830078125, 9.3399658203125, 9.7041015625, 10.0682373046875, 10.432373046875, 10.7965087890625, 11.16064453125, 11.5247802734375, 11.888916015625, 12.2530517578125, 12.6171875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 16.0, 16.0, 29.0, 50.0, 100.0, 152.0, 245.0, 395.0, 718.0, 1250.0, 2153.0, 3964.0, 7703.0, 14357.0, 26901.0, 50749.0, 95135.0, 172369.0, 291367.0, 448658.0, 603786.0, 677466.0, 617342.0, 468946.0, 308734.0, 182456.0, 102236.0, 54700.0, 28900.0, 15320.0, 8270.0, 4302.0, 2366.0, 1320.0, 745.0, 446.0, 253.0, 145.0, 91.0, 47.0, 30.0, 21.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.28125, -10.945068359375, -10.60888671875, -10.272705078125, -9.9365234375, -9.600341796875, -9.26416015625, -8.927978515625, -8.591796875, -8.255615234375, -7.91943359375, -7.583251953125, -7.2470703125, -6.910888671875, -6.57470703125, -6.238525390625, -5.90234375, -5.566162109375, -5.22998046875, -4.893798828125, -4.5576171875, -4.221435546875, -3.88525390625, -3.549072265625, -3.212890625, -2.876708984375, -2.54052734375, -2.204345703125, -1.8681640625, -1.531982421875, -1.19580078125, -0.859619140625, -0.5234375, -0.187255859375, 0.14892578125, 0.485107421875, 0.8212890625, 1.157470703125, 1.49365234375, 1.829833984375, 2.166015625, 2.502197265625, 2.83837890625, 3.174560546875, 3.5107421875, 3.846923828125, 4.18310546875, 4.519287109375, 4.85546875, 5.191650390625, 5.52783203125, 5.864013671875, 6.2001953125, 6.536376953125, 6.87255859375, 7.208740234375, 7.544921875, 7.881103515625, 8.21728515625, 8.553466796875, 8.8896484375, 9.225830078125, 9.56201171875, 9.898193359375, 10.234375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 13.0, 13.0, 14.0, 28.0, 32.0, 29.0, 59.0, 59.0, 83.0, 87.0, 140.0, 133.0, 176.0, 197.0, 219.0, 215.0, 255.0, 239.0, 246.0, 252.0, 225.0, 199.0, 181.0, 167.0, 157.0, 111.0, 99.0, 90.0, 76.0, 53.0, 50.0, 37.0, 36.0, 24.0, 13.0, 16.0, 12.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.768310546875, -4.59912109375, -4.429931640625, -4.2607421875, -4.091552734375, -3.92236328125, -3.753173828125, -3.583984375, -3.414794921875, -3.24560546875, -3.076416015625, -2.9072265625, -2.738037109375, -2.56884765625, -2.399658203125, -2.23046875, -2.061279296875, -1.89208984375, -1.722900390625, -1.5537109375, -1.384521484375, -1.21533203125, -1.046142578125, -0.876953125, -0.707763671875, -0.53857421875, -0.369384765625, -0.2001953125, -0.031005859375, 0.13818359375, 0.307373046875, 0.4765625, 0.645751953125, 0.81494140625, 0.984130859375, 1.1533203125, 1.322509765625, 1.49169921875, 1.660888671875, 1.830078125, 1.999267578125, 2.16845703125, 2.337646484375, 2.5068359375, 2.676025390625, 2.84521484375, 3.014404296875, 3.18359375, 3.352783203125, 3.52197265625, 3.691162109375, 3.8603515625, 4.029541015625, 4.19873046875, 4.367919921875, 4.537109375, 4.706298828125, 4.87548828125, 5.044677734375, 5.2138671875, 5.383056640625, 5.55224609375, 5.721435546875, 5.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 11.0, 9.0, 12.0, 26.0, 26.0, 32.0, 33.0, 42.0, 41.0, 37.0, 46.0, 45.0, 54.0, 62.0, 41.0, 42.0, 48.0, 44.0, 51.0, 43.0, 33.0, 32.0, 40.0, 15.0, 16.0, 24.0, 12.0, 7.0, 16.0, 14.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.007650375366211, -9.644770622253418, -9.281889915466309, -8.919010162353516, -8.556129455566406, -8.193249702453613, -7.83036994934082, -7.467489719390869, -7.104609489440918, -6.741729259490967, -6.378849029541016, -6.015969276428223, -5.6530890464782715, -5.29020881652832, -4.927329063415527, -4.564448833465576, -4.201568603515625, -3.838688373565674, -3.4758083820343018, -3.1129283905029297, -2.7500481605529785, -2.3871679306030273, -2.0242879390716553, -1.6614079475402832, -1.298527717590332, -0.9356476068496704, -0.5727674961090088, -0.20988738536834717, 0.15299272537231445, 0.5158728361129761, 0.8787529468536377, 1.2416329383850098, 1.6045141220092773, 1.967394232749939, 2.3302743434906006, 2.6931543350219727, 3.056034564971924, 3.418914794921875, 3.781794786453247, 4.144674777984619, 4.50755500793457, 4.8704352378845215, 5.233315467834473, 5.596195220947266, 5.959075450897217, 6.321955680847168, 6.684835433959961, 7.047715663909912, 7.410595893859863, 7.7734761238098145, 8.136356353759766, 8.499236106872559, 8.862115859985352, 9.224996566772461, 9.587876319885254, 9.950756072998047, 10.313636779785156, 10.67651653289795, 11.039397239685059, 11.402276992797852, 11.765157699584961, 12.128037452697754, 12.490917205810547, 12.853797912597656, 13.21667766571045]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 14.0, 20.0, 23.0, 22.0, 28.0, 28.0, 30.0, 32.0, 33.0, 28.0, 33.0, 39.0, 52.0, 48.0, 39.0, 42.0, 48.0, 42.0, 30.0, 29.0, 36.0, 32.0, 29.0, 22.0, 25.0, 13.0, 23.0, 12.0, 16.0, 14.0, 10.0, 10.0, 13.0, 8.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.150494575500488, -11.726051330566406, -11.30160903930664, -10.877165794372559, -10.452723503112793, -10.028280258178711, -9.603837966918945, -9.179394721984863, -8.754951477050781, -8.3305082321167, -7.906065940856934, -7.481622695922852, -7.057179927825928, -6.632737159729004, -6.20829439163208, -5.783851623535156, -5.359408855438232, -4.934966087341309, -4.510523319244385, -4.086080551147461, -3.661637306213379, -3.237194538116455, -2.8127517700195312, -2.3883087635040283, -1.9638659954071045, -1.5394231081008911, -1.1149802207946777, -0.6905374526977539, -0.2660945653915405, 0.15834832191467285, 0.5827910900115967, 1.0072340965270996, 1.4316768646240234, 1.8561197519302368, 2.28056263923645, 2.705005407333374, 3.129448413848877, 3.553891181945801, 3.9783339500427246, 4.402776718139648, 4.8272199630737305, 5.251662731170654, 5.676105499267578, 6.10054874420166, 6.524991512298584, 6.949434280395508, 7.373877048492432, 7.7983198165893555, 8.222763061523438, 8.64720630645752, 9.071648597717285, 9.496091842651367, 9.920534133911133, 10.344977378845215, 10.769420623779297, 11.193862915039062, 11.618305206298828, 12.04274845123291, 12.467190742492676, 12.891633987426758, 13.316076278686523, 13.740519523620605, 14.164962768554688, 14.589405059814453, 15.013848304748535]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 4.0, 14.0, 15.0, 21.0, 38.0, 49.0, 76.0, 129.0, 167.0, 236.0, 346.0, 544.0, 766.0, 1158.0, 1606.0, 2538.0, 3898.0, 6216.0, 9844.0, 15403.0, 24451.0, 38594.0, 59485.0, 88208.0, 120500.0, 144761.0, 145031.0, 122605.0, 90936.0, 61795.0, 39911.0, 24975.0, 15952.0, 9825.0, 6258.0, 4162.0, 2654.0, 1809.0, 1123.0, 784.0, 525.0, 377.0, 252.0, 160.0, 112.0, 85.0, 58.0, 41.0, 16.0, 19.0, 14.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.47265625, -5.2841796875, -5.095703125, -4.9072265625, -4.71875, -4.5302734375, -4.341796875, -4.1533203125, -3.96484375, -3.7763671875, -3.587890625, -3.3994140625, -3.2109375, -3.0224609375, -2.833984375, -2.6455078125, -2.45703125, -2.2685546875, -2.080078125, -1.8916015625, -1.703125, -1.5146484375, -1.326171875, -1.1376953125, -0.94921875, -0.7607421875, -0.572265625, -0.3837890625, -0.1953125, -0.0068359375, 0.181640625, 0.3701171875, 0.55859375, 0.7470703125, 0.935546875, 1.1240234375, 1.3125, 1.5009765625, 1.689453125, 1.8779296875, 2.06640625, 2.2548828125, 2.443359375, 2.6318359375, 2.8203125, 3.0087890625, 3.197265625, 3.3857421875, 3.57421875, 3.7626953125, 3.951171875, 4.1396484375, 4.328125, 4.5166015625, 4.705078125, 4.8935546875, 5.08203125, 5.2705078125, 5.458984375, 5.6474609375, 5.8359375, 6.0244140625, 6.212890625, 6.4013671875, 6.58984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 10.0, 6.0, 19.0, 10.0, 19.0, 17.0, 18.0, 29.0, 26.0, 26.0, 36.0, 29.0, 43.0, 37.0, 36.0, 42.0, 47.0, 48.0, 51.0, 43.0, 39.0, 35.0, 36.0, 39.0, 35.0, 26.0, 22.0, 30.0, 18.0, 16.0, 15.0, 17.0, 16.0, 13.0, 10.0, 5.0, 12.0, 10.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.0189208984375, -12.569091796875, -12.1192626953125, -11.66943359375, -11.2196044921875, -10.769775390625, -10.3199462890625, -9.8701171875, -9.4202880859375, -8.970458984375, -8.5206298828125, -8.07080078125, -7.6209716796875, -7.171142578125, -6.7213134765625, -6.271484375, -5.8216552734375, -5.371826171875, -4.9219970703125, -4.47216796875, -4.0223388671875, -3.572509765625, -3.1226806640625, -2.6728515625, -2.2230224609375, -1.773193359375, -1.3233642578125, -0.87353515625, -0.4237060546875, 0.026123046875, 0.4759521484375, 0.92578125, 1.3756103515625, 1.825439453125, 2.2752685546875, 2.72509765625, 3.1749267578125, 3.624755859375, 4.0745849609375, 4.5244140625, 4.9742431640625, 5.424072265625, 5.8739013671875, 6.32373046875, 6.7735595703125, 7.223388671875, 7.6732177734375, 8.123046875, 8.5728759765625, 9.022705078125, 9.4725341796875, 9.92236328125, 10.3721923828125, 10.822021484375, 11.2718505859375, 11.7216796875, 12.1715087890625, 12.621337890625, 13.0711669921875, 13.52099609375, 13.9708251953125, 14.420654296875, 14.8704833984375, 15.3203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 5.0, 13.0, 17.0, 26.0, 41.0, 57.0, 73.0, 126.0, 160.0, 271.0, 397.0, 676.0, 1067.0, 1705.0, 2810.0, 4698.0, 8012.0, 13799.0, 24142.0, 42360.0, 74328.0, 124636.0, 182283.0, 196459.0, 149886.0, 93006.0, 54114.0, 30778.0, 17449.0, 9984.0, 5914.0, 3485.0, 2130.0, 1316.0, 828.0, 491.0, 347.0, 232.0, 134.0, 104.0, 65.0, 32.0, 35.0, 18.0, 8.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.80078125, -6.5828857421875, -6.364990234375, -6.1470947265625, -5.92919921875, -5.7113037109375, -5.493408203125, -5.2755126953125, -5.0576171875, -4.8397216796875, -4.621826171875, -4.4039306640625, -4.18603515625, -3.9681396484375, -3.750244140625, -3.5323486328125, -3.314453125, -3.0965576171875, -2.878662109375, -2.6607666015625, -2.44287109375, -2.2249755859375, -2.007080078125, -1.7891845703125, -1.5712890625, -1.3533935546875, -1.135498046875, -0.9176025390625, -0.69970703125, -0.4818115234375, -0.263916015625, -0.0460205078125, 0.171875, 0.3897705078125, 0.607666015625, 0.8255615234375, 1.04345703125, 1.2613525390625, 1.479248046875, 1.6971435546875, 1.9150390625, 2.1329345703125, 2.350830078125, 2.5687255859375, 2.78662109375, 3.0045166015625, 3.222412109375, 3.4403076171875, 3.658203125, 3.8760986328125, 4.093994140625, 4.3118896484375, 4.52978515625, 4.7476806640625, 4.965576171875, 5.1834716796875, 5.4013671875, 5.6192626953125, 5.837158203125, 6.0550537109375, 6.27294921875, 6.4908447265625, 6.708740234375, 6.9266357421875, 7.14453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 6.0, 5.0, 7.0, 13.0, 18.0, 14.0, 16.0, 22.0, 19.0, 27.0, 15.0, 21.0, 24.0, 27.0, 36.0, 30.0, 32.0, 36.0, 39.0, 54.0, 36.0, 36.0, 39.0, 37.0, 48.0, 37.0, 26.0, 29.0, 24.0, 28.0, 26.0, 24.0, 21.0, 21.0, 20.0, 13.0, 9.0, 12.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-10.765625, -10.4580078125, -10.150390625, -9.8427734375, -9.53515625, -9.2275390625, -8.919921875, -8.6123046875, -8.3046875, -7.9970703125, -7.689453125, -7.3818359375, -7.07421875, -6.7666015625, -6.458984375, -6.1513671875, -5.84375, -5.5361328125, -5.228515625, -4.9208984375, -4.61328125, -4.3056640625, -3.998046875, -3.6904296875, -3.3828125, -3.0751953125, -2.767578125, -2.4599609375, -2.15234375, -1.8447265625, -1.537109375, -1.2294921875, -0.921875, -0.6142578125, -0.306640625, 0.0009765625, 0.30859375, 0.6162109375, 0.923828125, 1.2314453125, 1.5390625, 1.8466796875, 2.154296875, 2.4619140625, 2.76953125, 3.0771484375, 3.384765625, 3.6923828125, 4.0, 4.3076171875, 4.615234375, 4.9228515625, 5.23046875, 5.5380859375, 5.845703125, 6.1533203125, 6.4609375, 6.7685546875, 7.076171875, 7.3837890625, 7.69140625, 7.9990234375, 8.306640625, 8.6142578125, 8.921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 1.0, 9.0, 12.0, 21.0, 33.0, 43.0, 51.0, 76.0, 99.0, 187.0, 258.0, 412.0, 634.0, 1076.0, 1729.0, 3047.0, 5622.0, 11614.0, 25875.0, 68700.0, 211843.0, 413224.0, 192874.0, 62793.0, 24416.0, 11029.0, 5416.0, 2979.0, 1664.0, 1030.0, 587.0, 387.0, 250.0, 175.0, 122.0, 74.0, 53.0, 35.0, 21.0, 24.0, 15.0, 8.0, 6.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.80078125, -4.6431884765625, -4.485595703125, -4.3280029296875, -4.17041015625, -4.0128173828125, -3.855224609375, -3.6976318359375, -3.5400390625, -3.3824462890625, -3.224853515625, -3.0672607421875, -2.90966796875, -2.7520751953125, -2.594482421875, -2.4368896484375, -2.279296875, -2.1217041015625, -1.964111328125, -1.8065185546875, -1.64892578125, -1.4913330078125, -1.333740234375, -1.1761474609375, -1.0185546875, -0.8609619140625, -0.703369140625, -0.5457763671875, -0.38818359375, -0.2305908203125, -0.072998046875, 0.0845947265625, 0.2421875, 0.3997802734375, 0.557373046875, 0.7149658203125, 0.87255859375, 1.0301513671875, 1.187744140625, 1.3453369140625, 1.5029296875, 1.6605224609375, 1.818115234375, 1.9757080078125, 2.13330078125, 2.2908935546875, 2.448486328125, 2.6060791015625, 2.763671875, 2.9212646484375, 3.078857421875, 3.2364501953125, 3.39404296875, 3.5516357421875, 3.709228515625, 3.8668212890625, 4.0244140625, 4.1820068359375, 4.339599609375, 4.4971923828125, 4.65478515625, 4.8123779296875, 4.969970703125, 5.1275634765625, 5.28515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 25.0, 29.0, 32.0, 55.0, 64.0, 91.0, 139.0, 150.0, 104.0, 72.0, 45.0, 45.0, 17.0, 13.0, 18.0, 8.0, 12.0, 5.0, 7.0, 4.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006122589111328125, -0.0005917996168136597, -0.0005713403224945068, -0.000550881028175354, -0.0005304217338562012, -0.0005099624395370483, -0.0004895031452178955, -0.0004690438508987427, -0.00044858455657958984, -0.000428125262260437, -0.0004076659679412842, -0.00038720667362213135, -0.0003667473793029785, -0.0003462880849838257, -0.00032582879066467285, -0.00030536949634552, -0.0002849102020263672, -0.00026445090770721436, -0.00024399161338806152, -0.0002235323190689087, -0.00020307302474975586, -0.00018261373043060303, -0.0001621544361114502, -0.00014169514179229736, -0.00012123584747314453, -0.0001007765531539917, -8.031725883483887e-05, -5.9857964515686035e-05, -3.93986701965332e-05, -1.893937587738037e-05, 1.519918441772461e-06, 2.1979212760925293e-05, 4.2438507080078125e-05, 6.289780139923096e-05, 8.335709571838379e-05, 0.00010381639003753662, 0.00012427568435668945, 0.00014473497867584229, 0.00016519427299499512, 0.00018565356731414795, 0.00020611286163330078, 0.0002265721559524536, 0.00024703145027160645, 0.0002674907445907593, 0.0002879500389099121, 0.00030840933322906494, 0.0003288686275482178, 0.0003493279218673706, 0.00036978721618652344, 0.00039024651050567627, 0.0004107058048248291, 0.00043116509914398193, 0.00045162439346313477, 0.0004720836877822876, 0.0004925429821014404, 0.0005130022764205933, 0.0005334615707397461, 0.0005539208650588989, 0.0005743801593780518, 0.0005948394536972046, 0.0006152987480163574, 0.0006357580423355103, 0.0006562173366546631, 0.0006766766309738159, 0.0006971359252929688]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 21.0, 26.0, 40.0, 41.0, 64.0, 133.0, 220.0, 299.0, 488.0, 740.0, 1182.0, 1969.0, 3454.0, 5864.0, 11349.0, 22063.0, 45554.0, 95990.0, 187613.0, 266394.0, 200179.0, 103601.0, 49393.0, 24113.0, 12204.0, 6423.0, 3484.0, 2149.0, 1301.0, 772.0, 475.0, 328.0, 183.0, 131.0, 108.0, 63.0, 41.0, 20.0, 28.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.5078125, -4.37347412109375, -4.2391357421875, -4.10479736328125, -3.970458984375, -3.83612060546875, -3.7017822265625, -3.56744384765625, -3.43310546875, -3.29876708984375, -3.1644287109375, -3.03009033203125, -2.895751953125, -2.76141357421875, -2.6270751953125, -2.49273681640625, -2.3583984375, -2.22406005859375, -2.0897216796875, -1.95538330078125, -1.821044921875, -1.68670654296875, -1.5523681640625, -1.41802978515625, -1.28369140625, -1.14935302734375, -1.0150146484375, -0.88067626953125, -0.746337890625, -0.61199951171875, -0.4776611328125, -0.34332275390625, -0.208984375, -0.07464599609375, 0.0596923828125, 0.19403076171875, 0.328369140625, 0.46270751953125, 0.5970458984375, 0.73138427734375, 0.86572265625, 1.00006103515625, 1.1343994140625, 1.26873779296875, 1.403076171875, 1.53741455078125, 1.6717529296875, 1.80609130859375, 1.9404296875, 2.07476806640625, 2.2091064453125, 2.34344482421875, 2.477783203125, 2.61212158203125, 2.7464599609375, 2.88079833984375, 3.01513671875, 3.14947509765625, 3.2838134765625, 3.41815185546875, 3.552490234375, 3.68682861328125, 3.8211669921875, 3.95550537109375, 4.08984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 17.0, 17.0, 11.0, 28.0, 37.0, 43.0, 48.0, 60.0, 67.0, 72.0, 83.0, 73.0, 80.0, 60.0, 45.0, 58.0, 40.0, 37.0, 24.0, 19.0, 9.0, 15.0, 8.0, 5.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.798828125, -1.7428436279296875, -1.686859130859375, -1.6308746337890625, -1.57489013671875, -1.5189056396484375, -1.462921142578125, -1.4069366455078125, -1.3509521484375, -1.2949676513671875, -1.238983154296875, -1.1829986572265625, -1.12701416015625, -1.0710296630859375, -1.015045166015625, -0.9590606689453125, -0.903076171875, -0.8470916748046875, -0.791107177734375, -0.7351226806640625, -0.67913818359375, -0.6231536865234375, -0.567169189453125, -0.5111846923828125, -0.4552001953125, -0.3992156982421875, -0.343231201171875, -0.2872467041015625, -0.23126220703125, -0.1752777099609375, -0.119293212890625, -0.0633087158203125, -0.00732421875, 0.0486602783203125, 0.104644775390625, 0.1606292724609375, 0.21661376953125, 0.2725982666015625, 0.328582763671875, 0.3845672607421875, 0.4405517578125, 0.4965362548828125, 0.552520751953125, 0.6085052490234375, 0.66448974609375, 0.7204742431640625, 0.776458740234375, 0.8324432373046875, 0.888427734375, 0.9444122314453125, 1.000396728515625, 1.0563812255859375, 1.11236572265625, 1.1683502197265625, 1.224334716796875, 1.2803192138671875, 1.3363037109375, 1.3922882080078125, 1.448272705078125, 1.5042572021484375, 1.56024169921875, 1.6162261962890625, 1.672210693359375, 1.7281951904296875, 1.7841796875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 12.0, 12.0, 15.0, 24.0, 22.0, 32.0, 31.0, 41.0, 24.0, 52.0, 46.0, 43.0, 52.0, 56.0, 42.0, 54.0, 37.0, 45.0, 45.0, 38.0, 48.0, 31.0, 31.0, 22.0, 25.0, 14.0, 20.0, 13.0, 10.0, 9.0, 6.0, 6.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.850679397583008, -9.4957275390625, -9.140775680541992, -8.785823822021484, -8.430871963500977, -8.075920104980469, -7.720968723297119, -7.366016864776611, -7.0110650062561035, -6.656113147735596, -6.301161289215088, -5.946209907531738, -5.5912580490112305, -5.236306190490723, -4.881354331970215, -4.526402473449707, -4.171450614929199, -3.8164987564086914, -3.4615468978881836, -3.106595277786255, -2.751643419265747, -2.3966915607452393, -2.0417399406433105, -1.6867880821228027, -1.331836223602295, -0.9768844246864319, -0.6219326257705688, -0.2669808864593506, 0.08797097206115723, 0.44292283058166504, 0.7978744506835938, 1.1528263092041016, 1.5077781677246094, 1.8627300262451172, 2.217681884765625, 2.5726335048675537, 2.9275853633880615, 3.2825372219085693, 3.637488842010498, 3.992440700531006, 4.347392559051514, 4.7023444175720215, 5.057296276092529, 5.412247657775879, 5.767199516296387, 6.1221513748168945, 6.477103233337402, 6.83205509185791, 7.187006950378418, 7.541958808898926, 7.896910667419434, 8.251862525939941, 8.60681438446045, 8.961766242980957, 9.316717147827148, 9.671669006347656, 10.026620864868164, 10.381572723388672, 10.73652458190918, 11.091476440429688, 11.446428298950195, 11.801380157470703, 12.156332015991211, 12.511283874511719, 12.866235733032227]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 4.0, 10.0, 7.0, 13.0, 9.0, 13.0, 14.0, 28.0, 27.0, 27.0, 22.0, 27.0, 32.0, 28.0, 39.0, 39.0, 39.0, 47.0, 48.0, 41.0, 29.0, 50.0, 45.0, 37.0, 31.0, 33.0, 32.0, 22.0, 28.0, 15.0, 25.0, 17.0, 17.0, 13.0, 11.0, 17.0, 9.0, 13.0, 6.0, 8.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.599098205566406, -12.174299240112305, -11.749500274658203, -11.324701309204102, -10.89990234375, -10.475103378295898, -10.050305366516113, -9.625506401062012, -9.20070743560791, -8.775908470153809, -8.351109504699707, -7.926311016082764, -7.501512050628662, -7.0767130851745605, -6.651914596557617, -6.227115631103516, -5.802316665649414, -5.3775177001953125, -4.952718734741211, -4.527920246124268, -4.103121280670166, -3.6783223152160645, -3.253523588180542, -2.8287248611450195, -2.403925895690918, -1.979127049446106, -1.554328203201294, -1.129529356956482, -0.7047305107116699, -0.27993154525756836, 0.1448671817779541, 0.5696659088134766, 0.9944658279418945, 1.4192646741867065, 1.8440635204315186, 2.268862247467041, 2.6936612129211426, 3.118460178375244, 3.5432589054107666, 3.968057632446289, 4.392856597900391, 4.817655563354492, 5.242454528808594, 5.667253017425537, 6.092051982879639, 6.51685094833374, 6.941649436950684, 7.366448402404785, 7.791247367858887, 8.216046333312988, 8.64084529876709, 9.065644264221191, 9.490442276000977, 9.915241241455078, 10.34004020690918, 10.764839172363281, 11.189638137817383, 11.614437103271484, 12.039236068725586, 12.464035034179688, 12.888833999633789, 13.31363296508789, 13.738430976867676, 14.163229942321777, 14.588028907775879]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 21.0, 33.0, 43.0, 68.0, 111.0, 163.0, 275.0, 421.0, 573.0, 897.0, 1384.0, 2007.0, 3102.0, 4750.0, 7052.0, 10457.0, 15359.0, 22428.0, 31709.0, 43815.0, 58055.0, 72898.0, 88447.0, 98476.0, 103068.0, 99871.0, 90166.0, 76386.0, 61012.0, 46730.0, 33702.0, 24098.0, 16861.0, 11317.0, 7558.0, 5060.0, 3450.0, 2241.0, 1560.0, 1014.0, 668.0, 412.0, 295.0, 176.0, 119.0, 78.0, 59.0, 33.0, 24.0, 13.0, 7.0, 9.0, 11.0, 0.0, 0.0, 3.0], "bins": [-7.70703125, -7.47064208984375, -7.2342529296875, -6.99786376953125, -6.761474609375, -6.52508544921875, -6.2886962890625, -6.05230712890625, -5.81591796875, -5.57952880859375, -5.3431396484375, -5.10675048828125, -4.870361328125, -4.63397216796875, -4.3975830078125, -4.16119384765625, -3.9248046875, -3.68841552734375, -3.4520263671875, -3.21563720703125, -2.979248046875, -2.74285888671875, -2.5064697265625, -2.27008056640625, -2.03369140625, -1.79730224609375, -1.5609130859375, -1.32452392578125, -1.088134765625, -0.85174560546875, -0.6153564453125, -0.37896728515625, -0.142578125, 0.09381103515625, 0.3302001953125, 0.56658935546875, 0.802978515625, 1.03936767578125, 1.2757568359375, 1.51214599609375, 1.74853515625, 1.98492431640625, 2.2213134765625, 2.45770263671875, 2.694091796875, 2.93048095703125, 3.1668701171875, 3.40325927734375, 3.6396484375, 3.87603759765625, 4.1124267578125, 4.34881591796875, 4.585205078125, 4.82159423828125, 5.0579833984375, 5.29437255859375, 5.53076171875, 5.76715087890625, 6.0035400390625, 6.23992919921875, 6.476318359375, 6.71270751953125, 6.9490966796875, 7.18548583984375, 7.421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 7.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 20.0, 18.0, 24.0, 24.0, 23.0, 19.0, 26.0, 28.0, 36.0, 43.0, 39.0, 42.0, 35.0, 42.0, 44.0, 32.0, 40.0, 46.0, 41.0, 30.0, 26.0, 27.0, 26.0, 34.0, 33.0, 18.0, 18.0, 26.0, 15.0, 11.0, 13.0, 4.0, 14.0, 6.0, 8.0, 6.0, 13.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.1422119140625, -11.737548828125, -11.3328857421875, -10.92822265625, -10.5235595703125, -10.118896484375, -9.7142333984375, -9.3095703125, -8.9049072265625, -8.500244140625, -8.0955810546875, -7.69091796875, -7.2862548828125, -6.881591796875, -6.4769287109375, -6.072265625, -5.6676025390625, -5.262939453125, -4.8582763671875, -4.45361328125, -4.0489501953125, -3.644287109375, -3.2396240234375, -2.8349609375, -2.4302978515625, -2.025634765625, -1.6209716796875, -1.21630859375, -0.8116455078125, -0.406982421875, -0.0023193359375, 0.40234375, 0.8070068359375, 1.211669921875, 1.6163330078125, 2.02099609375, 2.4256591796875, 2.830322265625, 3.2349853515625, 3.6396484375, 4.0443115234375, 4.448974609375, 4.8536376953125, 5.25830078125, 5.6629638671875, 6.067626953125, 6.4722900390625, 6.876953125, 7.2816162109375, 7.686279296875, 8.0909423828125, 8.49560546875, 8.9002685546875, 9.304931640625, 9.7095947265625, 10.1142578125, 10.5189208984375, 10.923583984375, 11.3282470703125, 11.73291015625, 12.1375732421875, 12.542236328125, 12.9468994140625, 13.3515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 5.0, 9.0, 13.0, 17.0, 28.0, 30.0, 40.0, 52.0, 101.0, 152.0, 215.0, 360.0, 523.0, 863.0, 1459.0, 2249.0, 3705.0, 5851.0, 9758.0, 15754.0, 25499.0, 39604.0, 59605.0, 84841.0, 110775.0, 129600.0, 133791.0, 120929.0, 97946.0, 71786.0, 49247.0, 31660.0, 19901.0, 12390.0, 7551.0, 4711.0, 2799.0, 1741.0, 1112.0, 711.0, 434.0, 225.0, 185.0, 114.0, 75.0, 55.0, 30.0, 26.0, 13.0, 12.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.2578125, -10.9290771484375, -10.600341796875, -10.2716064453125, -9.94287109375, -9.6141357421875, -9.285400390625, -8.9566650390625, -8.6279296875, -8.2991943359375, -7.970458984375, -7.6417236328125, -7.31298828125, -6.9842529296875, -6.655517578125, -6.3267822265625, -5.998046875, -5.6693115234375, -5.340576171875, -5.0118408203125, -4.68310546875, -4.3543701171875, -4.025634765625, -3.6968994140625, -3.3681640625, -3.0394287109375, -2.710693359375, -2.3819580078125, -2.05322265625, -1.7244873046875, -1.395751953125, -1.0670166015625, -0.73828125, -0.4095458984375, -0.080810546875, 0.2479248046875, 0.57666015625, 0.9053955078125, 1.234130859375, 1.5628662109375, 1.8916015625, 2.2203369140625, 2.549072265625, 2.8778076171875, 3.20654296875, 3.5352783203125, 3.864013671875, 4.1927490234375, 4.521484375, 4.8502197265625, 5.178955078125, 5.5076904296875, 5.83642578125, 6.1651611328125, 6.493896484375, 6.8226318359375, 7.1513671875, 7.4801025390625, 7.808837890625, 8.1375732421875, 8.46630859375, 8.7950439453125, 9.123779296875, 9.4525146484375, 9.78125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 3.0, 8.0, 4.0, 15.0, 17.0, 24.0, 28.0, 14.0, 25.0, 33.0, 33.0, 29.0, 42.0, 40.0, 38.0, 35.0, 48.0, 37.0, 43.0, 48.0, 32.0, 33.0, 38.0, 42.0, 45.0, 38.0, 27.0, 32.0, 29.0, 23.0, 17.0, 14.0, 11.0, 15.0, 7.0, 4.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-11.46875, -11.1544189453125, -10.840087890625, -10.5257568359375, -10.21142578125, -9.8970947265625, -9.582763671875, -9.2684326171875, -8.9541015625, -8.6397705078125, -8.325439453125, -8.0111083984375, -7.69677734375, -7.3824462890625, -7.068115234375, -6.7537841796875, -6.439453125, -6.1251220703125, -5.810791015625, -5.4964599609375, -5.18212890625, -4.8677978515625, -4.553466796875, -4.2391357421875, -3.9248046875, -3.6104736328125, -3.296142578125, -2.9818115234375, -2.66748046875, -2.3531494140625, -2.038818359375, -1.7244873046875, -1.41015625, -1.0958251953125, -0.781494140625, -0.4671630859375, -0.15283203125, 0.1614990234375, 0.475830078125, 0.7901611328125, 1.1044921875, 1.4188232421875, 1.733154296875, 2.0474853515625, 2.36181640625, 2.6761474609375, 2.990478515625, 3.3048095703125, 3.619140625, 3.9334716796875, 4.247802734375, 4.5621337890625, 4.87646484375, 5.1907958984375, 5.505126953125, 5.8194580078125, 6.1337890625, 6.4481201171875, 6.762451171875, 7.0767822265625, 7.39111328125, 7.7054443359375, 8.019775390625, 8.3341064453125, 8.6484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 7.0, 5.0, 10.0, 13.0, 20.0, 51.0, 59.0, 85.0, 125.0, 196.0, 244.0, 424.0, 553.0, 865.0, 1258.0, 1921.0, 2990.0, 4530.0, 7380.0, 12186.0, 20566.0, 34915.0, 61399.0, 104273.0, 156449.0, 186461.0, 166306.0, 115998.0, 69645.0, 39975.0, 23001.0, 13569.0, 8232.0, 5093.0, 3317.0, 2170.0, 1437.0, 850.0, 629.0, 422.0, 283.0, 203.0, 147.0, 100.0, 55.0, 49.0, 28.0, 29.0, 15.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.91796875, -5.73077392578125, -5.5435791015625, -5.35638427734375, -5.169189453125, -4.98199462890625, -4.7947998046875, -4.60760498046875, -4.42041015625, -4.23321533203125, -4.0460205078125, -3.85882568359375, -3.671630859375, -3.48443603515625, -3.2972412109375, -3.11004638671875, -2.9228515625, -2.73565673828125, -2.5484619140625, -2.36126708984375, -2.174072265625, -1.98687744140625, -1.7996826171875, -1.61248779296875, -1.42529296875, -1.23809814453125, -1.0509033203125, -0.86370849609375, -0.676513671875, -0.48931884765625, -0.3021240234375, -0.11492919921875, 0.072265625, 0.25946044921875, 0.4466552734375, 0.63385009765625, 0.821044921875, 1.00823974609375, 1.1954345703125, 1.38262939453125, 1.56982421875, 1.75701904296875, 1.9442138671875, 2.13140869140625, 2.318603515625, 2.50579833984375, 2.6929931640625, 2.88018798828125, 3.0673828125, 3.25457763671875, 3.4417724609375, 3.62896728515625, 3.816162109375, 4.00335693359375, 4.1905517578125, 4.37774658203125, 4.56494140625, 4.75213623046875, 4.9393310546875, 5.12652587890625, 5.313720703125, 5.50091552734375, 5.6881103515625, 5.87530517578125, 6.0625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 6.0, 15.0, 16.0, 23.0, 17.0, 17.0, 28.0, 38.0, 35.0, 33.0, 55.0, 60.0, 57.0, 52.0, 51.0, 53.0, 50.0, 55.0, 41.0, 47.0, 35.0, 31.0, 35.0, 29.0, 25.0, 14.0, 15.0, 14.0, 9.0, 7.0, 3.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003612041473388672, -0.00034720078110694885, -0.0003331974148750305, -0.0003191940486431122, -0.00030519068241119385, -0.0002911873161792755, -0.0002771839499473572, -0.00026318058371543884, -0.0002491772174835205, -0.00023517385125160217, -0.00022117048501968384, -0.0002071671187877655, -0.00019316375255584717, -0.00017916038632392883, -0.0001651570200920105, -0.00015115365386009216, -0.00013715028762817383, -0.0001231469213962555, -0.00010914355516433716, -9.514018893241882e-05, -8.113682270050049e-05, -6.713345646858215e-05, -5.313009023666382e-05, -3.9126724004745483e-05, -2.512335777282715e-05, -1.1119991540908813e-05, 2.8833746910095215e-06, 1.6886740922927856e-05, 3.089010715484619e-05, 4.4893473386764526e-05, 5.889683961868286e-05, 7.29002058506012e-05, 8.690357208251953e-05, 0.00010090693831443787, 0.0001149103045463562, 0.00012891367077827454, 0.00014291703701019287, 0.0001569204032421112, 0.00017092376947402954, 0.00018492713570594788, 0.0001989305019378662, 0.00021293386816978455, 0.00022693723440170288, 0.00024094060063362122, 0.00025494396686553955, 0.0002689473330974579, 0.0002829506993293762, 0.00029695406556129456, 0.0003109574317932129, 0.0003249607980251312, 0.00033896416425704956, 0.0003529675304889679, 0.00036697089672088623, 0.00038097426295280457, 0.0003949776291847229, 0.00040898099541664124, 0.00042298436164855957, 0.0004369877278804779, 0.00045099109411239624, 0.0004649944603443146, 0.0004789978265762329, 0.0004930011928081512, 0.0005070045590400696, 0.0005210079252719879, 0.0005350112915039062]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 13.0, 15.0, 25.0, 28.0, 34.0, 101.0, 107.0, 189.0, 282.0, 419.0, 664.0, 1040.0, 1669.0, 2904.0, 4889.0, 8669.0, 15428.0, 28034.0, 51339.0, 89787.0, 143149.0, 186319.0, 183595.0, 136613.0, 84590.0, 47821.0, 26406.0, 14627.0, 8045.0, 4666.0, 2646.0, 1652.0, 1008.0, 640.0, 400.0, 256.0, 172.0, 113.0, 68.0, 65.0, 19.0, 17.0, 17.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.335205078125, -5.15087890625, -4.966552734375, -4.7822265625, -4.597900390625, -4.41357421875, -4.229248046875, -4.044921875, -3.860595703125, -3.67626953125, -3.491943359375, -3.3076171875, -3.123291015625, -2.93896484375, -2.754638671875, -2.5703125, -2.385986328125, -2.20166015625, -2.017333984375, -1.8330078125, -1.648681640625, -1.46435546875, -1.280029296875, -1.095703125, -0.911376953125, -0.72705078125, -0.542724609375, -0.3583984375, -0.174072265625, 0.01025390625, 0.194580078125, 0.37890625, 0.563232421875, 0.74755859375, 0.931884765625, 1.1162109375, 1.300537109375, 1.48486328125, 1.669189453125, 1.853515625, 2.037841796875, 2.22216796875, 2.406494140625, 2.5908203125, 2.775146484375, 2.95947265625, 3.143798828125, 3.328125, 3.512451171875, 3.69677734375, 3.881103515625, 4.0654296875, 4.249755859375, 4.43408203125, 4.618408203125, 4.802734375, 4.987060546875, 5.17138671875, 5.355712890625, 5.5400390625, 5.724365234375, 5.90869140625, 6.093017578125, 6.27734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 3.0, 3.0, 7.0, 8.0, 13.0, 17.0, 17.0, 21.0, 20.0, 28.0, 35.0, 50.0, 60.0, 65.0, 48.0, 64.0, 66.0, 66.0, 60.0, 49.0, 67.0, 58.0, 24.0, 27.0, 27.0, 22.0, 17.0, 17.0, 16.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.19921875, -5.0601806640625, -4.921142578125, -4.7821044921875, -4.64306640625, -4.5040283203125, -4.364990234375, -4.2259521484375, -4.0869140625, -3.9478759765625, -3.808837890625, -3.6697998046875, -3.53076171875, -3.3917236328125, -3.252685546875, -3.1136474609375, -2.974609375, -2.8355712890625, -2.696533203125, -2.5574951171875, -2.41845703125, -2.2794189453125, -2.140380859375, -2.0013427734375, -1.8623046875, -1.7232666015625, -1.584228515625, -1.4451904296875, -1.30615234375, -1.1671142578125, -1.028076171875, -0.8890380859375, -0.75, -0.6109619140625, -0.471923828125, -0.3328857421875, -0.19384765625, -0.0548095703125, 0.084228515625, 0.2232666015625, 0.3623046875, 0.5013427734375, 0.640380859375, 0.7794189453125, 0.91845703125, 1.0574951171875, 1.196533203125, 1.3355712890625, 1.474609375, 1.6136474609375, 1.752685546875, 1.8917236328125, 2.03076171875, 2.1697998046875, 2.308837890625, 2.4478759765625, 2.5869140625, 2.7259521484375, 2.864990234375, 3.0040283203125, 3.14306640625, 3.2821044921875, 3.421142578125, 3.5601806640625, 3.69921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 7.0, 6.0, 9.0, 5.0, 8.0, 14.0, 17.0, 11.0, 23.0, 26.0, 34.0, 29.0, 33.0, 42.0, 36.0, 31.0, 43.0, 35.0, 53.0, 52.0, 48.0, 42.0, 44.0, 41.0, 45.0, 33.0, 36.0, 30.0, 32.0, 14.0, 19.0, 13.0, 14.0, 10.0, 8.0, 10.0, 10.0, 8.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.082929611206055, -9.758069038391113, -9.433208465576172, -9.10834789276123, -8.783487319946289, -8.458626747131348, -8.133766174316406, -7.808905601501465, -7.484045028686523, -7.159184455871582, -6.834323883056641, -6.509463310241699, -6.184602737426758, -5.859742164611816, -5.534881591796875, -5.210021018981934, -4.885159969329834, -4.560299396514893, -4.235438823699951, -3.9105782508850098, -3.5857176780700684, -3.260857105255127, -2.9359962940216064, -2.611135721206665, -2.2862751483917236, -1.9614145755767822, -1.6365540027618408, -1.3116933107376099, -0.9868327379226685, -0.661972165107727, -0.3371114730834961, -0.012250900268554688, 0.3126096725463867, 0.6374702453613281, 0.9623308777809143, 1.2871915102005005, 1.612052083015442, 1.9369126558303833, 2.2617733478546143, 2.5866339206695557, 2.911494493484497, 3.2363550662994385, 3.56121563911438, 3.8860764503479004, 4.210937023162842, 4.535797595977783, 4.860658168792725, 5.185518741607666, 5.510379314422607, 5.835239887237549, 6.16010046005249, 6.484961032867432, 6.809821605682373, 7.1346821784973145, 7.459543228149414, 7.7844038009643555, 8.109264373779297, 8.434124946594238, 8.75898551940918, 9.083846092224121, 9.408706665039062, 9.733567237854004, 10.058427810668945, 10.383288383483887, 10.708148956298828]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 9.0, 7.0, 18.0, 20.0, 13.0, 17.0, 15.0, 29.0, 35.0, 29.0, 33.0, 42.0, 39.0, 42.0, 35.0, 42.0, 51.0, 46.0, 48.0, 42.0, 41.0, 35.0, 46.0, 31.0, 32.0, 26.0, 36.0, 22.0, 15.0, 16.0, 8.0, 13.0, 11.0, 9.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.361552238464355, -13.906168937683105, -13.450786590576172, -12.995403289794922, -12.540019989013672, -12.084636688232422, -11.629253387451172, -11.173871040344238, -10.718487739562988, -10.263104438781738, -9.807722091674805, -9.352338790893555, -8.896955490112305, -8.441572189331055, -7.986189365386963, -7.530806541442871, -7.075423240661621, -6.620039939880371, -6.164657115936279, -5.7092742919921875, -5.2538909912109375, -4.7985076904296875, -4.343124866485596, -3.887741804122925, -3.432358741760254, -2.976975679397583, -2.521592617034912, -2.066209554672241, -1.6108264923095703, -1.1554434299468994, -0.7000603675842285, -0.24467730522155762, 0.21070575714111328, 0.6660888195037842, 1.121471881866455, 1.576854944229126, 2.032238006591797, 2.4876210689544678, 2.9430041313171387, 3.3983871936798096, 3.8537702560424805, 4.3091535568237305, 4.764536380767822, 5.219919204711914, 5.675302505493164, 6.130685806274414, 6.586068630218506, 7.041451454162598, 7.496834754943848, 7.952218055725098, 8.407600402832031, 8.862983703613281, 9.318367004394531, 9.773750305175781, 10.229133605957031, 10.684515953063965, 11.139899253845215, 11.595282554626465, 12.050664901733398, 12.506048202514648, 12.961431503295898, 13.416814804077148, 13.872198104858398, 14.327580451965332, 14.782963752746582]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 16.0, 11.0, 43.0, 47.0, 97.0, 160.0, 245.0, 383.0, 659.0, 978.0, 1767.0, 2914.0, 4867.0, 8241.0, 14430.0, 24724.0, 44024.0, 76860.0, 134374.0, 226601.0, 358984.0, 509763.0, 624987.0, 636597.0, 537098.0, 385686.0, 247112.0, 148815.0, 86189.0, 49510.0, 28202.0, 16316.0, 9495.0, 5667.0, 3334.0, 1879.0, 1211.0, 748.0, 470.0, 288.0, 190.0, 123.0, 67.0, 45.0, 25.0, 22.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.5234375, -8.2493896484375, -7.975341796875, -7.7012939453125, -7.42724609375, -7.1531982421875, -6.879150390625, -6.6051025390625, -6.3310546875, -6.0570068359375, -5.782958984375, -5.5089111328125, -5.23486328125, -4.9608154296875, -4.686767578125, -4.4127197265625, -4.138671875, -3.8646240234375, -3.590576171875, -3.3165283203125, -3.04248046875, -2.7684326171875, -2.494384765625, -2.2203369140625, -1.9462890625, -1.6722412109375, -1.398193359375, -1.1241455078125, -0.85009765625, -0.5760498046875, -0.302001953125, -0.0279541015625, 0.24609375, 0.5201416015625, 0.794189453125, 1.0682373046875, 1.34228515625, 1.6163330078125, 1.890380859375, 2.1644287109375, 2.4384765625, 2.7125244140625, 2.986572265625, 3.2606201171875, 3.53466796875, 3.8087158203125, 4.082763671875, 4.3568115234375, 4.630859375, 4.9049072265625, 5.178955078125, 5.4530029296875, 5.72705078125, 6.0010986328125, 6.275146484375, 6.5491943359375, 6.8232421875, 7.0972900390625, 7.371337890625, 7.6453857421875, 7.91943359375, 8.1934814453125, 8.467529296875, 8.7415771484375, 9.015625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 9.0, 10.0, 13.0, 9.0, 18.0, 19.0, 31.0, 25.0, 30.0, 42.0, 34.0, 33.0, 44.0, 32.0, 40.0, 46.0, 53.0, 40.0, 40.0, 40.0, 42.0, 29.0, 40.0, 43.0, 27.0, 27.0, 27.0, 27.0, 16.0, 11.0, 15.0, 11.0, 16.0, 8.0, 10.0, 7.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3310546875, -9.990234375, -9.6494140625, -9.30859375, -8.9677734375, -8.626953125, -8.2861328125, -7.9453125, -7.6044921875, -7.263671875, -6.9228515625, -6.58203125, -6.2412109375, -5.900390625, -5.5595703125, -5.21875, -4.8779296875, -4.537109375, -4.1962890625, -3.85546875, -3.5146484375, -3.173828125, -2.8330078125, -2.4921875, -2.1513671875, -1.810546875, -1.4697265625, -1.12890625, -0.7880859375, -0.447265625, -0.1064453125, 0.234375, 0.5751953125, 0.916015625, 1.2568359375, 1.59765625, 1.9384765625, 2.279296875, 2.6201171875, 2.9609375, 3.3017578125, 3.642578125, 3.9833984375, 4.32421875, 4.6650390625, 5.005859375, 5.3466796875, 5.6875, 6.0283203125, 6.369140625, 6.7099609375, 7.05078125, 7.3916015625, 7.732421875, 8.0732421875, 8.4140625, 8.7548828125, 9.095703125, 9.4365234375, 9.77734375, 10.1181640625, 10.458984375, 10.7998046875, 11.140625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 14.0, 12.0, 18.0, 33.0, 51.0, 68.0, 109.0, 175.0, 283.0, 433.0, 702.0, 1126.0, 1885.0, 3166.0, 5480.0, 9282.0, 15801.0, 26824.0, 46080.0, 77108.0, 125746.0, 196576.0, 291996.0, 401317.0, 500783.0, 550091.0, 529176.0, 447388.0, 337622.0, 235788.0, 152945.0, 95306.0, 57888.0, 34208.0, 20177.0, 11637.0, 6878.0, 3944.0, 2382.0, 1416.0, 859.0, 581.0, 305.0, 238.0, 126.0, 95.0, 57.0, 40.0, 21.0, 14.0, 14.0, 3.0, 2.0, 1.0, 2.0, 4.0], "bins": [-8.6328125, -8.37677001953125, -8.1207275390625, -7.86468505859375, -7.608642578125, -7.35260009765625, -7.0965576171875, -6.84051513671875, -6.58447265625, -6.32843017578125, -6.0723876953125, -5.81634521484375, -5.560302734375, -5.30426025390625, -5.0482177734375, -4.79217529296875, -4.5361328125, -4.28009033203125, -4.0240478515625, -3.76800537109375, -3.511962890625, -3.25592041015625, -2.9998779296875, -2.74383544921875, -2.48779296875, -2.23175048828125, -1.9757080078125, -1.71966552734375, -1.463623046875, -1.20758056640625, -0.9515380859375, -0.69549560546875, -0.439453125, -0.18341064453125, 0.0726318359375, 0.32867431640625, 0.584716796875, 0.84075927734375, 1.0968017578125, 1.35284423828125, 1.60888671875, 1.86492919921875, 2.1209716796875, 2.37701416015625, 2.633056640625, 2.88909912109375, 3.1451416015625, 3.40118408203125, 3.6572265625, 3.91326904296875, 4.1693115234375, 4.42535400390625, 4.681396484375, 4.93743896484375, 5.1934814453125, 5.44952392578125, 5.70556640625, 5.96160888671875, 6.2176513671875, 6.47369384765625, 6.729736328125, 6.98577880859375, 7.2418212890625, 7.49786376953125, 7.75390625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 9.0, 9.0, 14.0, 20.0, 12.0, 30.0, 30.0, 67.0, 70.0, 83.0, 99.0, 121.0, 136.0, 144.0, 183.0, 191.0, 184.0, 220.0, 202.0, 226.0, 211.0, 232.0, 181.0, 186.0, 162.0, 153.0, 144.0, 109.0, 107.0, 83.0, 91.0, 71.0, 50.0, 47.0, 33.0, 36.0, 19.0, 20.0, 18.0, 15.0, 12.0, 8.0, 8.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9921875, -3.85809326171875, -3.7239990234375, -3.58990478515625, -3.455810546875, -3.32171630859375, -3.1876220703125, -3.05352783203125, -2.91943359375, -2.78533935546875, -2.6512451171875, -2.51715087890625, -2.383056640625, -2.24896240234375, -2.1148681640625, -1.98077392578125, -1.8466796875, -1.71258544921875, -1.5784912109375, -1.44439697265625, -1.310302734375, -1.17620849609375, -1.0421142578125, -0.90802001953125, -0.77392578125, -0.63983154296875, -0.5057373046875, -0.37164306640625, -0.237548828125, -0.10345458984375, 0.0306396484375, 0.16473388671875, 0.298828125, 0.43292236328125, 0.5670166015625, 0.70111083984375, 0.835205078125, 0.96929931640625, 1.1033935546875, 1.23748779296875, 1.37158203125, 1.50567626953125, 1.6397705078125, 1.77386474609375, 1.907958984375, 2.04205322265625, 2.1761474609375, 2.31024169921875, 2.4443359375, 2.57843017578125, 2.7125244140625, 2.84661865234375, 2.980712890625, 3.11480712890625, 3.2489013671875, 3.38299560546875, 3.51708984375, 3.65118408203125, 3.7852783203125, 3.91937255859375, 4.053466796875, 4.18756103515625, 4.3216552734375, 4.45574951171875, 4.58984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 7.0, 16.0, 10.0, 23.0, 21.0, 21.0, 30.0, 23.0, 28.0, 38.0, 33.0, 32.0, 39.0, 55.0, 60.0, 38.0, 51.0, 40.0, 45.0, 49.0, 33.0, 47.0, 43.0, 31.0, 21.0, 26.0, 18.0, 23.0, 12.0, 16.0, 8.0, 11.0, 7.0, 3.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.858766555786133, -8.546050071716309, -8.233333587646484, -7.92061710357666, -7.607900619506836, -7.295184135437012, -6.9824676513671875, -6.669751167297363, -6.357034683227539, -6.044318199157715, -5.731601715087891, -5.418885231018066, -5.106168746948242, -4.793452262878418, -4.480735778808594, -4.1680192947387695, -3.8553028106689453, -3.542586326599121, -3.229869842529297, -2.9171533584594727, -2.6044368743896484, -2.291720390319824, -1.97900390625, -1.6662874221801758, -1.3535709381103516, -1.0408544540405273, -0.7281379699707031, -0.4154214859008789, -0.10270500183105469, 0.21001148223876953, 0.5227279663085938, 0.835444450378418, 1.1481609344482422, 1.4608774185180664, 1.7735939025878906, 2.086310386657715, 2.399026870727539, 2.7117433547973633, 3.0244598388671875, 3.3371763229370117, 3.649892807006836, 3.96260929107666, 4.275325775146484, 4.588042259216309, 4.900758743286133, 5.213475227355957, 5.526191711425781, 5.8389081954956055, 6.15162467956543, 6.464341163635254, 6.777057647705078, 7.089774131774902, 7.402490615844727, 7.715207099914551, 8.027923583984375, 8.3406400680542, 8.653356552124023, 8.966073036193848, 9.278789520263672, 9.591506004333496, 9.90422248840332, 10.216938972473145, 10.529655456542969, 10.842371940612793, 11.155088424682617]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 7.0, 10.0, 7.0, 5.0, 9.0, 16.0, 18.0, 22.0, 25.0, 32.0, 26.0, 28.0, 36.0, 47.0, 33.0, 38.0, 47.0, 39.0, 43.0, 32.0, 45.0, 47.0, 51.0, 33.0, 45.0, 31.0, 27.0, 24.0, 31.0, 16.0, 15.0, 20.0, 13.0, 11.0, 15.0, 13.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.650596618652344, -12.258272171020508, -11.865946769714355, -11.47362232208252, -11.081296920776367, -10.688972473144531, -10.296648025512695, -9.90432357788086, -9.511998176574707, -9.119673728942871, -8.727348327636719, -8.335023880004883, -7.942698955535889, -7.5503740310668945, -7.158049583435059, -6.7657246589660645, -6.37339973449707, -5.981074810028076, -5.588749885559082, -5.196425437927246, -4.804100513458252, -4.411775588989258, -4.019451141357422, -3.6271262168884277, -3.2348012924194336, -2.8424763679504395, -2.4501516819000244, -2.0578269958496094, -1.6655020713806152, -1.2731772661209106, -0.880852460861206, -0.488527774810791, -0.09620285034179688, 0.2961219549179077, 0.6884467601776123, 1.080771565437317, 1.4730963706970215, 1.865421175956726, 2.2577459812164307, 2.6500706672668457, 3.04239559173584, 3.434720516204834, 3.827045202255249, 4.219369888305664, 4.611694812774658, 5.004019737243652, 5.396344184875488, 5.788669109344482, 6.180994033813477, 6.573318958282471, 6.965643882751465, 7.357968330383301, 7.750293254852295, 8.142618179321289, 8.534942626953125, 8.927267074584961, 9.319592475891113, 9.71191692352295, 10.104242324829102, 10.496566772460938, 10.888891220092773, 11.281216621398926, 11.673541069030762, 12.065866470336914, 12.45819091796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 10.0, 23.0, 31.0, 45.0, 36.0, 57.0, 95.0, 131.0, 215.0, 300.0, 432.0, 734.0, 1239.0, 2209.0, 4129.0, 7563.0, 14712.0, 28149.0, 53094.0, 92434.0, 145444.0, 186804.0, 183117.0, 137619.0, 86417.0, 48244.0, 25624.0, 13587.0, 7068.0, 3691.0, 2084.0, 1166.0, 708.0, 442.0, 251.0, 173.0, 137.0, 105.0, 61.0, 52.0, 27.0, 24.0, 23.0, 13.0, 9.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.32757568359375, -5.1434326171875, -4.95928955078125, -4.775146484375, -4.59100341796875, -4.4068603515625, -4.22271728515625, -4.03857421875, -3.85443115234375, -3.6702880859375, -3.48614501953125, -3.302001953125, -3.11785888671875, -2.9337158203125, -2.74957275390625, -2.5654296875, -2.38128662109375, -2.1971435546875, -2.01300048828125, -1.828857421875, -1.64471435546875, -1.4605712890625, -1.27642822265625, -1.09228515625, -0.90814208984375, -0.7239990234375, -0.53985595703125, -0.355712890625, -0.17156982421875, 0.0125732421875, 0.19671630859375, 0.380859375, 0.56500244140625, 0.7491455078125, 0.93328857421875, 1.117431640625, 1.30157470703125, 1.4857177734375, 1.66986083984375, 1.85400390625, 2.03814697265625, 2.2222900390625, 2.40643310546875, 2.590576171875, 2.77471923828125, 2.9588623046875, 3.14300537109375, 3.3271484375, 3.51129150390625, 3.6954345703125, 3.87957763671875, 4.063720703125, 4.24786376953125, 4.4320068359375, 4.61614990234375, 4.80029296875, 4.98443603515625, 5.1685791015625, 5.35272216796875, 5.536865234375, 5.72100830078125, 5.9051513671875, 6.08929443359375, 6.2734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 11.0, 8.0, 10.0, 11.0, 18.0, 12.0, 20.0, 22.0, 32.0, 24.0, 35.0, 29.0, 38.0, 39.0, 38.0, 43.0, 42.0, 34.0, 41.0, 53.0, 36.0, 42.0, 41.0, 42.0, 32.0, 25.0, 26.0, 29.0, 15.0, 25.0, 23.0, 18.0, 10.0, 14.0, 13.0, 12.0, 5.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.34375, -11.9522705078125, -11.560791015625, -11.1693115234375, -10.77783203125, -10.3863525390625, -9.994873046875, -9.6033935546875, -9.2119140625, -8.8204345703125, -8.428955078125, -8.0374755859375, -7.64599609375, -7.2545166015625, -6.863037109375, -6.4715576171875, -6.080078125, -5.6885986328125, -5.297119140625, -4.9056396484375, -4.51416015625, -4.1226806640625, -3.731201171875, -3.3397216796875, -2.9482421875, -2.5567626953125, -2.165283203125, -1.7738037109375, -1.38232421875, -0.9908447265625, -0.599365234375, -0.2078857421875, 0.18359375, 0.5750732421875, 0.966552734375, 1.3580322265625, 1.74951171875, 2.1409912109375, 2.532470703125, 2.9239501953125, 3.3154296875, 3.7069091796875, 4.098388671875, 4.4898681640625, 4.88134765625, 5.2728271484375, 5.664306640625, 6.0557861328125, 6.447265625, 6.8387451171875, 7.230224609375, 7.6217041015625, 8.01318359375, 8.4046630859375, 8.796142578125, 9.1876220703125, 9.5791015625, 9.9705810546875, 10.362060546875, 10.7535400390625, 11.14501953125, 11.5364990234375, 11.927978515625, 12.3194580078125, 12.7109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 9.0, 20.0, 31.0, 35.0, 77.0, 120.0, 204.0, 365.0, 672.0, 1294.0, 2694.0, 5753.0, 12734.0, 30481.0, 73076.0, 162016.0, 272312.0, 248960.0, 135380.0, 58243.0, 24201.0, 10647.0, 4703.0, 2129.0, 1120.0, 532.0, 305.0, 175.0, 113.0, 50.0, 35.0, 19.0, 11.0, 12.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.7149658203125, -7.472900390625, -7.2308349609375, -6.98876953125, -6.7467041015625, -6.504638671875, -6.2625732421875, -6.0205078125, -5.7784423828125, -5.536376953125, -5.2943115234375, -5.05224609375, -4.8101806640625, -4.568115234375, -4.3260498046875, -4.083984375, -3.8419189453125, -3.599853515625, -3.3577880859375, -3.11572265625, -2.8736572265625, -2.631591796875, -2.3895263671875, -2.1474609375, -1.9053955078125, -1.663330078125, -1.4212646484375, -1.17919921875, -0.9371337890625, -0.695068359375, -0.4530029296875, -0.2109375, 0.0311279296875, 0.273193359375, 0.5152587890625, 0.75732421875, 0.9993896484375, 1.241455078125, 1.4835205078125, 1.7255859375, 1.9676513671875, 2.209716796875, 2.4517822265625, 2.69384765625, 2.9359130859375, 3.177978515625, 3.4200439453125, 3.662109375, 3.9041748046875, 4.146240234375, 4.3883056640625, 4.63037109375, 4.8724365234375, 5.114501953125, 5.3565673828125, 5.5986328125, 5.8406982421875, 6.082763671875, 6.3248291015625, 6.56689453125, 6.8089599609375, 7.051025390625, 7.2930908203125, 7.53515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 14.0, 22.0, 20.0, 19.0, 20.0, 23.0, 37.0, 29.0, 27.0, 35.0, 29.0, 31.0, 50.0, 43.0, 32.0, 33.0, 40.0, 34.0, 43.0, 42.0, 21.0, 36.0, 31.0, 34.0, 26.0, 26.0, 24.0, 27.0, 14.0, 15.0, 14.0, 18.0, 13.0, 13.0, 9.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.5390625, -9.260009765625, -8.98095703125, -8.701904296875, -8.4228515625, -8.143798828125, -7.86474609375, -7.585693359375, -7.306640625, -7.027587890625, -6.74853515625, -6.469482421875, -6.1904296875, -5.911376953125, -5.63232421875, -5.353271484375, -5.07421875, -4.795166015625, -4.51611328125, -4.237060546875, -3.9580078125, -3.678955078125, -3.39990234375, -3.120849609375, -2.841796875, -2.562744140625, -2.28369140625, -2.004638671875, -1.7255859375, -1.446533203125, -1.16748046875, -0.888427734375, -0.609375, -0.330322265625, -0.05126953125, 0.227783203125, 0.5068359375, 0.785888671875, 1.06494140625, 1.343994140625, 1.623046875, 1.902099609375, 2.18115234375, 2.460205078125, 2.7392578125, 3.018310546875, 3.29736328125, 3.576416015625, 3.85546875, 4.134521484375, 4.41357421875, 4.692626953125, 4.9716796875, 5.250732421875, 5.52978515625, 5.808837890625, 6.087890625, 6.366943359375, 6.64599609375, 6.925048828125, 7.2041015625, 7.483154296875, 7.76220703125, 8.041259765625, 8.3203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 12.0, 20.0, 29.0, 35.0, 36.0, 76.0, 94.0, 138.0, 172.0, 287.0, 429.0, 646.0, 1069.0, 1745.0, 3146.0, 5895.0, 11872.0, 27355.0, 74418.0, 231561.0, 404712.0, 180883.0, 58889.0, 22310.0, 10199.0, 5136.0, 2824.0, 1609.0, 934.0, 661.0, 398.0, 266.0, 217.0, 129.0, 93.0, 74.0, 41.0, 36.0, 24.0, 18.0, 14.0, 6.0, 11.0, 6.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.771484375, -3.651336669921875, -3.53118896484375, -3.411041259765625, -3.2908935546875, -3.170745849609375, -3.05059814453125, -2.930450439453125, -2.810302734375, -2.690155029296875, -2.57000732421875, -2.449859619140625, -2.3297119140625, -2.209564208984375, -2.08941650390625, -1.969268798828125, -1.84912109375, -1.728973388671875, -1.60882568359375, -1.488677978515625, -1.3685302734375, -1.248382568359375, -1.12823486328125, -1.008087158203125, -0.887939453125, -0.767791748046875, -0.64764404296875, -0.527496337890625, -0.4073486328125, -0.287200927734375, -0.16705322265625, -0.046905517578125, 0.0732421875, 0.193389892578125, 0.31353759765625, 0.433685302734375, 0.5538330078125, 0.673980712890625, 0.79412841796875, 0.914276123046875, 1.034423828125, 1.154571533203125, 1.27471923828125, 1.394866943359375, 1.5150146484375, 1.635162353515625, 1.75531005859375, 1.875457763671875, 1.99560546875, 2.115753173828125, 2.23590087890625, 2.356048583984375, 2.4761962890625, 2.596343994140625, 2.71649169921875, 2.836639404296875, 2.956787109375, 3.076934814453125, 3.19708251953125, 3.317230224609375, 3.4373779296875, 3.557525634765625, 3.67767333984375, 3.797821044921875, 3.91796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 5.0, 11.0, 11.0, 12.0, 23.0, 19.0, 27.0, 47.0, 61.0, 96.0, 100.0, 96.0, 122.0, 74.0, 71.0, 35.0, 39.0, 35.0, 25.0, 19.0, 11.0, 7.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00033092498779296875, -0.0003193952143192291, -0.0003078654408454895, -0.0002963356673717499, -0.00028480589389801025, -0.00027327612042427063, -0.000261746346950531, -0.0002502165734767914, -0.00023868680000305176, -0.00022715702652931213, -0.0002156272530555725, -0.00020409747958183289, -0.00019256770610809326, -0.00018103793263435364, -0.00016950815916061401, -0.0001579783856868744, -0.00014644861221313477, -0.00013491883873939514, -0.00012338906526565552, -0.0001118592917919159, -0.00010032951831817627, -8.879974484443665e-05, -7.726997137069702e-05, -6.57401978969574e-05, -5.4210424423217773e-05, -4.268065094947815e-05, -3.1150877475738525e-05, -1.96211040019989e-05, -8.091330528259277e-06, 3.4384429454803467e-06, 1.496821641921997e-05, 2.6497989892959595e-05, 3.802776336669922e-05, 4.955753684043884e-05, 6.108731031417847e-05, 7.261708378791809e-05, 8.414685726165771e-05, 9.567663073539734e-05, 0.00010720640420913696, 0.00011873617768287659, 0.0001302659511566162, 0.00014179572463035583, 0.00015332549810409546, 0.00016485527157783508, 0.0001763850450515747, 0.00018791481852531433, 0.00019944459199905396, 0.00021097436547279358, 0.0002225041389465332, 0.00023403391242027283, 0.00024556368589401245, 0.0002570934593677521, 0.0002686232328414917, 0.0002801530063152313, 0.00029168277978897095, 0.00030321255326271057, 0.0003147423267364502, 0.0003262721002101898, 0.00033780187368392944, 0.00034933164715766907, 0.0003608614206314087, 0.0003723911941051483, 0.00038392096757888794, 0.00039545074105262756, 0.0004069805145263672]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 13.0, 20.0, 20.0, 37.0, 49.0, 61.0, 119.0, 206.0, 255.0, 439.0, 660.0, 1020.0, 1479.0, 2509.0, 3792.0, 6014.0, 10319.0, 17381.0, 30194.0, 51481.0, 87629.0, 135053.0, 176062.0, 175078.0, 134781.0, 87385.0, 51742.0, 30224.0, 17471.0, 10287.0, 6175.0, 3882.0, 2361.0, 1549.0, 925.0, 646.0, 398.0, 295.0, 172.0, 118.0, 86.0, 51.0, 35.0, 30.0, 25.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.517578125, -2.445648193359375, -2.37371826171875, -2.301788330078125, -2.2298583984375, -2.157928466796875, -2.08599853515625, -2.014068603515625, -1.942138671875, -1.870208740234375, -1.79827880859375, -1.726348876953125, -1.6544189453125, -1.582489013671875, -1.51055908203125, -1.438629150390625, -1.36669921875, -1.294769287109375, -1.22283935546875, -1.150909423828125, -1.0789794921875, -1.007049560546875, -0.93511962890625, -0.863189697265625, -0.791259765625, -0.719329833984375, -0.64739990234375, -0.575469970703125, -0.5035400390625, -0.431610107421875, -0.35968017578125, -0.287750244140625, -0.2158203125, -0.143890380859375, -0.07196044921875, -3.0517578125e-05, 0.0718994140625, 0.143829345703125, 0.21575927734375, 0.287689208984375, 0.359619140625, 0.431549072265625, 0.50347900390625, 0.575408935546875, 0.6473388671875, 0.719268798828125, 0.79119873046875, 0.863128662109375, 0.93505859375, 1.006988525390625, 1.07891845703125, 1.150848388671875, 1.2227783203125, 1.294708251953125, 1.36663818359375, 1.438568115234375, 1.510498046875, 1.582427978515625, 1.65435791015625, 1.726287841796875, 1.7982177734375, 1.870147705078125, 1.94207763671875, 2.014007568359375, 2.0859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 9.0, 9.0, 16.0, 15.0, 19.0, 20.0, 16.0, 31.0, 33.0, 35.0, 54.0, 43.0, 56.0, 48.0, 60.0, 51.0, 65.0, 62.0, 54.0, 55.0, 37.0, 33.0, 28.0, 26.0, 22.0, 18.0, 16.0, 19.0, 10.0, 6.0, 8.0, 7.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.11334228515625, -1.0743408203125, -1.03533935546875, -0.996337890625, -0.95733642578125, -0.9183349609375, -0.87933349609375, -0.84033203125, -0.80133056640625, -0.7623291015625, -0.72332763671875, -0.684326171875, -0.64532470703125, -0.6063232421875, -0.56732177734375, -0.5283203125, -0.48931884765625, -0.4503173828125, -0.41131591796875, -0.372314453125, -0.33331298828125, -0.2943115234375, -0.25531005859375, -0.21630859375, -0.17730712890625, -0.1383056640625, -0.09930419921875, -0.060302734375, -0.02130126953125, 0.0177001953125, 0.05670166015625, 0.095703125, 0.13470458984375, 0.1737060546875, 0.21270751953125, 0.251708984375, 0.29071044921875, 0.3297119140625, 0.36871337890625, 0.40771484375, 0.44671630859375, 0.4857177734375, 0.52471923828125, 0.563720703125, 0.60272216796875, 0.6417236328125, 0.68072509765625, 0.7197265625, 0.75872802734375, 0.7977294921875, 0.83673095703125, 0.875732421875, 0.91473388671875, 0.9537353515625, 0.99273681640625, 1.03173828125, 1.07073974609375, 1.1097412109375, 1.14874267578125, 1.187744140625, 1.22674560546875, 1.2657470703125, 1.30474853515625, 1.34375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 11.0, 8.0, 14.0, 14.0, 11.0, 30.0, 35.0, 21.0, 25.0, 28.0, 32.0, 44.0, 35.0, 48.0, 58.0, 42.0, 45.0, 50.0, 53.0, 44.0, 41.0, 53.0, 30.0, 30.0, 28.0, 24.0, 24.0, 21.0, 18.0, 13.0, 14.0, 14.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.833765983581543, -8.515646934509277, -8.197526931762695, -7.87940788269043, -7.561288356781006, -7.243168830871582, -6.925049304962158, -6.606929779052734, -6.288810729980469, -5.970691204071045, -5.652571678161621, -5.3344526290893555, -5.016333103179932, -4.698213577270508, -4.380094051361084, -4.06197452545166, -3.7438549995422363, -3.4257354736328125, -3.1076161861419678, -2.789496660232544, -2.471377372741699, -2.1532578468322754, -1.8351383209228516, -1.5170190334320068, -1.198899507522583, -0.8807801008224487, -0.5626606345176697, -0.24454116821289062, 0.07357823848724365, 0.39169764518737793, 0.7098171710968018, 1.0279364585876465, 1.3460559844970703, 1.6641753911972046, 1.9822947978973389, 2.3004143238067627, 2.6185336112976074, 2.9366531372070312, 3.254772663116455, 3.5728919506073, 3.8910114765167236, 4.209130764007568, 4.527250289916992, 4.845369815826416, 5.16348934173584, 5.4816083908081055, 5.7997283935546875, 6.117847442626953, 6.435966968536377, 6.754086494445801, 7.072206020355225, 7.390325546264648, 7.708444595336914, 8.02656364440918, 8.344683647155762, 8.662802696228027, 8.98092269897461, 9.299041748046875, 9.617161750793457, 9.935280799865723, 10.253400802612305, 10.57151985168457, 10.889638900756836, 11.207758903503418, 11.525877952575684]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 10.0, 5.0, 8.0, 11.0, 23.0, 23.0, 21.0, 25.0, 37.0, 43.0, 24.0, 46.0, 33.0, 40.0, 51.0, 46.0, 39.0, 41.0, 45.0, 36.0, 51.0, 40.0, 35.0, 37.0, 20.0, 25.0, 32.0, 17.0, 17.0, 17.0, 16.0, 8.0, 14.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.05257511138916, -12.656755447387695, -12.26093578338623, -11.865116119384766, -11.469297409057617, -11.073477745056152, -10.677658081054688, -10.281838417053223, -9.886018753051758, -9.490199089050293, -9.094379425048828, -8.69856071472168, -8.302741050720215, -7.90692138671875, -7.511101722717285, -7.11528205871582, -6.719463348388672, -6.323643684387207, -5.9278244972229, -5.5320048332214355, -5.136185646057129, -4.740365982055664, -4.344546318054199, -3.9487268924713135, -3.5529074668884277, -3.157088041305542, -2.7612686157226562, -2.3654489517211914, -1.9696295261383057, -1.57381010055542, -1.177990436553955, -0.7821710109710693, -0.3863515853881836, 0.009467899799346924, 0.40528738498687744, 0.8011069297790527, 1.1969263553619385, 1.5927457809448242, 1.988565444946289, 2.384384870529175, 2.7802042961120605, 3.1760237216949463, 3.571843147277832, 3.967662811279297, 4.363482475280762, 4.759301662445068, 5.155121326446533, 5.55094051361084, 5.946760177612305, 6.3425798416137695, 6.738399028778076, 7.134218692779541, 7.530037879943848, 7.9258575439453125, 8.321677207946777, 8.717496871948242, 9.11331558227539, 9.509135246276855, 9.90495491027832, 10.300773620605469, 10.696593284606934, 11.092412948608398, 11.488232612609863, 11.884052276611328, 12.279871940612793]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 3.0, 1.0, 5.0, 5.0, 9.0, 28.0, 33.0, 51.0, 73.0, 105.0, 162.0, 267.0, 418.0, 675.0, 1008.0, 1652.0, 2617.0, 4361.0, 6815.0, 10953.0, 17102.0, 26662.0, 40290.0, 58076.0, 78590.0, 99834.0, 115940.0, 121732.0, 115227.0, 99538.0, 77686.0, 56868.0, 39494.0, 26254.0, 17259.0, 10837.0, 6610.0, 4221.0, 2547.0, 1700.0, 1015.0, 645.0, 404.0, 285.0, 174.0, 110.0, 73.0, 55.0, 35.0, 15.0, 19.0, 10.0, 7.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.078125, -7.8131103515625, -7.548095703125, -7.2830810546875, -7.01806640625, -6.7530517578125, -6.488037109375, -6.2230224609375, -5.9580078125, -5.6929931640625, -5.427978515625, -5.1629638671875, -4.89794921875, -4.6329345703125, -4.367919921875, -4.1029052734375, -3.837890625, -3.5728759765625, -3.307861328125, -3.0428466796875, -2.77783203125, -2.5128173828125, -2.247802734375, -1.9827880859375, -1.7177734375, -1.4527587890625, -1.187744140625, -0.9227294921875, -0.65771484375, -0.3927001953125, -0.127685546875, 0.1373291015625, 0.40234375, 0.6673583984375, 0.932373046875, 1.1973876953125, 1.46240234375, 1.7274169921875, 1.992431640625, 2.2574462890625, 2.5224609375, 2.7874755859375, 3.052490234375, 3.3175048828125, 3.58251953125, 3.8475341796875, 4.112548828125, 4.3775634765625, 4.642578125, 4.9075927734375, 5.172607421875, 5.4376220703125, 5.70263671875, 5.9676513671875, 6.232666015625, 6.4976806640625, 6.7626953125, 7.0277099609375, 7.292724609375, 7.5577392578125, 7.82275390625, 8.0877685546875, 8.352783203125, 8.6177978515625, 8.8828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 10.0, 6.0, 6.0, 9.0, 13.0, 11.0, 13.0, 18.0, 36.0, 27.0, 22.0, 30.0, 28.0, 35.0, 43.0, 44.0, 42.0, 50.0, 38.0, 46.0, 38.0, 34.0, 33.0, 45.0, 40.0, 34.0, 33.0, 25.0, 37.0, 23.0, 15.0, 13.0, 18.0, 15.0, 14.0, 10.0, 5.0, 6.0, 11.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.890625, -11.524169921875, -11.15771484375, -10.791259765625, -10.4248046875, -10.058349609375, -9.69189453125, -9.325439453125, -8.958984375, -8.592529296875, -8.22607421875, -7.859619140625, -7.4931640625, -7.126708984375, -6.76025390625, -6.393798828125, -6.02734375, -5.660888671875, -5.29443359375, -4.927978515625, -4.5615234375, -4.195068359375, -3.82861328125, -3.462158203125, -3.095703125, -2.729248046875, -2.36279296875, -1.996337890625, -1.6298828125, -1.263427734375, -0.89697265625, -0.530517578125, -0.1640625, 0.202392578125, 0.56884765625, 0.935302734375, 1.3017578125, 1.668212890625, 2.03466796875, 2.401123046875, 2.767578125, 3.134033203125, 3.50048828125, 3.866943359375, 4.2333984375, 4.599853515625, 4.96630859375, 5.332763671875, 5.69921875, 6.065673828125, 6.43212890625, 6.798583984375, 7.1650390625, 7.531494140625, 7.89794921875, 8.264404296875, 8.630859375, 8.997314453125, 9.36376953125, 9.730224609375, 10.0966796875, 10.463134765625, 10.82958984375, 11.196044921875, 11.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 13.0, 14.0, 22.0, 29.0, 58.0, 84.0, 145.0, 233.0, 394.0, 614.0, 1100.0, 1793.0, 2931.0, 5069.0, 8083.0, 13445.0, 21641.0, 34178.0, 52487.0, 75951.0, 101609.0, 123694.0, 133397.0, 126354.0, 106905.0, 81357.0, 57086.0, 38079.0, 23969.0, 15005.0, 9095.0, 5480.0, 3164.0, 1956.0, 1215.0, 721.0, 484.0, 263.0, 159.0, 104.0, 55.0, 48.0, 30.0, 17.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.66455078125, -9.3681640625, -9.07177734375, -8.775390625, -8.47900390625, -8.1826171875, -7.88623046875, -7.58984375, -7.29345703125, -6.9970703125, -6.70068359375, -6.404296875, -6.10791015625, -5.8115234375, -5.51513671875, -5.21875, -4.92236328125, -4.6259765625, -4.32958984375, -4.033203125, -3.73681640625, -3.4404296875, -3.14404296875, -2.84765625, -2.55126953125, -2.2548828125, -1.95849609375, -1.662109375, -1.36572265625, -1.0693359375, -0.77294921875, -0.4765625, -0.18017578125, 0.1162109375, 0.41259765625, 0.708984375, 1.00537109375, 1.3017578125, 1.59814453125, 1.89453125, 2.19091796875, 2.4873046875, 2.78369140625, 3.080078125, 3.37646484375, 3.6728515625, 3.96923828125, 4.265625, 4.56201171875, 4.8583984375, 5.15478515625, 5.451171875, 5.74755859375, 6.0439453125, 6.34033203125, 6.63671875, 6.93310546875, 7.2294921875, 7.52587890625, 7.822265625, 8.11865234375, 8.4150390625, 8.71142578125, 9.0078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 3.0, 7.0, 9.0, 9.0, 16.0, 14.0, 12.0, 11.0, 21.0, 21.0, 28.0, 29.0, 34.0, 39.0, 38.0, 31.0, 29.0, 48.0, 48.0, 46.0, 48.0, 42.0, 44.0, 42.0, 36.0, 34.0, 30.0, 24.0, 27.0, 34.0, 26.0, 29.0, 14.0, 19.0, 15.0, 10.0, 10.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.703125, -8.44976806640625, -8.1964111328125, -7.94305419921875, -7.689697265625, -7.43634033203125, -7.1829833984375, -6.92962646484375, -6.67626953125, -6.42291259765625, -6.1695556640625, -5.91619873046875, -5.662841796875, -5.40948486328125, -5.1561279296875, -4.90277099609375, -4.6494140625, -4.39605712890625, -4.1427001953125, -3.88934326171875, -3.635986328125, -3.38262939453125, -3.1292724609375, -2.87591552734375, -2.62255859375, -2.36920166015625, -2.1158447265625, -1.86248779296875, -1.609130859375, -1.35577392578125, -1.1024169921875, -0.84906005859375, -0.595703125, -0.34234619140625, -0.0889892578125, 0.16436767578125, 0.417724609375, 0.67108154296875, 0.9244384765625, 1.17779541015625, 1.43115234375, 1.68450927734375, 1.9378662109375, 2.19122314453125, 2.444580078125, 2.69793701171875, 2.9512939453125, 3.20465087890625, 3.4580078125, 3.71136474609375, 3.9647216796875, 4.21807861328125, 4.471435546875, 4.72479248046875, 4.9781494140625, 5.23150634765625, 5.48486328125, 5.73822021484375, 5.9915771484375, 6.24493408203125, 6.498291015625, 6.75164794921875, 7.0050048828125, 7.25836181640625, 7.51171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 12.0, 20.0, 33.0, 28.0, 71.0, 83.0, 160.0, 271.0, 482.0, 919.0, 1687.0, 3532.0, 7055.0, 15343.0, 34146.0, 78205.0, 165542.0, 259984.0, 237531.0, 133137.0, 60570.0, 26249.0, 11805.0, 5581.0, 2814.0, 1449.0, 776.0, 431.0, 237.0, 146.0, 86.0, 54.0, 38.0, 23.0, 16.0, 7.0, 2.0, 8.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.94921875, -7.7210693359375, -7.492919921875, -7.2647705078125, -7.03662109375, -6.8084716796875, -6.580322265625, -6.3521728515625, -6.1240234375, -5.8958740234375, -5.667724609375, -5.4395751953125, -5.21142578125, -4.9832763671875, -4.755126953125, -4.5269775390625, -4.298828125, -4.0706787109375, -3.842529296875, -3.6143798828125, -3.38623046875, -3.1580810546875, -2.929931640625, -2.7017822265625, -2.4736328125, -2.2454833984375, -2.017333984375, -1.7891845703125, -1.56103515625, -1.3328857421875, -1.104736328125, -0.8765869140625, -0.6484375, -0.4202880859375, -0.192138671875, 0.0360107421875, 0.26416015625, 0.4923095703125, 0.720458984375, 0.9486083984375, 1.1767578125, 1.4049072265625, 1.633056640625, 1.8612060546875, 2.08935546875, 2.3175048828125, 2.545654296875, 2.7738037109375, 3.001953125, 3.2301025390625, 3.458251953125, 3.6864013671875, 3.91455078125, 4.1427001953125, 4.370849609375, 4.5989990234375, 4.8271484375, 5.0552978515625, 5.283447265625, 5.5115966796875, 5.73974609375, 5.9678955078125, 6.196044921875, 6.4241943359375, 6.65234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 13.0, 16.0, 14.0, 15.0, 28.0, 27.0, 34.0, 44.0, 45.0, 62.0, 85.0, 67.0, 59.0, 68.0, 61.0, 54.0, 58.0, 43.0, 45.0, 27.0, 21.0, 27.0, 23.0, 12.0, 5.0, 9.0, 11.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005674362182617188, -0.0005509816110134125, -0.0005345270037651062, -0.0005180723965167999, -0.0005016177892684937, -0.0004851631820201874, -0.0004687085747718811, -0.00045225396752357483, -0.00043579936027526855, -0.0004193447530269623, -0.000402890145778656, -0.00038643553853034973, -0.00036998093128204346, -0.0003535263240337372, -0.0003370717167854309, -0.00032061710953712463, -0.00030416250228881836, -0.0002877078950405121, -0.0002712532877922058, -0.00025479868054389954, -0.00023834407329559326, -0.000221889466047287, -0.0002054348587989807, -0.00018898025155067444, -0.00017252564430236816, -0.0001560710370540619, -0.00013961642980575562, -0.00012316182255744934, -0.00010670721530914307, -9.025260806083679e-05, -7.379800081253052e-05, -5.734339356422424e-05, -4.088878631591797e-05, -2.4434179067611694e-05, -7.97957181930542e-06, 8.475035429000854e-06, 2.492964267730713e-05, 4.13842499256134e-05, 5.783885717391968e-05, 7.429346442222595e-05, 9.074807167053223e-05, 0.0001072026789188385, 0.00012365728616714478, 0.00014011189341545105, 0.00015656650066375732, 0.0001730211079120636, 0.00018947571516036987, 0.00020593032240867615, 0.00022238492965698242, 0.0002388395369052887, 0.00025529414415359497, 0.00027174875140190125, 0.0002882033586502075, 0.0003046579658985138, 0.00032111257314682007, 0.00033756718039512634, 0.0003540217876434326, 0.0003704763948917389, 0.00038693100214004517, 0.00040338560938835144, 0.0004198402166366577, 0.000436294823884964, 0.00045274943113327026, 0.00046920403838157654, 0.0004856586456298828]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 4.0, 13.0, 24.0, 27.0, 48.0, 71.0, 110.0, 206.0, 324.0, 501.0, 865.0, 1504.0, 2580.0, 4484.0, 7819.0, 13632.0, 23405.0, 40238.0, 65909.0, 101438.0, 140019.0, 163931.0, 154167.0, 120440.0, 81992.0, 51776.0, 30730.0, 18013.0, 10146.0, 5927.0, 3469.0, 1887.0, 1126.0, 683.0, 385.0, 229.0, 150.0, 94.0, 56.0, 40.0, 22.0, 22.0, 23.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.37109375, -4.2333984375, -4.095703125, -3.9580078125, -3.8203125, -3.6826171875, -3.544921875, -3.4072265625, -3.26953125, -3.1318359375, -2.994140625, -2.8564453125, -2.71875, -2.5810546875, -2.443359375, -2.3056640625, -2.16796875, -2.0302734375, -1.892578125, -1.7548828125, -1.6171875, -1.4794921875, -1.341796875, -1.2041015625, -1.06640625, -0.9287109375, -0.791015625, -0.6533203125, -0.515625, -0.3779296875, -0.240234375, -0.1025390625, 0.03515625, 0.1728515625, 0.310546875, 0.4482421875, 0.5859375, 0.7236328125, 0.861328125, 0.9990234375, 1.13671875, 1.2744140625, 1.412109375, 1.5498046875, 1.6875, 1.8251953125, 1.962890625, 2.1005859375, 2.23828125, 2.3759765625, 2.513671875, 2.6513671875, 2.7890625, 2.9267578125, 3.064453125, 3.2021484375, 3.33984375, 3.4775390625, 3.615234375, 3.7529296875, 3.890625, 4.0283203125, 4.166015625, 4.3037109375, 4.44140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 10.0, 9.0, 14.0, 16.0, 17.0, 30.0, 27.0, 28.0, 45.0, 43.0, 46.0, 63.0, 55.0, 63.0, 76.0, 69.0, 52.0, 53.0, 44.0, 37.0, 47.0, 31.0, 27.0, 21.0, 16.0, 12.0, 11.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.55206298828125, -2.4752197265625, -2.39837646484375, -2.321533203125, -2.24468994140625, -2.1678466796875, -2.09100341796875, -2.01416015625, -1.93731689453125, -1.8604736328125, -1.78363037109375, -1.706787109375, -1.62994384765625, -1.5531005859375, -1.47625732421875, -1.3994140625, -1.32257080078125, -1.2457275390625, -1.16888427734375, -1.092041015625, -1.01519775390625, -0.9383544921875, -0.86151123046875, -0.78466796875, -0.70782470703125, -0.6309814453125, -0.55413818359375, -0.477294921875, -0.40045166015625, -0.3236083984375, -0.24676513671875, -0.169921875, -0.09307861328125, -0.0162353515625, 0.06060791015625, 0.137451171875, 0.21429443359375, 0.2911376953125, 0.36798095703125, 0.44482421875, 0.52166748046875, 0.5985107421875, 0.67535400390625, 0.752197265625, 0.82904052734375, 0.9058837890625, 0.98272705078125, 1.0595703125, 1.13641357421875, 1.2132568359375, 1.29010009765625, 1.366943359375, 1.44378662109375, 1.5206298828125, 1.59747314453125, 1.67431640625, 1.75115966796875, 1.8280029296875, 1.90484619140625, 1.981689453125, 2.05853271484375, 2.1353759765625, 2.21221923828125, 2.2890625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 8.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 11.0, 22.0, 25.0, 27.0, 21.0, 38.0, 45.0, 41.0, 48.0, 32.0, 45.0, 30.0, 45.0, 47.0, 56.0, 42.0, 43.0, 42.0, 42.0, 33.0, 38.0, 23.0, 18.0, 22.0, 24.0, 16.0, 20.0, 9.0, 10.0, 6.0, 6.0, 6.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.338193893432617, -9.029687881469727, -8.721181869506836, -8.412675857543945, -8.104169845581055, -7.795663356781006, -7.487156867980957, -7.178650856018066, -6.870144844055176, -6.561638832092285, -6.2531328201293945, -5.944626331329346, -5.636120319366455, -5.3276143074035645, -5.019107818603516, -4.710601806640625, -4.402095794677734, -4.093589782714844, -3.785083532333374, -3.4765772819519043, -3.1680712699890137, -2.859565258026123, -2.5510590076446533, -2.2425527572631836, -1.934046745300293, -1.6255406141281128, -1.3170344829559326, -1.0085283517837524, -0.7000222206115723, -0.3915160894393921, -0.08300995826721191, 0.2254962921142578, 0.534001350402832, 0.8425074815750122, 1.1510136127471924, 1.4595197439193726, 1.7680258750915527, 2.0765318870544434, 2.385038137435913, 2.693544387817383, 3.0020503997802734, 3.310556411743164, 3.619062662124634, 3.9275689125061035, 4.236074924468994, 4.544580936431885, 4.853087425231934, 5.161593437194824, 5.470099449157715, 5.7786054611206055, 6.087111473083496, 6.395617961883545, 6.7041239738464355, 7.012629985809326, 7.321136474609375, 7.629642486572266, 7.938148498535156, 8.246654510498047, 8.555160522460938, 8.863666534423828, 9.172172546386719, 9.480679512023926, 9.789185523986816, 10.097691535949707, 10.406197547912598]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 13.0, 14.0, 13.0, 12.0, 11.0, 16.0, 17.0, 19.0, 31.0, 26.0, 31.0, 24.0, 25.0, 29.0, 34.0, 34.0, 40.0, 43.0, 44.0, 38.0, 35.0, 30.0, 44.0, 34.0, 29.0, 36.0, 36.0, 24.0, 29.0, 18.0, 21.0, 17.0, 21.0, 8.0, 17.0, 8.0, 10.0, 10.0, 5.0, 8.0, 2.0, 5.0, 6.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0], "bins": [-11.287220001220703, -10.946866035461426, -10.606511116027832, -10.266157150268555, -9.925803184509277, -9.58544921875, -9.245094299316406, -8.904740333557129, -8.564386367797852, -8.224032402038574, -7.883677959442139, -7.543323516845703, -7.202969551086426, -6.86261510848999, -6.522260665893555, -6.181906700134277, -5.841551780700684, -5.501197338104248, -5.160843372344971, -4.820488929748535, -4.480134963989258, -4.139780521392822, -3.7994260787963867, -3.4590718746185303, -3.118717670440674, -2.7783634662628174, -2.438009262084961, -2.0976548194885254, -1.757300615310669, -1.4169464111328125, -1.076591968536377, -0.7362377643585205, -0.39588260650634766, -0.055528342723846436, 0.2848259210586548, 0.6251802444458008, 0.9655344486236572, 1.3058886528015137, 1.6462430953979492, 1.9865972995758057, 2.326951503753662, 2.6673057079315186, 3.007659912109375, 3.3480143547058105, 3.688368558883667, 4.028722763061523, 4.369077205657959, 4.7094316482543945, 5.049785614013672, 5.390140056610107, 5.730494022369385, 6.07084846496582, 6.411202430725098, 6.751556873321533, 7.091911315917969, 7.432265281677246, 7.772619724273682, 8.112974166870117, 8.453328132629395, 8.793682098388672, 9.134037017822266, 9.474390983581543, 9.81474494934082, 10.155099868774414, 10.495453834533691]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 20.0, 21.0, 42.0, 45.0, 83.0, 114.0, 219.0, 274.0, 456.0, 758.0, 1167.0, 1937.0, 3043.0, 5190.0, 8420.0, 14109.0, 23888.0, 39922.0, 65755.0, 107458.0, 173233.0, 263417.0, 378890.0, 491818.0, 561625.0, 556468.0, 476329.0, 360634.0, 247972.0, 158982.0, 99849.0, 60486.0, 36277.0, 21819.0, 12870.0, 7913.0, 4810.0, 2932.0, 1855.0, 1160.0, 701.0, 467.0, 299.0, 200.0, 127.0, 77.0, 46.0, 34.0, 22.0, 13.0, 12.0, 7.0, 5.0, 2.0, 0.0, 2.0], "bins": [-7.484375, -7.25701904296875, -7.0296630859375, -6.80230712890625, -6.574951171875, -6.34759521484375, -6.1202392578125, -5.89288330078125, -5.66552734375, -5.43817138671875, -5.2108154296875, -4.98345947265625, -4.756103515625, -4.52874755859375, -4.3013916015625, -4.07403564453125, -3.8466796875, -3.61932373046875, -3.3919677734375, -3.16461181640625, -2.937255859375, -2.70989990234375, -2.4825439453125, -2.25518798828125, -2.02783203125, -1.80047607421875, -1.5731201171875, -1.34576416015625, -1.118408203125, -0.89105224609375, -0.6636962890625, -0.43634033203125, -0.208984375, 0.01837158203125, 0.2457275390625, 0.47308349609375, 0.700439453125, 0.92779541015625, 1.1551513671875, 1.38250732421875, 1.60986328125, 1.83721923828125, 2.0645751953125, 2.29193115234375, 2.519287109375, 2.74664306640625, 2.9739990234375, 3.20135498046875, 3.4287109375, 3.65606689453125, 3.8834228515625, 4.11077880859375, 4.338134765625, 4.56549072265625, 4.7928466796875, 5.02020263671875, 5.24755859375, 5.47491455078125, 5.7022705078125, 5.92962646484375, 6.156982421875, 6.38433837890625, 6.6116943359375, 6.83905029296875, 7.06640625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 6.0, 5.0, 12.0, 10.0, 13.0, 14.0, 17.0, 22.0, 22.0, 15.0, 35.0, 38.0, 27.0, 31.0, 33.0, 35.0, 27.0, 46.0, 39.0, 33.0, 46.0, 39.0, 36.0, 29.0, 49.0, 34.0, 36.0, 41.0, 19.0, 20.0, 21.0, 21.0, 18.0, 14.0, 21.0, 10.0, 14.0, 8.0, 4.0, 4.0, 6.0, 9.0, 4.0, 5.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-9.3515625, -9.06982421875, -8.7880859375, -8.50634765625, -8.224609375, -7.94287109375, -7.6611328125, -7.37939453125, -7.09765625, -6.81591796875, -6.5341796875, -6.25244140625, -5.970703125, -5.68896484375, -5.4072265625, -5.12548828125, -4.84375, -4.56201171875, -4.2802734375, -3.99853515625, -3.716796875, -3.43505859375, -3.1533203125, -2.87158203125, -2.58984375, -2.30810546875, -2.0263671875, -1.74462890625, -1.462890625, -1.18115234375, -0.8994140625, -0.61767578125, -0.3359375, -0.05419921875, 0.2275390625, 0.50927734375, 0.791015625, 1.07275390625, 1.3544921875, 1.63623046875, 1.91796875, 2.19970703125, 2.4814453125, 2.76318359375, 3.044921875, 3.32666015625, 3.6083984375, 3.89013671875, 4.171875, 4.45361328125, 4.7353515625, 5.01708984375, 5.298828125, 5.58056640625, 5.8623046875, 6.14404296875, 6.42578125, 6.70751953125, 6.9892578125, 7.27099609375, 7.552734375, 7.83447265625, 8.1162109375, 8.39794921875, 8.6796875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 15.0, 18.0, 32.0, 66.0, 92.0, 155.0, 245.0, 436.0, 795.0, 1294.0, 2186.0, 3885.0, 6623.0, 11532.0, 20276.0, 34796.0, 58228.0, 96757.0, 154520.0, 233169.0, 332556.0, 436152.0, 515497.0, 538158.0, 495589.0, 406212.0, 300752.0, 206025.0, 134412.0, 83838.0, 50338.0, 29615.0, 16851.0, 9739.0, 5535.0, 3307.0, 1893.0, 1032.0, 667.0, 415.0, 239.0, 124.0, 93.0, 63.0, 36.0, 14.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.875, -7.63885498046875, -7.4027099609375, -7.16656494140625, -6.930419921875, -6.69427490234375, -6.4581298828125, -6.22198486328125, -5.98583984375, -5.74969482421875, -5.5135498046875, -5.27740478515625, -5.041259765625, -4.80511474609375, -4.5689697265625, -4.33282470703125, -4.0966796875, -3.86053466796875, -3.6243896484375, -3.38824462890625, -3.152099609375, -2.91595458984375, -2.6798095703125, -2.44366455078125, -2.20751953125, -1.97137451171875, -1.7352294921875, -1.49908447265625, -1.262939453125, -1.02679443359375, -0.7906494140625, -0.55450439453125, -0.318359375, -0.08221435546875, 0.1539306640625, 0.39007568359375, 0.626220703125, 0.86236572265625, 1.0985107421875, 1.33465576171875, 1.57080078125, 1.80694580078125, 2.0430908203125, 2.27923583984375, 2.515380859375, 2.75152587890625, 2.9876708984375, 3.22381591796875, 3.4599609375, 3.69610595703125, 3.9322509765625, 4.16839599609375, 4.404541015625, 4.64068603515625, 4.8768310546875, 5.11297607421875, 5.34912109375, 5.58526611328125, 5.8214111328125, 6.05755615234375, 6.293701171875, 6.52984619140625, 6.7659912109375, 7.00213623046875, 7.23828125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 12.0, 13.0, 26.0, 42.0, 47.0, 61.0, 58.0, 73.0, 82.0, 99.0, 119.0, 153.0, 164.0, 154.0, 173.0, 202.0, 214.0, 191.0, 209.0, 206.0, 203.0, 187.0, 179.0, 149.0, 157.0, 132.0, 127.0, 109.0, 82.0, 91.0, 70.0, 50.0, 35.0, 38.0, 28.0, 23.0, 12.0, 12.0, 8.0, 16.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.40234375, -3.28460693359375, -3.1668701171875, -3.04913330078125, -2.931396484375, -2.81365966796875, -2.6959228515625, -2.57818603515625, -2.46044921875, -2.34271240234375, -2.2249755859375, -2.10723876953125, -1.989501953125, -1.87176513671875, -1.7540283203125, -1.63629150390625, -1.5185546875, -1.40081787109375, -1.2830810546875, -1.16534423828125, -1.047607421875, -0.92987060546875, -0.8121337890625, -0.69439697265625, -0.57666015625, -0.45892333984375, -0.3411865234375, -0.22344970703125, -0.105712890625, 0.01202392578125, 0.1297607421875, 0.24749755859375, 0.365234375, 0.48297119140625, 0.6007080078125, 0.71844482421875, 0.836181640625, 0.95391845703125, 1.0716552734375, 1.18939208984375, 1.30712890625, 1.42486572265625, 1.5426025390625, 1.66033935546875, 1.778076171875, 1.89581298828125, 2.0135498046875, 2.13128662109375, 2.2490234375, 2.36676025390625, 2.4844970703125, 2.60223388671875, 2.719970703125, 2.83770751953125, 2.9554443359375, 3.07318115234375, 3.19091796875, 3.30865478515625, 3.4263916015625, 3.54412841796875, 3.661865234375, 3.77960205078125, 3.8973388671875, 4.01507568359375, 4.1328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 3.0, 6.0, 1.0, 6.0, 7.0, 7.0, 13.0, 15.0, 15.0, 24.0, 21.0, 34.0, 21.0, 37.0, 46.0, 48.0, 39.0, 57.0, 43.0, 49.0, 51.0, 52.0, 50.0, 46.0, 48.0, 34.0, 45.0, 25.0, 26.0, 15.0, 26.0, 13.0, 24.0, 11.0, 13.0, 7.0, 9.0, 3.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.147982597351074, -8.843207359313965, -8.538432121276855, -8.233656883239746, -7.9288811683654785, -7.624105930328369, -7.319330215454102, -7.014554977416992, -6.709779739379883, -6.405004501342773, -6.100229263305664, -5.7954535484313965, -5.490678310394287, -5.185903072357178, -4.88112735748291, -4.576352119445801, -4.271576881408691, -3.966801643371582, -3.6620261669158936, -3.357250690460205, -3.0524754524230957, -2.7477002143859863, -2.442924737930298, -2.1381492614746094, -1.8333740234375, -1.528598666191101, -1.2238233089447021, -0.9190479516983032, -0.6142725944519043, -0.30949723720550537, -0.004721879959106445, 0.30005359649658203, 0.6048297882080078, 0.9096051454544067, 1.2143805027008057, 1.5191558599472046, 1.8239312171936035, 2.128706455230713, 2.4334819316864014, 2.73825740814209, 3.043032646179199, 3.3478078842163086, 3.652583360671997, 3.9573588371276855, 4.262134075164795, 4.566909313201904, 4.871685028076172, 5.176460266113281, 5.481235504150391, 5.7860107421875, 6.090785980224609, 6.395561695098877, 6.700336933135986, 7.005112171173096, 7.309887886047363, 7.614663124084473, 7.919438362121582, 8.224213600158691, 8.5289888381958, 8.83376407623291, 9.138540267944336, 9.443315505981445, 9.748090744018555, 10.052865982055664, 10.357641220092773]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 8.0, 15.0, 14.0, 16.0, 20.0, 27.0, 22.0, 19.0, 30.0, 32.0, 34.0, 42.0, 41.0, 33.0, 45.0, 38.0, 36.0, 35.0, 32.0, 46.0, 40.0, 37.0, 35.0, 36.0, 29.0, 22.0, 28.0, 19.0, 26.0, 23.0, 17.0, 9.0, 10.0, 16.0, 11.0, 4.0, 4.0, 7.0, 3.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.548196792602539, -10.220373153686523, -9.892549514770508, -9.564725875854492, -9.236902236938477, -8.909079551696777, -8.581255912780762, -8.253432273864746, -7.9256086349487305, -7.597784996032715, -7.269961357116699, -6.942138195037842, -6.614314556121826, -6.2864909172058105, -5.958667755126953, -5.6308441162109375, -5.303020477294922, -4.975196838378906, -4.647373199462891, -4.319550037384033, -3.9917263984680176, -3.663902759552002, -3.3360793590545654, -3.008255958557129, -2.6804323196411133, -2.3526086807250977, -2.024785280227661, -1.696961760520935, -1.369138240814209, -1.041314721107483, -0.7134912014007568, -0.3856678009033203, -0.05784320831298828, 0.2699803113937378, 0.5978038311004639, 0.9256273508071899, 1.253450870513916, 1.581274390220642, 1.9090979099273682, 2.2369213104248047, 2.5647449493408203, 2.892568588256836, 3.2203919887542725, 3.548215389251709, 3.8760390281677246, 4.20386266708374, 4.531685829162598, 4.859509468078613, 5.187333106994629, 5.5151567459106445, 5.84298038482666, 6.170803546905518, 6.498627185821533, 6.826450824737549, 7.154273986816406, 7.482097625732422, 7.8099212646484375, 8.137744903564453, 8.465568542480469, 8.793392181396484, 9.1212158203125, 9.4490385055542, 9.776862144470215, 10.10468578338623, 10.432509422302246]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 17.0, 12.0, 25.0, 46.0, 45.0, 82.0, 138.0, 183.0, 317.0, 458.0, 723.0, 1139.0, 1771.0, 2984.0, 4968.0, 8300.0, 14199.0, 24303.0, 41544.0, 69272.0, 107960.0, 150035.0, 172558.0, 154956.0, 112727.0, 72508.0, 44003.0, 25965.0, 14859.0, 8821.0, 5268.0, 3070.0, 1965.0, 1237.0, 760.0, 495.0, 302.0, 194.0, 125.0, 84.0, 51.0, 39.0, 20.0, 8.0, 9.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87701416015625, -3.7501220703125, -3.62322998046875, -3.496337890625, -3.36944580078125, -3.2425537109375, -3.11566162109375, -2.98876953125, -2.86187744140625, -2.7349853515625, -2.60809326171875, -2.481201171875, -2.35430908203125, -2.2274169921875, -2.10052490234375, -1.9736328125, -1.84674072265625, -1.7198486328125, -1.59295654296875, -1.466064453125, -1.33917236328125, -1.2122802734375, -1.08538818359375, -0.95849609375, -0.83160400390625, -0.7047119140625, -0.57781982421875, -0.450927734375, -0.32403564453125, -0.1971435546875, -0.07025146484375, 0.056640625, 0.18353271484375, 0.3104248046875, 0.43731689453125, 0.564208984375, 0.69110107421875, 0.8179931640625, 0.94488525390625, 1.07177734375, 1.19866943359375, 1.3255615234375, 1.45245361328125, 1.579345703125, 1.70623779296875, 1.8331298828125, 1.96002197265625, 2.0869140625, 2.21380615234375, 2.3406982421875, 2.46759033203125, 2.594482421875, 2.72137451171875, 2.8482666015625, 2.97515869140625, 3.10205078125, 3.22894287109375, 3.3558349609375, 3.48272705078125, 3.609619140625, 3.73651123046875, 3.8634033203125, 3.99029541015625, 4.1171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 8.0, 8.0, 8.0, 11.0, 9.0, 14.0, 20.0, 20.0, 18.0, 21.0, 26.0, 22.0, 44.0, 37.0, 33.0, 39.0, 42.0, 41.0, 40.0, 29.0, 42.0, 42.0, 30.0, 47.0, 35.0, 39.0, 33.0, 42.0, 27.0, 24.0, 26.0, 20.0, 25.0, 10.0, 15.0, 12.0, 5.0, 5.0, 7.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.9140625, -10.5731201171875, -10.232177734375, -9.8912353515625, -9.55029296875, -9.2093505859375, -8.868408203125, -8.5274658203125, -8.1865234375, -7.8455810546875, -7.504638671875, -7.1636962890625, -6.82275390625, -6.4818115234375, -6.140869140625, -5.7999267578125, -5.458984375, -5.1180419921875, -4.777099609375, -4.4361572265625, -4.09521484375, -3.7542724609375, -3.413330078125, -3.0723876953125, -2.7314453125, -2.3905029296875, -2.049560546875, -1.7086181640625, -1.36767578125, -1.0267333984375, -0.685791015625, -0.3448486328125, -0.00390625, 0.3370361328125, 0.677978515625, 1.0189208984375, 1.35986328125, 1.7008056640625, 2.041748046875, 2.3826904296875, 2.7236328125, 3.0645751953125, 3.405517578125, 3.7464599609375, 4.08740234375, 4.4283447265625, 4.769287109375, 5.1102294921875, 5.451171875, 5.7921142578125, 6.133056640625, 6.4739990234375, 6.81494140625, 7.1558837890625, 7.496826171875, 7.8377685546875, 8.1787109375, 8.5196533203125, 8.860595703125, 9.2015380859375, 9.54248046875, 9.8834228515625, 10.224365234375, 10.5653076171875, 10.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 21.0, 26.0, 52.0, 55.0, 120.0, 149.0, 259.0, 429.0, 745.0, 1383.0, 2616.0, 4913.0, 10508.0, 22982.0, 53246.0, 123945.0, 238426.0, 275911.0, 172290.0, 77803.0, 33429.0, 14583.0, 6985.0, 3391.0, 1789.0, 978.0, 545.0, 362.0, 221.0, 124.0, 84.0, 52.0, 27.0, 21.0, 10.0, 16.0, 7.0, 6.0, 10.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.66925048828125, -5.4752197265625, -5.28118896484375, -5.087158203125, -4.89312744140625, -4.6990966796875, -4.50506591796875, -4.31103515625, -4.11700439453125, -3.9229736328125, -3.72894287109375, -3.534912109375, -3.34088134765625, -3.1468505859375, -2.95281982421875, -2.7587890625, -2.56475830078125, -2.3707275390625, -2.17669677734375, -1.982666015625, -1.78863525390625, -1.5946044921875, -1.40057373046875, -1.20654296875, -1.01251220703125, -0.8184814453125, -0.62445068359375, -0.430419921875, -0.23638916015625, -0.0423583984375, 0.15167236328125, 0.345703125, 0.53973388671875, 0.7337646484375, 0.92779541015625, 1.121826171875, 1.31585693359375, 1.5098876953125, 1.70391845703125, 1.89794921875, 2.09197998046875, 2.2860107421875, 2.48004150390625, 2.674072265625, 2.86810302734375, 3.0621337890625, 3.25616455078125, 3.4501953125, 3.64422607421875, 3.8382568359375, 4.03228759765625, 4.226318359375, 4.42034912109375, 4.6143798828125, 4.80841064453125, 5.00244140625, 5.19647216796875, 5.3905029296875, 5.58453369140625, 5.778564453125, 5.97259521484375, 6.1666259765625, 6.36065673828125, 6.5546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 7.0, 21.0, 13.0, 11.0, 16.0, 17.0, 20.0, 19.0, 28.0, 27.0, 33.0, 25.0, 32.0, 35.0, 31.0, 36.0, 35.0, 42.0, 40.0, 42.0, 46.0, 34.0, 41.0, 26.0, 34.0, 34.0, 22.0, 21.0, 35.0, 25.0, 18.0, 19.0, 17.0, 9.0, 17.0, 11.0, 16.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.383056640625, -7.14892578125, -6.914794921875, -6.6806640625, -6.446533203125, -6.21240234375, -5.978271484375, -5.744140625, -5.510009765625, -5.27587890625, -5.041748046875, -4.8076171875, -4.573486328125, -4.33935546875, -4.105224609375, -3.87109375, -3.636962890625, -3.40283203125, -3.168701171875, -2.9345703125, -2.700439453125, -2.46630859375, -2.232177734375, -1.998046875, -1.763916015625, -1.52978515625, -1.295654296875, -1.0615234375, -0.827392578125, -0.59326171875, -0.359130859375, -0.125, 0.109130859375, 0.34326171875, 0.577392578125, 0.8115234375, 1.045654296875, 1.27978515625, 1.513916015625, 1.748046875, 1.982177734375, 2.21630859375, 2.450439453125, 2.6845703125, 2.918701171875, 3.15283203125, 3.386962890625, 3.62109375, 3.855224609375, 4.08935546875, 4.323486328125, 4.5576171875, 4.791748046875, 5.02587890625, 5.260009765625, 5.494140625, 5.728271484375, 5.96240234375, 6.196533203125, 6.4306640625, 6.664794921875, 6.89892578125, 7.133056640625, 7.3671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 11.0, 12.0, 15.0, 20.0, 26.0, 39.0, 56.0, 73.0, 104.0, 146.0, 172.0, 265.0, 406.0, 538.0, 792.0, 1171.0, 1919.0, 3417.0, 6284.0, 12927.0, 31766.0, 105492.0, 442970.0, 318635.0, 72494.0, 24638.0, 10551.0, 5453.0, 2881.0, 1725.0, 1102.0, 711.0, 488.0, 364.0, 235.0, 170.0, 138.0, 87.0, 63.0, 54.0, 41.0, 21.0, 30.0, 17.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-4.38671875, -4.25323486328125, -4.1197509765625, -3.98626708984375, -3.852783203125, -3.71929931640625, -3.5858154296875, -3.45233154296875, -3.31884765625, -3.18536376953125, -3.0518798828125, -2.91839599609375, -2.784912109375, -2.65142822265625, -2.5179443359375, -2.38446044921875, -2.2509765625, -2.11749267578125, -1.9840087890625, -1.85052490234375, -1.717041015625, -1.58355712890625, -1.4500732421875, -1.31658935546875, -1.18310546875, -1.04962158203125, -0.9161376953125, -0.78265380859375, -0.649169921875, -0.51568603515625, -0.3822021484375, -0.24871826171875, -0.115234375, 0.01824951171875, 0.1517333984375, 0.28521728515625, 0.418701171875, 0.55218505859375, 0.6856689453125, 0.81915283203125, 0.95263671875, 1.08612060546875, 1.2196044921875, 1.35308837890625, 1.486572265625, 1.62005615234375, 1.7535400390625, 1.88702392578125, 2.0205078125, 2.15399169921875, 2.2874755859375, 2.42095947265625, 2.554443359375, 2.68792724609375, 2.8214111328125, 2.95489501953125, 3.08837890625, 3.22186279296875, 3.3553466796875, 3.48883056640625, 3.622314453125, 3.75579833984375, 3.8892822265625, 4.02276611328125, 4.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 7.0, 14.0, 13.0, 11.0, 23.0, 27.0, 32.0, 30.0, 52.0, 65.0, 92.0, 106.0, 108.0, 87.0, 71.0, 51.0, 39.0, 38.0, 27.0, 18.0, 14.0, 12.0, 9.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023818016052246094, -0.00023001432418823242, -0.0002218484878540039, -0.0002136826515197754, -0.00020551681518554688, -0.00019735097885131836, -0.00018918514251708984, -0.00018101930618286133, -0.0001728534698486328, -0.0001646876335144043, -0.00015652179718017578, -0.00014835596084594727, -0.00014019012451171875, -0.00013202428817749023, -0.00012385845184326172, -0.0001156926155090332, -0.00010752677917480469, -9.936094284057617e-05, -9.119510650634766e-05, -8.302927017211914e-05, -7.486343383789062e-05, -6.669759750366211e-05, -5.8531761169433594e-05, -5.036592483520508e-05, -4.220008850097656e-05, -3.403425216674805e-05, -2.586841583251953e-05, -1.7702579498291016e-05, -9.5367431640625e-06, -1.3709068298339844e-06, 6.794929504394531e-06, 1.4960765838623047e-05, 2.3126602172851562e-05, 3.129243850708008e-05, 3.9458274841308594e-05, 4.762411117553711e-05, 5.5789947509765625e-05, 6.395578384399414e-05, 7.212162017822266e-05, 8.028745651245117e-05, 8.845329284667969e-05, 9.66191291809082e-05, 0.00010478496551513672, 0.00011295080184936523, 0.00012111663818359375, 0.00012928247451782227, 0.00013744831085205078, 0.0001456141471862793, 0.0001537799835205078, 0.00016194581985473633, 0.00017011165618896484, 0.00017827749252319336, 0.00018644332885742188, 0.0001946091651916504, 0.0002027750015258789, 0.00021094083786010742, 0.00021910667419433594, 0.00022727251052856445, 0.00023543834686279297, 0.00024360418319702148, 0.00025177001953125, 0.0002599358558654785, 0.00026810169219970703, 0.00027626752853393555, 0.00028443336486816406]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 10.0, 14.0, 14.0, 24.0, 40.0, 55.0, 83.0, 135.0, 147.0, 228.0, 324.0, 467.0, 656.0, 1069.0, 1569.0, 2442.0, 3905.0, 6144.0, 10465.0, 18950.0, 37314.0, 80225.0, 187366.0, 318166.0, 203173.0, 86332.0, 39772.0, 20220.0, 11160.0, 6593.0, 3978.0, 2506.0, 1605.0, 1024.0, 739.0, 519.0, 352.0, 228.0, 165.0, 125.0, 76.0, 57.0, 41.0, 23.0, 15.0, 13.0, 11.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.451171875, -3.348297119140625, -3.24542236328125, -3.142547607421875, -3.0396728515625, -2.936798095703125, -2.83392333984375, -2.731048583984375, -2.628173828125, -2.525299072265625, -2.42242431640625, -2.319549560546875, -2.2166748046875, -2.113800048828125, -2.01092529296875, -1.908050537109375, -1.80517578125, -1.702301025390625, -1.59942626953125, -1.496551513671875, -1.3936767578125, -1.290802001953125, -1.18792724609375, -1.085052490234375, -0.982177734375, -0.879302978515625, -0.77642822265625, -0.673553466796875, -0.5706787109375, -0.467803955078125, -0.36492919921875, -0.262054443359375, -0.1591796875, -0.056304931640625, 0.04656982421875, 0.149444580078125, 0.2523193359375, 0.355194091796875, 0.45806884765625, 0.560943603515625, 0.663818359375, 0.766693115234375, 0.86956787109375, 0.972442626953125, 1.0753173828125, 1.178192138671875, 1.28106689453125, 1.383941650390625, 1.48681640625, 1.589691162109375, 1.69256591796875, 1.795440673828125, 1.8983154296875, 2.001190185546875, 2.10406494140625, 2.206939697265625, 2.309814453125, 2.412689208984375, 2.51556396484375, 2.618438720703125, 2.7213134765625, 2.824188232421875, 2.92706298828125, 3.029937744140625, 3.1328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 7.0, 12.0, 10.0, 11.0, 22.0, 24.0, 16.0, 25.0, 35.0, 47.0, 55.0, 86.0, 118.0, 108.0, 69.0, 61.0, 54.0, 39.0, 28.0, 19.0, 27.0, 20.0, 14.0, 15.0, 13.0, 13.0, 8.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6318359375, -1.5824737548828125, -1.533111572265625, -1.4837493896484375, -1.43438720703125, -1.3850250244140625, -1.335662841796875, -1.2863006591796875, -1.2369384765625, -1.1875762939453125, -1.138214111328125, -1.0888519287109375, -1.03948974609375, -0.9901275634765625, -0.940765380859375, -0.8914031982421875, -0.842041015625, -0.7926788330078125, -0.743316650390625, -0.6939544677734375, -0.64459228515625, -0.5952301025390625, -0.545867919921875, -0.4965057373046875, -0.4471435546875, -0.3977813720703125, -0.348419189453125, -0.2990570068359375, -0.24969482421875, -0.2003326416015625, -0.150970458984375, -0.1016082763671875, -0.05224609375, -0.0028839111328125, 0.046478271484375, 0.0958404541015625, 0.14520263671875, 0.1945648193359375, 0.243927001953125, 0.2932891845703125, 0.3426513671875, 0.3920135498046875, 0.441375732421875, 0.4907379150390625, 0.54010009765625, 0.5894622802734375, 0.638824462890625, 0.6881866455078125, 0.737548828125, 0.7869110107421875, 0.836273193359375, 0.8856353759765625, 0.93499755859375, 0.9843597412109375, 1.033721923828125, 1.0830841064453125, 1.1324462890625, 1.1818084716796875, 1.231170654296875, 1.2805328369140625, 1.32989501953125, 1.3792572021484375, 1.428619384765625, 1.4779815673828125, 1.52734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 3.0, 8.0, 10.0, 5.0, 16.0, 24.0, 34.0, 27.0, 30.0, 33.0, 38.0, 57.0, 43.0, 41.0, 58.0, 56.0, 59.0, 63.0, 44.0, 47.0, 51.0, 47.0, 33.0, 22.0, 34.0, 20.0, 17.0, 22.0, 12.0, 8.0, 8.0, 7.0, 6.0, 2.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.969135284423828, -9.637640953063965, -9.306146621704102, -8.974652290344238, -8.643157958984375, -8.311662673950195, -7.980168342590332, -7.648674011230469, -7.3171796798706055, -6.985685348510742, -6.654191017150879, -6.322696208953857, -5.991201877593994, -5.659707546234131, -5.328212738037109, -4.996718406677246, -4.665224075317383, -4.3337297439575195, -4.002235412597656, -3.6707406044006348, -3.3392462730407715, -3.007751941680908, -2.676257371902466, -2.3447628021240234, -2.01326847076416, -1.6817740201950073, -1.3502795696258545, -1.0187851190567017, -0.6872906684875488, -0.355796217918396, -0.024301767349243164, 0.3071928024291992, 0.6386880874633789, 0.9701825380325317, 1.3016769886016846, 1.6331714391708374, 1.9646658897399902, 2.2961602210998535, 2.627654790878296, 2.9591493606567383, 3.2906436920166016, 3.622138023376465, 3.9536325931549072, 4.28512716293335, 4.616621494293213, 4.948115825653076, 5.279610633850098, 5.611104965209961, 5.942599296569824, 6.2740936279296875, 6.605587959289551, 6.937082767486572, 7.2685770988464355, 7.600071430206299, 7.93156623840332, 8.263060569763184, 8.594554901123047, 8.92604923248291, 9.257543563842773, 9.589037895202637, 9.9205322265625, 10.25202751159668, 10.583521842956543, 10.915016174316406, 11.24651050567627]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 3.0, 8.0, 6.0, 21.0, 9.0, 23.0, 20.0, 21.0, 23.0, 26.0, 28.0, 34.0, 32.0, 34.0, 46.0, 37.0, 33.0, 45.0, 33.0, 34.0, 40.0, 43.0, 42.0, 45.0, 27.0, 30.0, 24.0, 34.0, 23.0, 29.0, 19.0, 16.0, 19.0, 13.0, 13.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-10.81541919708252, -10.488164901733398, -10.160911560058594, -9.833657264709473, -9.506403923034668, -9.179149627685547, -8.851896286010742, -8.524641990661621, -8.1973876953125, -7.870133876800537, -7.542880058288574, -7.215626239776611, -6.888372421264648, -6.561118125915527, -6.2338643074035645, -5.906610488891602, -5.579357147216797, -5.252103328704834, -4.924849510192871, -4.597595691680908, -4.270341873168945, -3.9430878162384033, -3.6158337593078613, -3.2885799407958984, -2.9613261222839355, -2.6340723037719727, -2.3068184852600098, -1.9795644283294678, -1.6523106098175049, -1.325056791305542, -0.9978028535842896, -0.6705489158630371, -0.3432941436767578, -0.016040265560150146, 0.3112136125564575, 0.6384674906730652, 0.9657213687896729, 1.2929751873016357, 1.6202291250228882, 1.9474830627441406, 2.2747368812561035, 2.6019906997680664, 2.9292445182800293, 3.2564985752105713, 3.583752393722534, 3.911006212234497, 4.238260269165039, 4.565514087677002, 4.892767906188965, 5.220021724700928, 5.547275543212891, 5.8745293617248535, 6.201783180236816, 6.5290374755859375, 6.8562912940979, 7.183545112609863, 7.510798931121826, 7.838052749633789, 8.16530704498291, 8.492560386657715, 8.819814682006836, 9.14706802368164, 9.474322319030762, 9.801576614379883, 10.128829956054688]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 9.0, 9.0, 10.0, 25.0, 18.0, 38.0, 57.0, 113.0, 138.0, 231.0, 346.0, 488.0, 792.0, 1085.0, 1676.0, 2572.0, 4025.0, 5781.0, 8697.0, 13251.0, 19252.0, 28097.0, 39480.0, 54060.0, 70644.0, 86911.0, 99925.0, 106551.0, 104969.0, 95648.0, 81009.0, 63887.0, 48361.0, 35083.0, 24633.0, 16674.0, 11265.0, 7570.0, 5175.0, 3481.0, 2130.0, 1499.0, 966.0, 641.0, 427.0, 270.0, 193.0, 127.0, 97.0, 50.0, 40.0, 29.0, 14.0, 15.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-6.359375, -6.15301513671875, -5.9466552734375, -5.74029541015625, -5.533935546875, -5.32757568359375, -5.1212158203125, -4.91485595703125, -4.70849609375, -4.50213623046875, -4.2957763671875, -4.08941650390625, -3.883056640625, -3.67669677734375, -3.4703369140625, -3.26397705078125, -3.0576171875, -2.85125732421875, -2.6448974609375, -2.43853759765625, -2.232177734375, -2.02581787109375, -1.8194580078125, -1.61309814453125, -1.40673828125, -1.20037841796875, -0.9940185546875, -0.78765869140625, -0.581298828125, -0.37493896484375, -0.1685791015625, 0.03778076171875, 0.244140625, 0.45050048828125, 0.6568603515625, 0.86322021484375, 1.069580078125, 1.27593994140625, 1.4822998046875, 1.68865966796875, 1.89501953125, 2.10137939453125, 2.3077392578125, 2.51409912109375, 2.720458984375, 2.92681884765625, 3.1331787109375, 3.33953857421875, 3.5458984375, 3.75225830078125, 3.9586181640625, 4.16497802734375, 4.371337890625, 4.57769775390625, 4.7840576171875, 4.99041748046875, 5.19677734375, 5.40313720703125, 5.6094970703125, 5.81585693359375, 6.022216796875, 6.22857666015625, 6.4349365234375, 6.64129638671875, 6.84765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 2.0, 9.0, 8.0, 8.0, 16.0, 19.0, 18.0, 19.0, 30.0, 27.0, 23.0, 21.0, 41.0, 44.0, 33.0, 40.0, 34.0, 41.0, 36.0, 37.0, 49.0, 47.0, 39.0, 39.0, 36.0, 34.0, 21.0, 23.0, 27.0, 24.0, 25.0, 26.0, 19.0, 9.0, 13.0, 14.0, 12.0, 5.0, 6.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-11.234375, -10.9068603515625, -10.579345703125, -10.2518310546875, -9.92431640625, -9.5968017578125, -9.269287109375, -8.9417724609375, -8.6142578125, -8.2867431640625, -7.959228515625, -7.6317138671875, -7.30419921875, -6.9766845703125, -6.649169921875, -6.3216552734375, -5.994140625, -5.6666259765625, -5.339111328125, -5.0115966796875, -4.68408203125, -4.3565673828125, -4.029052734375, -3.7015380859375, -3.3740234375, -3.0465087890625, -2.718994140625, -2.3914794921875, -2.06396484375, -1.7364501953125, -1.408935546875, -1.0814208984375, -0.75390625, -0.4263916015625, -0.098876953125, 0.2286376953125, 0.55615234375, 0.8836669921875, 1.211181640625, 1.5386962890625, 1.8662109375, 2.1937255859375, 2.521240234375, 2.8487548828125, 3.17626953125, 3.5037841796875, 3.831298828125, 4.1588134765625, 4.486328125, 4.8138427734375, 5.141357421875, 5.4688720703125, 5.79638671875, 6.1239013671875, 6.451416015625, 6.7789306640625, 7.1064453125, 7.4339599609375, 7.761474609375, 8.0889892578125, 8.41650390625, 8.7440185546875, 9.071533203125, 9.3990478515625, 9.7265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 6.0, 5.0, 12.0, 17.0, 26.0, 38.0, 59.0, 93.0, 131.0, 175.0, 262.0, 458.0, 580.0, 868.0, 1233.0, 1904.0, 2906.0, 4318.0, 6596.0, 9673.0, 14731.0, 21847.0, 31073.0, 44239.0, 60664.0, 78865.0, 94934.0, 106572.0, 110378.0, 104628.0, 91513.0, 74273.0, 56238.0, 40957.0, 28538.0, 19815.0, 13203.0, 8939.0, 5879.0, 4019.0, 2615.0, 1737.0, 1185.0, 773.0, 504.0, 363.0, 247.0, 143.0, 98.0, 81.0, 49.0, 34.0, 28.0, 13.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4765625, -6.256103515625, -6.03564453125, -5.815185546875, -5.5947265625, -5.374267578125, -5.15380859375, -4.933349609375, -4.712890625, -4.492431640625, -4.27197265625, -4.051513671875, -3.8310546875, -3.610595703125, -3.39013671875, -3.169677734375, -2.94921875, -2.728759765625, -2.50830078125, -2.287841796875, -2.0673828125, -1.846923828125, -1.62646484375, -1.406005859375, -1.185546875, -0.965087890625, -0.74462890625, -0.524169921875, -0.3037109375, -0.083251953125, 0.13720703125, 0.357666015625, 0.578125, 0.798583984375, 1.01904296875, 1.239501953125, 1.4599609375, 1.680419921875, 1.90087890625, 2.121337890625, 2.341796875, 2.562255859375, 2.78271484375, 3.003173828125, 3.2236328125, 3.444091796875, 3.66455078125, 3.885009765625, 4.10546875, 4.325927734375, 4.54638671875, 4.766845703125, 4.9873046875, 5.207763671875, 5.42822265625, 5.648681640625, 5.869140625, 6.089599609375, 6.31005859375, 6.530517578125, 6.7509765625, 6.971435546875, 7.19189453125, 7.412353515625, 7.6328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 6.0, 17.0, 12.0, 21.0, 20.0, 22.0, 23.0, 24.0, 20.0, 31.0, 33.0, 30.0, 35.0, 46.0, 45.0, 50.0, 44.0, 38.0, 42.0, 47.0, 37.0, 39.0, 35.0, 34.0, 31.0, 25.0, 23.0, 20.0, 14.0, 24.0, 17.0, 12.0, 7.0, 10.0, 8.0, 8.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.984375, -6.757568359375, -6.53076171875, -6.303955078125, -6.0771484375, -5.850341796875, -5.62353515625, -5.396728515625, -5.169921875, -4.943115234375, -4.71630859375, -4.489501953125, -4.2626953125, -4.035888671875, -3.80908203125, -3.582275390625, -3.35546875, -3.128662109375, -2.90185546875, -2.675048828125, -2.4482421875, -2.221435546875, -1.99462890625, -1.767822265625, -1.541015625, -1.314208984375, -1.08740234375, -0.860595703125, -0.6337890625, -0.406982421875, -0.18017578125, 0.046630859375, 0.2734375, 0.500244140625, 0.72705078125, 0.953857421875, 1.1806640625, 1.407470703125, 1.63427734375, 1.861083984375, 2.087890625, 2.314697265625, 2.54150390625, 2.768310546875, 2.9951171875, 3.221923828125, 3.44873046875, 3.675537109375, 3.90234375, 4.129150390625, 4.35595703125, 4.582763671875, 4.8095703125, 5.036376953125, 5.26318359375, 5.489990234375, 5.716796875, 5.943603515625, 6.17041015625, 6.397216796875, 6.6240234375, 6.850830078125, 7.07763671875, 7.304443359375, 7.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 7.0, 24.0, 21.0, 28.0, 48.0, 57.0, 119.0, 160.0, 219.0, 377.0, 511.0, 891.0, 1424.0, 2335.0, 4110.0, 7347.0, 12842.0, 24509.0, 45744.0, 83897.0, 138597.0, 186924.0, 191021.0, 146114.0, 91002.0, 50251.0, 26596.0, 14250.0, 8003.0, 4392.0, 2585.0, 1495.0, 937.0, 583.0, 349.0, 242.0, 167.0, 115.0, 90.0, 52.0, 23.0, 34.0, 17.0, 6.0, 8.0, 10.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.105224609375, -4.94091796875, -4.776611328125, -4.6123046875, -4.447998046875, -4.28369140625, -4.119384765625, -3.955078125, -3.790771484375, -3.62646484375, -3.462158203125, -3.2978515625, -3.133544921875, -2.96923828125, -2.804931640625, -2.640625, -2.476318359375, -2.31201171875, -2.147705078125, -1.9833984375, -1.819091796875, -1.65478515625, -1.490478515625, -1.326171875, -1.161865234375, -0.99755859375, -0.833251953125, -0.6689453125, -0.504638671875, -0.34033203125, -0.176025390625, -0.01171875, 0.152587890625, 0.31689453125, 0.481201171875, 0.6455078125, 0.809814453125, 0.97412109375, 1.138427734375, 1.302734375, 1.467041015625, 1.63134765625, 1.795654296875, 1.9599609375, 2.124267578125, 2.28857421875, 2.452880859375, 2.6171875, 2.781494140625, 2.94580078125, 3.110107421875, 3.2744140625, 3.438720703125, 3.60302734375, 3.767333984375, 3.931640625, 4.095947265625, 4.26025390625, 4.424560546875, 4.5888671875, 4.753173828125, 4.91748046875, 5.081787109375, 5.24609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 7.0, 2.0, 10.0, 10.0, 14.0, 19.0, 24.0, 29.0, 39.0, 43.0, 37.0, 42.0, 46.0, 42.0, 70.0, 54.0, 39.0, 45.0, 46.0, 63.0, 48.0, 45.0, 36.0, 35.0, 35.0, 27.0, 24.0, 16.0, 15.0, 13.0, 10.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00045418739318847656, -0.00044137611985206604, -0.0004285648465156555, -0.000415753573179245, -0.00040294229984283447, -0.00039013102650642395, -0.00037731975317001343, -0.0003645084798336029, -0.0003516972064971924, -0.00033888593316078186, -0.00032607465982437134, -0.0003132633864879608, -0.0003004521131515503, -0.00028764083981513977, -0.00027482956647872925, -0.0002620182931423187, -0.0002492070198059082, -0.00023639574646949768, -0.00022358447313308716, -0.00021077319979667664, -0.0001979619264602661, -0.0001851506531238556, -0.00017233937978744507, -0.00015952810645103455, -0.00014671683311462402, -0.0001339055597782135, -0.00012109428644180298, -0.00010828301310539246, -9.547173976898193e-05, -8.266046643257141e-05, -6.984919309616089e-05, -5.7037919759750366e-05, -4.4226646423339844e-05, -3.141537308692932e-05, -1.86040997505188e-05, -5.792826414108276e-06, 7.018446922302246e-06, 1.982972025871277e-05, 3.264099359512329e-05, 4.5452266931533813e-05, 5.8263540267944336e-05, 7.107481360435486e-05, 8.388608694076538e-05, 9.66973602771759e-05, 0.00010950863361358643, 0.00012231990694999695, 0.00013513118028640747, 0.000147942453622818, 0.00016075372695922852, 0.00017356500029563904, 0.00018637627363204956, 0.00019918754696846008, 0.0002119988203048706, 0.00022481009364128113, 0.00023762136697769165, 0.00025043264031410217, 0.0002632439136505127, 0.0002760551869869232, 0.00028886646032333374, 0.00030167773365974426, 0.0003144890069961548, 0.0003273002803325653, 0.00034011155366897583, 0.00035292282700538635, 0.0003657341003417969]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 11.0, 15.0, 18.0, 31.0, 36.0, 43.0, 82.0, 128.0, 188.0, 285.0, 424.0, 708.0, 1094.0, 1751.0, 2925.0, 5052.0, 8425.0, 14482.0, 25043.0, 43285.0, 70648.0, 107455.0, 144418.0, 162377.0, 149743.0, 115954.0, 77648.0, 48350.0, 28272.0, 16388.0, 9467.0, 5374.0, 3232.0, 1891.0, 1172.0, 757.0, 473.0, 292.0, 186.0, 124.0, 95.0, 81.0, 36.0, 25.0, 17.0, 20.0, 4.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.1953125, -4.06256103515625, -3.9298095703125, -3.79705810546875, -3.664306640625, -3.53155517578125, -3.3988037109375, -3.26605224609375, -3.13330078125, -3.00054931640625, -2.8677978515625, -2.73504638671875, -2.602294921875, -2.46954345703125, -2.3367919921875, -2.20404052734375, -2.0712890625, -1.93853759765625, -1.8057861328125, -1.67303466796875, -1.540283203125, -1.40753173828125, -1.2747802734375, -1.14202880859375, -1.00927734375, -0.87652587890625, -0.7437744140625, -0.61102294921875, -0.478271484375, -0.34552001953125, -0.2127685546875, -0.08001708984375, 0.052734375, 0.18548583984375, 0.3182373046875, 0.45098876953125, 0.583740234375, 0.71649169921875, 0.8492431640625, 0.98199462890625, 1.11474609375, 1.24749755859375, 1.3802490234375, 1.51300048828125, 1.645751953125, 1.77850341796875, 1.9112548828125, 2.04400634765625, 2.1767578125, 2.30950927734375, 2.4422607421875, 2.57501220703125, 2.707763671875, 2.84051513671875, 2.9732666015625, 3.10601806640625, 3.23876953125, 3.37152099609375, 3.5042724609375, 3.63702392578125, 3.769775390625, 3.90252685546875, 4.0352783203125, 4.16802978515625, 4.30078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 8.0, 12.0, 15.0, 20.0, 24.0, 34.0, 40.0, 52.0, 61.0, 72.0, 83.0, 80.0, 86.0, 83.0, 67.0, 53.0, 43.0, 36.0, 24.0, 19.0, 21.0, 12.0, 6.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.25, -4.140045166015625, -4.03009033203125, -3.920135498046875, -3.8101806640625, -3.700225830078125, -3.59027099609375, -3.480316162109375, -3.370361328125, -3.260406494140625, -3.15045166015625, -3.040496826171875, -2.9305419921875, -2.820587158203125, -2.71063232421875, -2.600677490234375, -2.49072265625, -2.380767822265625, -2.27081298828125, -2.160858154296875, -2.0509033203125, -1.940948486328125, -1.83099365234375, -1.721038818359375, -1.611083984375, -1.501129150390625, -1.39117431640625, -1.281219482421875, -1.1712646484375, -1.061309814453125, -0.95135498046875, -0.841400146484375, -0.7314453125, -0.621490478515625, -0.51153564453125, -0.401580810546875, -0.2916259765625, -0.181671142578125, -0.07171630859375, 0.038238525390625, 0.148193359375, 0.258148193359375, 0.36810302734375, 0.478057861328125, 0.5880126953125, 0.697967529296875, 0.80792236328125, 0.917877197265625, 1.02783203125, 1.137786865234375, 1.24774169921875, 1.357696533203125, 1.4676513671875, 1.577606201171875, 1.68756103515625, 1.797515869140625, 1.907470703125, 2.017425537109375, 2.12738037109375, 2.237335205078125, 2.3472900390625, 2.457244873046875, 2.56719970703125, 2.677154541015625, 2.787109375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 11.0, 13.0, 12.0, 9.0, 16.0, 15.0, 25.0, 18.0, 26.0, 37.0, 32.0, 27.0, 39.0, 45.0, 43.0, 34.0, 46.0, 63.0, 38.0, 57.0, 45.0, 45.0, 43.0, 37.0, 30.0, 26.0, 16.0, 27.0, 18.0, 16.0, 15.0, 14.0, 16.0, 4.0, 8.0, 3.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9874348640441895, -7.70811653137207, -7.428798675537109, -7.149480819702148, -6.870162487030029, -6.59084415435791, -6.311526298522949, -6.032208442687988, -5.752890110015869, -5.47357177734375, -5.194253921508789, -4.914936065673828, -4.635617733001709, -4.35629940032959, -4.076981544494629, -3.797663450241089, -3.518345355987549, -3.239027261734009, -2.9597091674804688, -2.6803910732269287, -2.4010729789733887, -2.1217548847198486, -1.8424367904663086, -1.5631186962127686, -1.2838006019592285, -1.0044825077056885, -0.7251644134521484, -0.4458463191986084, -0.16652822494506836, 0.11278986930847168, 0.3921079635620117, 0.6714260578155518, 0.9507436752319336, 1.2300617694854736, 1.5093798637390137, 1.7886979579925537, 2.0680160522460938, 2.347334146499634, 2.626652240753174, 2.905970335006714, 3.185288429260254, 3.464606523513794, 3.743924617767334, 4.023242950439453, 4.302560806274414, 4.581878662109375, 4.861196994781494, 5.140515327453613, 5.419833183288574, 5.699151039123535, 5.978469371795654, 6.257787704467773, 6.537105560302734, 6.816423416137695, 7.0957417488098145, 7.375060081481934, 7.6543779373168945, 7.9336957931518555, 8.213014602661133, 8.492332458496094, 8.771650314331055, 9.050968170166016, 9.330286026000977, 9.609604835510254, 9.888922691345215]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 7.0, 11.0, 19.0, 17.0, 15.0, 20.0, 17.0, 16.0, 31.0, 24.0, 28.0, 33.0, 28.0, 37.0, 35.0, 38.0, 54.0, 47.0, 35.0, 34.0, 48.0, 32.0, 30.0, 31.0, 31.0, 27.0, 23.0, 33.0, 23.0, 16.0, 23.0, 15.0, 18.0, 10.0, 3.0, 19.0, 8.0, 9.0, 15.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-10.890793800354004, -10.569063186645508, -10.247332572937012, -9.925602912902832, -9.603872299194336, -9.28214168548584, -8.960411071777344, -8.638680458068848, -8.316949844360352, -7.9952192306518555, -7.673489093780518, -7.3517584800720215, -7.030028343200684, -6.7082977294921875, -6.386567115783691, -6.064836502075195, -5.743106842041016, -5.4213762283325195, -5.099646091461182, -4.7779154777526855, -4.456185340881348, -4.134454727172852, -3.8127241134643555, -3.4909937381744385, -3.1692633628845215, -2.8475329875946045, -2.5258026123046875, -2.2040719985961914, -1.8823416233062744, -1.5606112480163574, -1.2388807535171509, -0.9171502590179443, -0.5954198837280273, -0.2736894488334656, 0.04804098606109619, 0.36977142095565796, 0.6915018558502197, 1.0132322311401367, 1.3349627256393433, 1.6566932201385498, 1.9784235954284668, 2.300153970718384, 2.621884346008301, 2.943614959716797, 3.265345335006714, 3.587075710296631, 3.908806324005127, 4.230536460876465, 4.552267074584961, 4.873997688293457, 5.195727825164795, 5.517458438873291, 5.839188575744629, 6.160919189453125, 6.482649803161621, 6.804380416870117, 7.126110553741455, 7.447841167449951, 7.769571304321289, 8.091301918029785, 8.413032531738281, 8.734762191772461, 9.056492805480957, 9.378223419189453, 9.69995403289795]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 6.0, 28.0, 31.0, 42.0, 68.0, 102.0, 139.0, 250.0, 372.0, 661.0, 973.0, 1628.0, 2679.0, 4341.0, 7310.0, 12330.0, 20511.0, 34167.0, 57686.0, 95419.0, 153635.0, 238944.0, 347147.0, 463416.0, 545488.0, 561958.0, 500422.0, 394208.0, 278611.0, 181774.0, 114346.0, 69873.0, 41970.0, 25374.0, 15067.0, 8996.0, 5446.0, 3348.0, 2017.0, 1249.0, 850.0, 531.0, 317.0, 187.0, 122.0, 89.0, 64.0, 35.0, 17.0, 14.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0], "bins": [-7.45703125, -7.232421875, -7.0078125, -6.783203125, -6.55859375, -6.333984375, -6.109375, -5.884765625, -5.66015625, -5.435546875, -5.2109375, -4.986328125, -4.76171875, -4.537109375, -4.3125, -4.087890625, -3.86328125, -3.638671875, -3.4140625, -3.189453125, -2.96484375, -2.740234375, -2.515625, -2.291015625, -2.06640625, -1.841796875, -1.6171875, -1.392578125, -1.16796875, -0.943359375, -0.71875, -0.494140625, -0.26953125, -0.044921875, 0.1796875, 0.404296875, 0.62890625, 0.853515625, 1.078125, 1.302734375, 1.52734375, 1.751953125, 1.9765625, 2.201171875, 2.42578125, 2.650390625, 2.875, 3.099609375, 3.32421875, 3.548828125, 3.7734375, 3.998046875, 4.22265625, 4.447265625, 4.671875, 4.896484375, 5.12109375, 5.345703125, 5.5703125, 5.794921875, 6.01953125, 6.244140625, 6.46875, 6.693359375, 6.91796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 8.0, 15.0, 15.0, 15.0, 19.0, 18.0, 16.0, 18.0, 27.0, 32.0, 30.0, 49.0, 32.0, 29.0, 43.0, 38.0, 38.0, 47.0, 44.0, 35.0, 44.0, 42.0, 26.0, 27.0, 30.0, 32.0, 26.0, 13.0, 20.0, 19.0, 26.0, 22.0, 10.0, 13.0, 8.0, 12.0, 10.0, 8.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-8.578125, -8.3184814453125, -8.058837890625, -7.7991943359375, -7.53955078125, -7.2799072265625, -7.020263671875, -6.7606201171875, -6.5009765625, -6.2413330078125, -5.981689453125, -5.7220458984375, -5.46240234375, -5.2027587890625, -4.943115234375, -4.6834716796875, -4.423828125, -4.1641845703125, -3.904541015625, -3.6448974609375, -3.38525390625, -3.1256103515625, -2.865966796875, -2.6063232421875, -2.3466796875, -2.0870361328125, -1.827392578125, -1.5677490234375, -1.30810546875, -1.0484619140625, -0.788818359375, -0.5291748046875, -0.26953125, -0.0098876953125, 0.249755859375, 0.5093994140625, 0.76904296875, 1.0286865234375, 1.288330078125, 1.5479736328125, 1.8076171875, 2.0672607421875, 2.326904296875, 2.5865478515625, 2.84619140625, 3.1058349609375, 3.365478515625, 3.6251220703125, 3.884765625, 4.1444091796875, 4.404052734375, 4.6636962890625, 4.92333984375, 5.1829833984375, 5.442626953125, 5.7022705078125, 5.9619140625, 6.2215576171875, 6.481201171875, 6.7408447265625, 7.00048828125, 7.2601318359375, 7.519775390625, 7.7794189453125, 8.0390625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 15.0, 30.0, 38.0, 77.0, 116.0, 214.0, 352.0, 654.0, 1106.0, 2082.0, 4007.0, 7139.0, 12976.0, 24416.0, 43242.0, 76630.0, 128233.0, 206265.0, 309850.0, 422667.0, 519976.0, 562899.0, 533229.0, 444061.0, 332155.0, 225072.0, 142324.0, 85031.0, 48880.0, 27433.0, 14903.0, 8282.0, 4410.0, 2454.0, 1317.0, 768.0, 399.0, 231.0, 137.0, 90.0, 50.0, 20.0, 18.0, 10.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.8076171875, -7.560546875, -7.3134765625, -7.06640625, -6.8193359375, -6.572265625, -6.3251953125, -6.078125, -5.8310546875, -5.583984375, -5.3369140625, -5.08984375, -4.8427734375, -4.595703125, -4.3486328125, -4.1015625, -3.8544921875, -3.607421875, -3.3603515625, -3.11328125, -2.8662109375, -2.619140625, -2.3720703125, -2.125, -1.8779296875, -1.630859375, -1.3837890625, -1.13671875, -0.8896484375, -0.642578125, -0.3955078125, -0.1484375, 0.0986328125, 0.345703125, 0.5927734375, 0.83984375, 1.0869140625, 1.333984375, 1.5810546875, 1.828125, 2.0751953125, 2.322265625, 2.5693359375, 2.81640625, 3.0634765625, 3.310546875, 3.5576171875, 3.8046875, 4.0517578125, 4.298828125, 4.5458984375, 4.79296875, 5.0400390625, 5.287109375, 5.5341796875, 5.78125, 6.0283203125, 6.275390625, 6.5224609375, 6.76953125, 7.0166015625, 7.263671875, 7.5107421875, 7.7578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 9.0, 7.0, 8.0, 9.0, 18.0, 29.0, 29.0, 45.0, 70.0, 84.0, 105.0, 150.0, 176.0, 200.0, 240.0, 222.0, 275.0, 259.0, 262.0, 277.0, 251.0, 230.0, 229.0, 164.0, 167.0, 120.0, 98.0, 78.0, 48.0, 52.0, 49.0, 35.0, 24.0, 14.0, 10.0, 14.0, 4.0, 10.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.919921875, -3.770172119140625, -3.62042236328125, -3.470672607421875, -3.3209228515625, -3.171173095703125, -3.02142333984375, -2.871673583984375, -2.721923828125, -2.572174072265625, -2.42242431640625, -2.272674560546875, -2.1229248046875, -1.973175048828125, -1.82342529296875, -1.673675537109375, -1.52392578125, -1.374176025390625, -1.22442626953125, -1.074676513671875, -0.9249267578125, -0.775177001953125, -0.62542724609375, -0.475677490234375, -0.325927734375, -0.176177978515625, -0.02642822265625, 0.123321533203125, 0.2730712890625, 0.422821044921875, 0.57257080078125, 0.722320556640625, 0.8720703125, 1.021820068359375, 1.17156982421875, 1.321319580078125, 1.4710693359375, 1.620819091796875, 1.77056884765625, 1.920318603515625, 2.070068359375, 2.219818115234375, 2.36956787109375, 2.519317626953125, 2.6690673828125, 2.818817138671875, 2.96856689453125, 3.118316650390625, 3.26806640625, 3.417816162109375, 3.56756591796875, 3.717315673828125, 3.8670654296875, 4.016815185546875, 4.16656494140625, 4.316314697265625, 4.466064453125, 4.615814208984375, 4.76556396484375, 4.915313720703125, 5.0650634765625, 5.214813232421875, 5.36456298828125, 5.514312744140625, 5.6640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 9.0, 8.0, 7.0, 8.0, 8.0, 18.0, 16.0, 22.0, 13.0, 21.0, 31.0, 44.0, 28.0, 41.0, 43.0, 52.0, 52.0, 34.0, 53.0, 53.0, 50.0, 37.0, 39.0, 41.0, 33.0, 32.0, 31.0, 33.0, 21.0, 25.0, 16.0, 14.0, 19.0, 11.0, 14.0, 6.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4514923095703125, -7.182847023010254, -6.914201736450195, -6.645556449890137, -6.376911163330078, -6.1082658767700195, -5.839620590209961, -5.570975303649902, -5.302330017089844, -5.033684730529785, -4.765039443969727, -4.496394157409668, -4.227748870849609, -3.959103584289551, -3.690458297729492, -3.4218130111694336, -3.153167724609375, -2.8845224380493164, -2.615877151489258, -2.347231864929199, -2.0785865783691406, -1.809941291809082, -1.5412960052490234, -1.2726507186889648, -1.0040054321289062, -0.7353601455688477, -0.46671485900878906, -0.19806957244873047, 0.07057571411132812, 0.3392210006713867, 0.6078662872314453, 0.8765115737915039, 1.1451568603515625, 1.413802146911621, 1.6824474334716797, 1.9510927200317383, 2.219738006591797, 2.4883832931518555, 2.757028579711914, 3.0256738662719727, 3.2943191528320312, 3.56296443939209, 3.8316097259521484, 4.100255012512207, 4.368900299072266, 4.637545585632324, 4.906190872192383, 5.174836158752441, 5.4434814453125, 5.712126731872559, 5.980772018432617, 6.249417304992676, 6.518062591552734, 6.786707878112793, 7.055353164672852, 7.32399845123291, 7.592643737792969, 7.861289024353027, 8.129934310913086, 8.398579597473145, 8.667224884033203, 8.935870170593262, 9.20451545715332, 9.473160743713379, 9.741806030273438]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 7.0, 10.0, 10.0, 16.0, 26.0, 10.0, 16.0, 22.0, 27.0, 18.0, 29.0, 28.0, 35.0, 37.0, 34.0, 36.0, 44.0, 43.0, 40.0, 47.0, 40.0, 49.0, 42.0, 38.0, 40.0, 31.0, 24.0, 26.0, 29.0, 20.0, 16.0, 18.0, 15.0, 16.0, 12.0, 5.0, 5.0, 9.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.997974395751953, -9.673428535461426, -9.348882675170898, -9.024337768554688, -8.69979190826416, -8.375246047973633, -8.050700187683105, -7.726154327392578, -7.401608467102051, -7.077062606811523, -6.752517223358154, -6.427971363067627, -6.1034255027771, -5.7788801193237305, -5.454334259033203, -5.129788398742676, -4.805243015289307, -4.480697154998779, -4.15615177154541, -3.831605911254883, -3.5070600509643555, -3.1825144290924072, -2.857968807220459, -2.5334229469299316, -2.2088773250579834, -1.8843315839767456, -1.5597858428955078, -1.2352402210235596, -0.9106944799423218, -0.586148738861084, -0.26160311698913574, 0.0629427433013916, 0.38748836517333984, 0.7120341062545776, 1.0365798473358154, 1.3611254692077637, 1.6856712102890015, 2.0102169513702393, 2.3347625732421875, 2.659308433532715, 2.983854055404663, 3.3083996772766113, 3.6329455375671387, 3.957491159439087, 4.282036781311035, 4.6065826416015625, 4.93112850189209, 5.255674362182617, 5.580219745635986, 5.904765605926514, 6.229310989379883, 6.55385684967041, 6.8784027099609375, 7.202948570251465, 7.527493953704834, 7.852039813995361, 8.17658519744873, 8.501131057739258, 8.825676918029785, 9.150222778320312, 9.474767684936523, 9.79931354522705, 10.123859405517578, 10.448405265808105, 10.772951126098633]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 11.0, 13.0, 10.0, 28.0, 41.0, 60.0, 83.0, 105.0, 180.0, 262.0, 386.0, 558.0, 913.0, 1547.0, 2615.0, 4945.0, 10341.0, 21965.0, 47870.0, 102610.0, 193939.0, 254771.0, 200179.0, 108480.0, 50570.0, 23085.0, 10613.0, 5222.0, 2827.0, 1602.0, 1000.0, 598.0, 359.0, 229.0, 178.0, 117.0, 83.0, 46.0, 34.0, 31.0, 17.0, 11.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.43359375, -4.28839111328125, -4.1431884765625, -3.99798583984375, -3.852783203125, -3.70758056640625, -3.5623779296875, -3.41717529296875, -3.27197265625, -3.12677001953125, -2.9815673828125, -2.83636474609375, -2.691162109375, -2.54595947265625, -2.4007568359375, -2.25555419921875, -2.1103515625, -1.96514892578125, -1.8199462890625, -1.67474365234375, -1.529541015625, -1.38433837890625, -1.2391357421875, -1.09393310546875, -0.94873046875, -0.80352783203125, -0.6583251953125, -0.51312255859375, -0.367919921875, -0.22271728515625, -0.0775146484375, 0.06768798828125, 0.212890625, 0.35809326171875, 0.5032958984375, 0.64849853515625, 0.793701171875, 0.93890380859375, 1.0841064453125, 1.22930908203125, 1.37451171875, 1.51971435546875, 1.6649169921875, 1.81011962890625, 1.955322265625, 2.10052490234375, 2.2457275390625, 2.39093017578125, 2.5361328125, 2.68133544921875, 2.8265380859375, 2.97174072265625, 3.116943359375, 3.26214599609375, 3.4073486328125, 3.55255126953125, 3.69775390625, 3.84295654296875, 3.9881591796875, 4.13336181640625, 4.278564453125, 4.42376708984375, 4.5689697265625, 4.71417236328125, 4.859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 10.0, 12.0, 14.0, 14.0, 22.0, 14.0, 18.0, 25.0, 30.0, 31.0, 28.0, 29.0, 36.0, 38.0, 49.0, 55.0, 47.0, 47.0, 43.0, 46.0, 41.0, 40.0, 38.0, 34.0, 35.0, 20.0, 33.0, 20.0, 24.0, 19.0, 18.0, 13.0, 12.0, 8.0, 9.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.46875, -9.110107421875, -8.75146484375, -8.392822265625, -8.0341796875, -7.675537109375, -7.31689453125, -6.958251953125, -6.599609375, -6.240966796875, -5.88232421875, -5.523681640625, -5.1650390625, -4.806396484375, -4.44775390625, -4.089111328125, -3.73046875, -3.371826171875, -3.01318359375, -2.654541015625, -2.2958984375, -1.937255859375, -1.57861328125, -1.219970703125, -0.861328125, -0.502685546875, -0.14404296875, 0.214599609375, 0.5732421875, 0.931884765625, 1.29052734375, 1.649169921875, 2.0078125, 2.366455078125, 2.72509765625, 3.083740234375, 3.4423828125, 3.801025390625, 4.15966796875, 4.518310546875, 4.876953125, 5.235595703125, 5.59423828125, 5.952880859375, 6.3115234375, 6.670166015625, 7.02880859375, 7.387451171875, 7.74609375, 8.104736328125, 8.46337890625, 8.822021484375, 9.1806640625, 9.539306640625, 9.89794921875, 10.256591796875, 10.615234375, 10.973876953125, 11.33251953125, 11.691162109375, 12.0498046875, 12.408447265625, 12.76708984375, 13.125732421875, 13.484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 9.0, 21.0, 8.0, 30.0, 30.0, 61.0, 81.0, 120.0, 194.0, 253.0, 472.0, 795.0, 1514.0, 3185.0, 7374.0, 19345.0, 58170.0, 179749.0, 360745.0, 268782.0, 96380.0, 31091.0, 10974.0, 4533.0, 2092.0, 1021.0, 591.0, 341.0, 195.0, 128.0, 94.0, 53.0, 35.0, 24.0, 16.0, 12.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.072998046875, -6.88037109375, -6.687744140625, -6.4951171875, -6.302490234375, -6.10986328125, -5.917236328125, -5.724609375, -5.531982421875, -5.33935546875, -5.146728515625, -4.9541015625, -4.761474609375, -4.56884765625, -4.376220703125, -4.18359375, -3.990966796875, -3.79833984375, -3.605712890625, -3.4130859375, -3.220458984375, -3.02783203125, -2.835205078125, -2.642578125, -2.449951171875, -2.25732421875, -2.064697265625, -1.8720703125, -1.679443359375, -1.48681640625, -1.294189453125, -1.1015625, -0.908935546875, -0.71630859375, -0.523681640625, -0.3310546875, -0.138427734375, 0.05419921875, 0.246826171875, 0.439453125, 0.632080078125, 0.82470703125, 1.017333984375, 1.2099609375, 1.402587890625, 1.59521484375, 1.787841796875, 1.98046875, 2.173095703125, 2.36572265625, 2.558349609375, 2.7509765625, 2.943603515625, 3.13623046875, 3.328857421875, 3.521484375, 3.714111328125, 3.90673828125, 4.099365234375, 4.2919921875, 4.484619140625, 4.67724609375, 4.869873046875, 5.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 4.0, 10.0, 19.0, 12.0, 13.0, 18.0, 24.0, 15.0, 30.0, 32.0, 30.0, 37.0, 40.0, 46.0, 45.0, 44.0, 49.0, 43.0, 66.0, 39.0, 35.0, 49.0, 40.0, 33.0, 33.0, 22.0, 31.0, 22.0, 18.0, 15.0, 14.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05859375, -6.8297119140625, -6.600830078125, -6.3719482421875, -6.14306640625, -5.9141845703125, -5.685302734375, -5.4564208984375, -5.2275390625, -4.9986572265625, -4.769775390625, -4.5408935546875, -4.31201171875, -4.0831298828125, -3.854248046875, -3.6253662109375, -3.396484375, -3.1676025390625, -2.938720703125, -2.7098388671875, -2.48095703125, -2.2520751953125, -2.023193359375, -1.7943115234375, -1.5654296875, -1.3365478515625, -1.107666015625, -0.8787841796875, -0.64990234375, -0.4210205078125, -0.192138671875, 0.0367431640625, 0.265625, 0.4945068359375, 0.723388671875, 0.9522705078125, 1.18115234375, 1.4100341796875, 1.638916015625, 1.8677978515625, 2.0966796875, 2.3255615234375, 2.554443359375, 2.7833251953125, 3.01220703125, 3.2410888671875, 3.469970703125, 3.6988525390625, 3.927734375, 4.1566162109375, 4.385498046875, 4.6143798828125, 4.84326171875, 5.0721435546875, 5.301025390625, 5.5299072265625, 5.7587890625, 5.9876708984375, 6.216552734375, 6.4454345703125, 6.67431640625, 6.9031982421875, 7.132080078125, 7.3609619140625, 7.58984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 10.0, 7.0, 12.0, 14.0, 14.0, 34.0, 30.0, 49.0, 56.0, 96.0, 148.0, 163.0, 251.0, 345.0, 537.0, 808.0, 1352.0, 2314.0, 4760.0, 12857.0, 63887.0, 556339.0, 346993.0, 38485.0, 9485.0, 3902.0, 1971.0, 1199.0, 761.0, 485.0, 332.0, 221.0, 158.0, 122.0, 85.0, 75.0, 52.0, 36.0, 21.0, 24.0, 21.0, 12.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.96954345703125, -2.8590087890625, -2.74847412109375, -2.637939453125, -2.52740478515625, -2.4168701171875, -2.30633544921875, -2.19580078125, -2.08526611328125, -1.9747314453125, -1.86419677734375, -1.753662109375, -1.64312744140625, -1.5325927734375, -1.42205810546875, -1.3115234375, -1.20098876953125, -1.0904541015625, -0.97991943359375, -0.869384765625, -0.75885009765625, -0.6483154296875, -0.53778076171875, -0.42724609375, -0.31671142578125, -0.2061767578125, -0.09564208984375, 0.014892578125, 0.12542724609375, 0.2359619140625, 0.34649658203125, 0.45703125, 0.56756591796875, 0.6781005859375, 0.78863525390625, 0.899169921875, 1.00970458984375, 1.1202392578125, 1.23077392578125, 1.34130859375, 1.45184326171875, 1.5623779296875, 1.67291259765625, 1.783447265625, 1.89398193359375, 2.0045166015625, 2.11505126953125, 2.2255859375, 2.33612060546875, 2.4466552734375, 2.55718994140625, 2.667724609375, 2.77825927734375, 2.8887939453125, 2.99932861328125, 3.10986328125, 3.22039794921875, 3.3309326171875, 3.44146728515625, 3.552001953125, 3.66253662109375, 3.7730712890625, 3.88360595703125, 3.994140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 8.0, 11.0, 17.0, 11.0, 26.0, 35.0, 62.0, 102.0, 137.0, 188.0, 136.0, 99.0, 50.0, 42.0, 23.0, 14.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021875649690628052, -0.00021220743656158447, -0.00020565837621688843, -0.00019910931587219238, -0.00019256025552749634, -0.0001860111951828003, -0.00017946213483810425, -0.0001729130744934082, -0.00016636401414871216, -0.0001598149538040161, -0.00015326589345932007, -0.00014671683311462402, -0.00014016777276992798, -0.00013361871242523193, -0.0001270696520805359, -0.00012052059173583984, -0.0001139715313911438, -0.00010742247104644775, -0.00010087341070175171, -9.432435035705566e-05, -8.777529001235962e-05, -8.122622966766357e-05, -7.467716932296753e-05, -6.812810897827148e-05, -6.157904863357544e-05, -5.5029988288879395e-05, -4.848092794418335e-05, -4.1931867599487305e-05, -3.538280725479126e-05, -2.8833746910095215e-05, -2.228468656539917e-05, -1.5735626220703125e-05, -9.18656587600708e-06, -2.637505531311035e-06, 3.91155481338501e-06, 1.0460615158081055e-05, 1.70096755027771e-05, 2.3558735847473145e-05, 3.010779619216919e-05, 3.6656856536865234e-05, 4.320591688156128e-05, 4.9754977226257324e-05, 5.630403757095337e-05, 6.285309791564941e-05, 6.940215826034546e-05, 7.59512186050415e-05, 8.250027894973755e-05, 8.90493392944336e-05, 9.559839963912964e-05, 0.00010214745998382568, 0.00010869652032852173, 0.00011524558067321777, 0.00012179464101791382, 0.00012834370136260986, 0.0001348927617073059, 0.00014144182205200195, 0.000147990882396698, 0.00015453994274139404, 0.0001610890030860901, 0.00016763806343078613, 0.00017418712377548218, 0.00018073618412017822, 0.00018728524446487427, 0.0001938343048095703]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 5.0, 12.0, 23.0, 34.0, 27.0, 41.0, 49.0, 66.0, 98.0, 123.0, 175.0, 239.0, 314.0, 462.0, 711.0, 966.0, 1483.0, 2258.0, 3664.0, 6517.0, 13650.0, 35873.0, 129976.0, 403587.0, 311173.0, 85592.0, 25944.0, 10619.0, 5523.0, 3192.0, 1956.0, 1186.0, 840.0, 578.0, 420.0, 295.0, 232.0, 159.0, 124.0, 84.0, 83.0, 57.0, 43.0, 26.0, 27.0, 14.0, 12.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.04296875, -2.947418212890625, -2.85186767578125, -2.756317138671875, -2.6607666015625, -2.565216064453125, -2.46966552734375, -2.374114990234375, -2.278564453125, -2.183013916015625, -2.08746337890625, -1.991912841796875, -1.8963623046875, -1.800811767578125, -1.70526123046875, -1.609710693359375, -1.51416015625, -1.418609619140625, -1.32305908203125, -1.227508544921875, -1.1319580078125, -1.036407470703125, -0.94085693359375, -0.845306396484375, -0.749755859375, -0.654205322265625, -0.55865478515625, -0.463104248046875, -0.3675537109375, -0.272003173828125, -0.17645263671875, -0.080902099609375, 0.0146484375, 0.110198974609375, 0.20574951171875, 0.301300048828125, 0.3968505859375, 0.492401123046875, 0.58795166015625, 0.683502197265625, 0.779052734375, 0.874603271484375, 0.97015380859375, 1.065704345703125, 1.1612548828125, 1.256805419921875, 1.35235595703125, 1.447906494140625, 1.54345703125, 1.639007568359375, 1.73455810546875, 1.830108642578125, 1.9256591796875, 2.021209716796875, 2.11676025390625, 2.212310791015625, 2.307861328125, 2.403411865234375, 2.49896240234375, 2.594512939453125, 2.6900634765625, 2.785614013671875, 2.88116455078125, 2.976715087890625, 3.072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 7.0, 4.0, 9.0, 11.0, 11.0, 8.0, 39.0, 59.0, 93.0, 146.0, 185.0, 145.0, 100.0, 59.0, 36.0, 12.0, 11.0, 13.0, 7.0, 4.0, 5.0, 10.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5087890625, -1.462493896484375, -1.41619873046875, -1.369903564453125, -1.3236083984375, -1.277313232421875, -1.23101806640625, -1.184722900390625, -1.138427734375, -1.092132568359375, -1.04583740234375, -0.999542236328125, -0.9532470703125, -0.906951904296875, -0.86065673828125, -0.814361572265625, -0.76806640625, -0.721771240234375, -0.67547607421875, -0.629180908203125, -0.5828857421875, -0.536590576171875, -0.49029541015625, -0.444000244140625, -0.397705078125, -0.351409912109375, -0.30511474609375, -0.258819580078125, -0.2125244140625, -0.166229248046875, -0.11993408203125, -0.073638916015625, -0.02734375, 0.018951416015625, 0.06524658203125, 0.111541748046875, 0.1578369140625, 0.204132080078125, 0.25042724609375, 0.296722412109375, 0.343017578125, 0.389312744140625, 0.43560791015625, 0.481903076171875, 0.5281982421875, 0.574493408203125, 0.62078857421875, 0.667083740234375, 0.71337890625, 0.759674072265625, 0.80596923828125, 0.852264404296875, 0.8985595703125, 0.944854736328125, 0.99114990234375, 1.037445068359375, 1.083740234375, 1.130035400390625, 1.17633056640625, 1.222625732421875, 1.2689208984375, 1.315216064453125, 1.36151123046875, 1.407806396484375, 1.4541015625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 6.0, 9.0, 6.0, 11.0, 12.0, 19.0, 22.0, 14.0, 29.0, 29.0, 30.0, 32.0, 54.0, 52.0, 50.0, 55.0, 45.0, 43.0, 42.0, 50.0, 50.0, 48.0, 37.0, 35.0, 31.0, 29.0, 26.0, 19.0, 24.0, 23.0, 8.0, 17.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.953832626342773, -7.675090789794922, -7.39634895324707, -7.117607116699219, -6.838865280151367, -6.560123443603516, -6.281382083892822, -6.002640247344971, -5.723898410797119, -5.445156574249268, -5.166414737701416, -4.8876729011535645, -4.608931541442871, -4.3301897048950195, -4.051447868347168, -3.7727060317993164, -3.493964195251465, -3.2152223587036133, -2.9364805221557617, -2.6577389240264893, -2.3789970874786377, -2.100255250930786, -1.8215135335922241, -1.542771816253662, -1.2640299797058105, -0.9852882027626038, -0.706546425819397, -0.4278046488761902, -0.1490628719329834, 0.12967896461486816, 0.4084206819534302, 0.6871623992919922, 0.9659042358398438, 1.2446460723876953, 1.5233877897262573, 1.8021295070648193, 2.080871343612671, 2.3596131801605225, 2.638354778289795, 2.9170966148376465, 3.195838451385498, 3.4745802879333496, 3.753322124481201, 4.032063961029053, 4.310805320739746, 4.589547157287598, 4.868288993835449, 5.147030830383301, 5.425772666931152, 5.704514503479004, 5.9832563400268555, 6.261998176574707, 6.540740013122559, 6.81948184967041, 7.0982232093811035, 7.376965045928955, 7.655706882476807, 7.934448719024658, 8.213190078735352, 8.491931915283203, 8.770673751831055, 9.049415588378906, 9.328157424926758, 9.60689926147461, 9.885641098022461]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 10.0, 5.0, 11.0, 8.0, 20.0, 20.0, 11.0, 18.0, 22.0, 21.0, 24.0, 21.0, 34.0, 32.0, 28.0, 43.0, 37.0, 36.0, 57.0, 42.0, 39.0, 42.0, 54.0, 33.0, 40.0, 40.0, 30.0, 31.0, 30.0, 29.0, 18.0, 15.0, 16.0, 16.0, 16.0, 8.0, 10.0, 3.0, 8.0, 8.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.035689353942871, -9.710077285766602, -9.384464263916016, -9.05885124206543, -8.73323917388916, -8.40762710571289, -8.082014083862305, -7.756401538848877, -7.430788993835449, -7.1051764488220215, -6.779563903808594, -6.453951358795166, -6.128338813781738, -5.8027262687683105, -5.477113723754883, -5.151501178741455, -4.825888633728027, -4.5002760887146, -4.174663543701172, -3.849050998687744, -3.5234384536743164, -3.1978259086608887, -2.872213363647461, -2.546600818634033, -2.2209882736206055, -1.8953757286071777, -1.56976318359375, -1.2441506385803223, -0.9185380935668945, -0.5929255485534668, -0.26731300354003906, 0.05829954147338867, 0.3839120864868164, 0.7095246315002441, 1.0351371765136719, 1.3607497215270996, 1.6863622665405273, 2.011974811553955, 2.337587356567383, 2.6631999015808105, 2.9888124465942383, 3.314424991607666, 3.6400375366210938, 3.9656500816345215, 4.291262626647949, 4.616875171661377, 4.942487716674805, 5.268100261688232, 5.59371280670166, 5.919325351715088, 6.244937896728516, 6.570550441741943, 6.896162986755371, 7.221775531768799, 7.547388076782227, 7.873000621795654, 8.198613166809082, 8.524225234985352, 8.849838256835938, 9.175451278686523, 9.501063346862793, 9.826675415039062, 10.152288436889648, 10.477901458740234, 10.803513526916504]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 19.0, 18.0, 37.0, 42.0, 62.0, 100.0, 186.0, 285.0, 419.0, 603.0, 880.0, 1333.0, 2287.0, 3352.0, 5225.0, 8196.0, 12246.0, 18893.0, 27367.0, 39194.0, 54056.0, 71234.0, 86397.0, 100763.0, 106773.0, 105744.0, 96367.0, 82524.0, 66028.0, 49155.0, 35743.0, 24827.0, 16585.0, 11007.0, 7291.0, 4715.0, 2982.0, 1944.0, 1278.0, 819.0, 547.0, 353.0, 243.0, 149.0, 87.0, 72.0, 43.0, 33.0, 21.0, 13.0, 10.0, 6.0, 1.0, 0.0, 1.0], "bins": [-6.15625, -5.97442626953125, -5.7926025390625, -5.61077880859375, -5.428955078125, -5.24713134765625, -5.0653076171875, -4.88348388671875, -4.70166015625, -4.51983642578125, -4.3380126953125, -4.15618896484375, -3.974365234375, -3.79254150390625, -3.6107177734375, -3.42889404296875, -3.2470703125, -3.06524658203125, -2.8834228515625, -2.70159912109375, -2.519775390625, -2.33795166015625, -2.1561279296875, -1.97430419921875, -1.79248046875, -1.61065673828125, -1.4288330078125, -1.24700927734375, -1.065185546875, -0.88336181640625, -0.7015380859375, -0.51971435546875, -0.337890625, -0.15606689453125, 0.0257568359375, 0.20758056640625, 0.389404296875, 0.57122802734375, 0.7530517578125, 0.93487548828125, 1.11669921875, 1.29852294921875, 1.4803466796875, 1.66217041015625, 1.843994140625, 2.02581787109375, 2.2076416015625, 2.38946533203125, 2.5712890625, 2.75311279296875, 2.9349365234375, 3.11676025390625, 3.298583984375, 3.48040771484375, 3.6622314453125, 3.84405517578125, 4.02587890625, 4.20770263671875, 4.3895263671875, 4.57135009765625, 4.753173828125, 4.93499755859375, 5.1168212890625, 5.29864501953125, 5.48046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 8.0, 6.0, 12.0, 15.0, 21.0, 18.0, 17.0, 17.0, 20.0, 20.0, 22.0, 30.0, 36.0, 40.0, 34.0, 36.0, 30.0, 36.0, 42.0, 53.0, 53.0, 38.0, 38.0, 40.0, 32.0, 36.0, 36.0, 26.0, 26.0, 14.0, 18.0, 20.0, 20.0, 12.0, 12.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.671875, -9.3604736328125, -9.049072265625, -8.7376708984375, -8.42626953125, -8.1148681640625, -7.803466796875, -7.4920654296875, -7.1806640625, -6.8692626953125, -6.557861328125, -6.2464599609375, -5.93505859375, -5.6236572265625, -5.312255859375, -5.0008544921875, -4.689453125, -4.3780517578125, -4.066650390625, -3.7552490234375, -3.44384765625, -3.1324462890625, -2.821044921875, -2.5096435546875, -2.1982421875, -1.8868408203125, -1.575439453125, -1.2640380859375, -0.95263671875, -0.6412353515625, -0.329833984375, -0.0184326171875, 0.29296875, 0.6043701171875, 0.915771484375, 1.2271728515625, 1.53857421875, 1.8499755859375, 2.161376953125, 2.4727783203125, 2.7841796875, 3.0955810546875, 3.406982421875, 3.7183837890625, 4.02978515625, 4.3411865234375, 4.652587890625, 4.9639892578125, 5.275390625, 5.5867919921875, 5.898193359375, 6.2095947265625, 6.52099609375, 6.8323974609375, 7.143798828125, 7.4552001953125, 7.7666015625, 8.0780029296875, 8.389404296875, 8.7008056640625, 9.01220703125, 9.3236083984375, 9.635009765625, 9.9464111328125, 10.2578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 7.0, 3.0, 7.0, 11.0, 21.0, 20.0, 44.0, 69.0, 117.0, 166.0, 257.0, 385.0, 583.0, 922.0, 1306.0, 2056.0, 3014.0, 4712.0, 6982.0, 10261.0, 15405.0, 22097.0, 31417.0, 43546.0, 58176.0, 73158.0, 88066.0, 98706.0, 102514.0, 99449.0, 90942.0, 76444.0, 61761.0, 46394.0, 34038.0, 24455.0, 16900.0, 11442.0, 7704.0, 5059.0, 3429.0, 2262.0, 1428.0, 918.0, 607.0, 459.0, 302.0, 180.0, 128.0, 83.0, 60.0, 35.0, 25.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.76953125, -5.5926513671875, -5.415771484375, -5.2388916015625, -5.06201171875, -4.8851318359375, -4.708251953125, -4.5313720703125, -4.3544921875, -4.1776123046875, -4.000732421875, -3.8238525390625, -3.64697265625, -3.4700927734375, -3.293212890625, -3.1163330078125, -2.939453125, -2.7625732421875, -2.585693359375, -2.4088134765625, -2.23193359375, -2.0550537109375, -1.878173828125, -1.7012939453125, -1.5244140625, -1.3475341796875, -1.170654296875, -0.9937744140625, -0.81689453125, -0.6400146484375, -0.463134765625, -0.2862548828125, -0.109375, 0.0675048828125, 0.244384765625, 0.4212646484375, 0.59814453125, 0.7750244140625, 0.951904296875, 1.1287841796875, 1.3056640625, 1.4825439453125, 1.659423828125, 1.8363037109375, 2.01318359375, 2.1900634765625, 2.366943359375, 2.5438232421875, 2.720703125, 2.8975830078125, 3.074462890625, 3.2513427734375, 3.42822265625, 3.6051025390625, 3.781982421875, 3.9588623046875, 4.1357421875, 4.3126220703125, 4.489501953125, 4.6663818359375, 4.84326171875, 5.0201416015625, 5.197021484375, 5.3739013671875, 5.55078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 10.0, 8.0, 12.0, 10.0, 12.0, 19.0, 15.0, 15.0, 20.0, 16.0, 27.0, 30.0, 28.0, 33.0, 35.0, 42.0, 36.0, 37.0, 46.0, 47.0, 31.0, 40.0, 39.0, 36.0, 36.0, 30.0, 26.0, 20.0, 33.0, 21.0, 29.0, 12.0, 20.0, 19.0, 14.0, 19.0, 10.0, 9.0, 8.0, 8.0, 7.0, 7.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.559814453125, -5.37353515625, -5.187255859375, -5.0009765625, -4.814697265625, -4.62841796875, -4.442138671875, -4.255859375, -4.069580078125, -3.88330078125, -3.697021484375, -3.5107421875, -3.324462890625, -3.13818359375, -2.951904296875, -2.765625, -2.579345703125, -2.39306640625, -2.206787109375, -2.0205078125, -1.834228515625, -1.64794921875, -1.461669921875, -1.275390625, -1.089111328125, -0.90283203125, -0.716552734375, -0.5302734375, -0.343994140625, -0.15771484375, 0.028564453125, 0.21484375, 0.401123046875, 0.58740234375, 0.773681640625, 0.9599609375, 1.146240234375, 1.33251953125, 1.518798828125, 1.705078125, 1.891357421875, 2.07763671875, 2.263916015625, 2.4501953125, 2.636474609375, 2.82275390625, 3.009033203125, 3.1953125, 3.381591796875, 3.56787109375, 3.754150390625, 3.9404296875, 4.126708984375, 4.31298828125, 4.499267578125, 4.685546875, 4.871826171875, 5.05810546875, 5.244384765625, 5.4306640625, 5.616943359375, 5.80322265625, 5.989501953125, 6.17578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 11.0, 18.0, 15.0, 29.0, 36.0, 50.0, 58.0, 101.0, 121.0, 166.0, 234.0, 361.0, 505.0, 687.0, 1032.0, 1748.0, 2547.0, 4062.0, 6934.0, 11955.0, 21054.0, 36859.0, 63006.0, 98728.0, 137241.0, 161400.0, 156849.0, 126141.0, 87662.0, 53605.0, 31089.0, 17692.0, 10299.0, 5949.0, 3611.0, 2171.0, 1411.0, 967.0, 607.0, 448.0, 313.0, 192.0, 168.0, 124.0, 90.0, 57.0, 49.0, 36.0, 20.0, 17.0, 12.0, 10.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0], "bins": [-3.310546875, -3.20660400390625, -3.1026611328125, -2.99871826171875, -2.894775390625, -2.79083251953125, -2.6868896484375, -2.58294677734375, -2.47900390625, -2.37506103515625, -2.2711181640625, -2.16717529296875, -2.063232421875, -1.95928955078125, -1.8553466796875, -1.75140380859375, -1.6474609375, -1.54351806640625, -1.4395751953125, -1.33563232421875, -1.231689453125, -1.12774658203125, -1.0238037109375, -0.91986083984375, -0.81591796875, -0.71197509765625, -0.6080322265625, -0.50408935546875, -0.400146484375, -0.29620361328125, -0.1922607421875, -0.08831787109375, 0.015625, 0.11956787109375, 0.2235107421875, 0.32745361328125, 0.431396484375, 0.53533935546875, 0.6392822265625, 0.74322509765625, 0.84716796875, 0.95111083984375, 1.0550537109375, 1.15899658203125, 1.262939453125, 1.36688232421875, 1.4708251953125, 1.57476806640625, 1.6787109375, 1.78265380859375, 1.8865966796875, 1.99053955078125, 2.094482421875, 2.19842529296875, 2.3023681640625, 2.40631103515625, 2.51025390625, 2.61419677734375, 2.7181396484375, 2.82208251953125, 2.926025390625, 3.02996826171875, 3.1339111328125, 3.23785400390625, 3.341796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 9.0, 17.0, 15.0, 18.0, 24.0, 24.0, 22.0, 42.0, 49.0, 46.0, 63.0, 55.0, 53.0, 58.0, 53.0, 48.0, 51.0, 53.0, 59.0, 36.0, 39.0, 25.0, 27.0, 18.0, 16.0, 12.0, 16.0, 15.0, 9.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002980232238769531, -0.00028768181800842285, -0.0002773404121398926, -0.0002669990062713623, -0.00025665760040283203, -0.00024631619453430176, -0.00023597478866577148, -0.0002256333827972412, -0.00021529197692871094, -0.00020495057106018066, -0.0001946091651916504, -0.00018426775932312012, -0.00017392635345458984, -0.00016358494758605957, -0.0001532435417175293, -0.00014290213584899902, -0.00013256072998046875, -0.00012221932411193848, -0.0001118779182434082, -0.00010153651237487793, -9.119510650634766e-05, -8.085370063781738e-05, -7.051229476928711e-05, -6.0170888900756836e-05, -4.982948303222656e-05, -3.948807716369629e-05, -2.9146671295166016e-05, -1.8805265426635742e-05, -8.463859558105469e-06, 1.8775463104248047e-06, 1.2218952178955078e-05, 2.256035804748535e-05, 3.2901763916015625e-05, 4.32431697845459e-05, 5.358457565307617e-05, 6.392598152160645e-05, 7.426738739013672e-05, 8.460879325866699e-05, 9.495019912719727e-05, 0.00010529160499572754, 0.00011563301086425781, 0.00012597441673278809, 0.00013631582260131836, 0.00014665722846984863, 0.0001569986343383789, 0.00016734004020690918, 0.00017768144607543945, 0.00018802285194396973, 0.0001983642578125, 0.00020870566368103027, 0.00021904706954956055, 0.00022938847541809082, 0.0002397298812866211, 0.00025007128715515137, 0.00026041269302368164, 0.0002707540988922119, 0.0002810955047607422, 0.00029143691062927246, 0.00030177831649780273, 0.000312119722366333, 0.0003224611282348633, 0.00033280253410339355, 0.00034314393997192383, 0.0003534853458404541, 0.0003638267517089844]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 6.0, 8.0, 14.0, 20.0, 12.0, 20.0, 33.0, 47.0, 82.0, 70.0, 132.0, 215.0, 338.0, 485.0, 819.0, 1500.0, 2716.0, 5835.0, 11803.0, 26254.0, 56824.0, 111135.0, 180368.0, 218661.0, 189056.0, 121887.0, 63350.0, 29995.0, 13477.0, 6178.0, 2999.0, 1638.0, 996.0, 550.0, 324.0, 212.0, 147.0, 110.0, 71.0, 50.0, 37.0, 18.0, 18.0, 15.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.53125, -4.383056640625, -4.23486328125, -4.086669921875, -3.9384765625, -3.790283203125, -3.64208984375, -3.493896484375, -3.345703125, -3.197509765625, -3.04931640625, -2.901123046875, -2.7529296875, -2.604736328125, -2.45654296875, -2.308349609375, -2.16015625, -2.011962890625, -1.86376953125, -1.715576171875, -1.5673828125, -1.419189453125, -1.27099609375, -1.122802734375, -0.974609375, -0.826416015625, -0.67822265625, -0.530029296875, -0.3818359375, -0.233642578125, -0.08544921875, 0.062744140625, 0.2109375, 0.359130859375, 0.50732421875, 0.655517578125, 0.8037109375, 0.951904296875, 1.10009765625, 1.248291015625, 1.396484375, 1.544677734375, 1.69287109375, 1.841064453125, 1.9892578125, 2.137451171875, 2.28564453125, 2.433837890625, 2.58203125, 2.730224609375, 2.87841796875, 3.026611328125, 3.1748046875, 3.322998046875, 3.47119140625, 3.619384765625, 3.767578125, 3.915771484375, 4.06396484375, 4.212158203125, 4.3603515625, 4.508544921875, 4.65673828125, 4.804931640625, 4.953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 15.0, 14.0, 17.0, 12.0, 18.0, 33.0, 39.0, 43.0, 42.0, 59.0, 62.0, 78.0, 77.0, 63.0, 55.0, 53.0, 50.0, 42.0, 45.0, 30.0, 19.0, 12.0, 17.0, 11.0, 14.0, 11.0, 8.0, 6.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.975860595703125, -1.90875244140625, -1.841644287109375, -1.7745361328125, -1.707427978515625, -1.64031982421875, -1.573211669921875, -1.506103515625, -1.438995361328125, -1.37188720703125, -1.304779052734375, -1.2376708984375, -1.170562744140625, -1.10345458984375, -1.036346435546875, -0.96923828125, -0.902130126953125, -0.83502197265625, -0.767913818359375, -0.7008056640625, -0.633697509765625, -0.56658935546875, -0.499481201171875, -0.432373046875, -0.365264892578125, -0.29815673828125, -0.231048583984375, -0.1639404296875, -0.096832275390625, -0.02972412109375, 0.037384033203125, 0.1044921875, 0.171600341796875, 0.23870849609375, 0.305816650390625, 0.3729248046875, 0.440032958984375, 0.50714111328125, 0.574249267578125, 0.641357421875, 0.708465576171875, 0.77557373046875, 0.842681884765625, 0.9097900390625, 0.976898193359375, 1.04400634765625, 1.111114501953125, 1.17822265625, 1.245330810546875, 1.31243896484375, 1.379547119140625, 1.4466552734375, 1.513763427734375, 1.58087158203125, 1.647979736328125, 1.715087890625, 1.782196044921875, 1.84930419921875, 1.916412353515625, 1.9835205078125, 2.050628662109375, 2.11773681640625, 2.184844970703125, 2.251953125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 13.0, 11.0, 16.0, 15.0, 21.0, 25.0, 27.0, 35.0, 37.0, 41.0, 44.0, 52.0, 43.0, 38.0, 47.0, 59.0, 44.0, 40.0, 51.0, 55.0, 42.0, 33.0, 27.0, 24.0, 20.0, 17.0, 25.0, 20.0, 20.0, 7.0, 14.0, 10.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.537844181060791, -7.249553203582764, -6.961262226104736, -6.672971248626709, -6.384680271148682, -6.096389293670654, -5.808098793029785, -5.519807815551758, -5.2315168380737305, -4.943225860595703, -4.654934883117676, -4.366643905639648, -4.078352928161621, -3.7900619506835938, -3.5017712116241455, -3.213480234146118, -2.9251890182495117, -2.6368980407714844, -2.348607063293457, -2.0603160858154297, -1.772025227546692, -1.4837342500686646, -1.1954433917999268, -0.9071524143218994, -0.6188614368438721, -0.3305704891681671, -0.04227954149246216, 0.2460113763809204, 0.5343023538589478, 0.8225933313369751, 1.110884189605713, 1.3991751670837402, 1.6874656677246094, 1.9757566452026367, 2.264047622680664, 2.5523386001586914, 2.8406295776367188, 3.128920555114746, 3.4172112941741943, 3.7055022716522217, 3.993793249130249, 4.282083988189697, 4.570374965667725, 4.858665943145752, 5.146956920623779, 5.435247898101807, 5.723538875579834, 6.011829853057861, 6.300120830535889, 6.588411808013916, 6.876702785491943, 7.164993762969971, 7.453284740447998, 7.741575717926025, 8.029866218566895, 8.318157196044922, 8.60644817352295, 8.894739151000977, 9.183030128479004, 9.471321105957031, 9.759612083435059, 10.047903060913086, 10.336194038391113, 10.62448501586914, 10.912775993347168]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 5.0, 5.0, 10.0, 10.0, 18.0, 9.0, 17.0, 13.0, 18.0, 21.0, 22.0, 20.0, 33.0, 22.0, 30.0, 42.0, 41.0, 33.0, 37.0, 58.0, 42.0, 48.0, 41.0, 42.0, 41.0, 33.0, 26.0, 30.0, 29.0, 29.0, 22.0, 26.0, 21.0, 16.0, 13.0, 17.0, 13.0, 9.0, 6.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.409263610839844, -9.083836555480957, -8.75840950012207, -8.432982444763184, -8.107555389404297, -7.78212833404541, -7.456701278686523, -7.131274223327637, -6.80584716796875, -6.480420112609863, -6.154993057250977, -5.82956600189209, -5.504138946533203, -5.178711891174316, -4.85328483581543, -4.527857780456543, -4.202430725097656, -3.8770036697387695, -3.551576614379883, -3.226149559020996, -2.9007225036621094, -2.5752954483032227, -2.249868392944336, -1.9244413375854492, -1.5990142822265625, -1.2735872268676758, -0.9481601715087891, -0.6227331161499023, -0.2973060607910156, 0.028120994567871094, 0.3535480499267578, 0.6789751052856445, 1.0044031143188477, 1.3298301696777344, 1.655257225036621, 1.9806842803955078, 2.3061113357543945, 2.6315383911132812, 2.956965446472168, 3.2823925018310547, 3.6078195571899414, 3.933246612548828, 4.258673667907715, 4.584100723266602, 4.909527778625488, 5.234954833984375, 5.560381889343262, 5.885808944702148, 6.211236000061035, 6.536663055419922, 6.862090110778809, 7.187517166137695, 7.512944221496582, 7.838371276855469, 8.163798332214355, 8.489225387573242, 8.814652442932129, 9.140079498291016, 9.465506553649902, 9.790933609008789, 10.116360664367676, 10.441787719726562, 10.76721477508545, 11.092641830444336, 11.418068885803223]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 13.0, 32.0, 42.0, 64.0, 101.0, 128.0, 233.0, 391.0, 614.0, 1040.0, 1813.0, 2900.0, 4788.0, 8110.0, 13350.0, 22250.0, 36693.0, 60382.0, 95602.0, 149521.0, 223152.0, 315193.0, 412555.0, 489583.0, 518600.0, 488628.0, 412711.0, 315347.0, 223338.0, 149432.0, 95987.0, 59321.0, 36428.0, 22048.0, 13292.0, 8165.0, 4874.0, 2781.0, 1727.0, 1175.0, 674.0, 457.0, 253.0, 187.0, 108.0, 74.0, 53.0, 21.0, 19.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-6.5625, -6.3541259765625, -6.145751953125, -5.9373779296875, -5.72900390625, -5.5206298828125, -5.312255859375, -5.1038818359375, -4.8955078125, -4.6871337890625, -4.478759765625, -4.2703857421875, -4.06201171875, -3.8536376953125, -3.645263671875, -3.4368896484375, -3.228515625, -3.0201416015625, -2.811767578125, -2.6033935546875, -2.39501953125, -2.1866455078125, -1.978271484375, -1.7698974609375, -1.5615234375, -1.3531494140625, -1.144775390625, -0.9364013671875, -0.72802734375, -0.5196533203125, -0.311279296875, -0.1029052734375, 0.10546875, 0.3138427734375, 0.522216796875, 0.7305908203125, 0.93896484375, 1.1473388671875, 1.355712890625, 1.5640869140625, 1.7724609375, 1.9808349609375, 2.189208984375, 2.3975830078125, 2.60595703125, 2.8143310546875, 3.022705078125, 3.2310791015625, 3.439453125, 3.6478271484375, 3.856201171875, 4.0645751953125, 4.27294921875, 4.4813232421875, 4.689697265625, 4.8980712890625, 5.1064453125, 5.3148193359375, 5.523193359375, 5.7315673828125, 5.93994140625, 6.1483154296875, 6.356689453125, 6.5650634765625, 6.7734375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 4.0, 13.0, 10.0, 8.0, 6.0, 14.0, 20.0, 19.0, 15.0, 17.0, 25.0, 19.0, 23.0, 19.0, 27.0, 36.0, 31.0, 45.0, 54.0, 43.0, 43.0, 43.0, 43.0, 40.0, 40.0, 40.0, 33.0, 40.0, 19.0, 23.0, 29.0, 18.0, 23.0, 19.0, 16.0, 15.0, 9.0, 11.0, 7.0, 6.0, 8.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.59375, -7.339599609375, -7.08544921875, -6.831298828125, -6.5771484375, -6.322998046875, -6.06884765625, -5.814697265625, -5.560546875, -5.306396484375, -5.05224609375, -4.798095703125, -4.5439453125, -4.289794921875, -4.03564453125, -3.781494140625, -3.52734375, -3.273193359375, -3.01904296875, -2.764892578125, -2.5107421875, -2.256591796875, -2.00244140625, -1.748291015625, -1.494140625, -1.239990234375, -0.98583984375, -0.731689453125, -0.4775390625, -0.223388671875, 0.03076171875, 0.284912109375, 0.5390625, 0.793212890625, 1.04736328125, 1.301513671875, 1.5556640625, 1.809814453125, 2.06396484375, 2.318115234375, 2.572265625, 2.826416015625, 3.08056640625, 3.334716796875, 3.5888671875, 3.843017578125, 4.09716796875, 4.351318359375, 4.60546875, 4.859619140625, 5.11376953125, 5.367919921875, 5.6220703125, 5.876220703125, 6.13037109375, 6.384521484375, 6.638671875, 6.892822265625, 7.14697265625, 7.401123046875, 7.6552734375, 7.909423828125, 8.16357421875, 8.417724609375, 8.671875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 12.0, 21.0, 31.0, 81.0, 124.0, 240.0, 353.0, 669.0, 1113.0, 1964.0, 3460.0, 6150.0, 10181.0, 17207.0, 28993.0, 47039.0, 75064.0, 114871.0, 169436.0, 238852.0, 314909.0, 387671.0, 442118.0, 461608.0, 443154.0, 390528.0, 315741.0, 240037.0, 170696.0, 116660.0, 75577.0, 47770.0, 29515.0, 17684.0, 10402.0, 5977.0, 3460.0, 2045.0, 1222.0, 682.0, 392.0, 214.0, 147.0, 85.0, 43.0, 37.0, 17.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.25, -6.045166015625, -5.84033203125, -5.635498046875, -5.4306640625, -5.225830078125, -5.02099609375, -4.816162109375, -4.611328125, -4.406494140625, -4.20166015625, -3.996826171875, -3.7919921875, -3.587158203125, -3.38232421875, -3.177490234375, -2.97265625, -2.767822265625, -2.56298828125, -2.358154296875, -2.1533203125, -1.948486328125, -1.74365234375, -1.538818359375, -1.333984375, -1.129150390625, -0.92431640625, -0.719482421875, -0.5146484375, -0.309814453125, -0.10498046875, 0.099853515625, 0.3046875, 0.509521484375, 0.71435546875, 0.919189453125, 1.1240234375, 1.328857421875, 1.53369140625, 1.738525390625, 1.943359375, 2.148193359375, 2.35302734375, 2.557861328125, 2.7626953125, 2.967529296875, 3.17236328125, 3.377197265625, 3.58203125, 3.786865234375, 3.99169921875, 4.196533203125, 4.4013671875, 4.606201171875, 4.81103515625, 5.015869140625, 5.220703125, 5.425537109375, 5.63037109375, 5.835205078125, 6.0400390625, 6.244873046875, 6.44970703125, 6.654541015625, 6.859375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 11.0, 14.0, 20.0, 20.0, 25.0, 44.0, 52.0, 46.0, 79.0, 79.0, 102.0, 125.0, 132.0, 152.0, 174.0, 173.0, 198.0, 211.0, 214.0, 216.0, 192.0, 179.0, 178.0, 173.0, 181.0, 158.0, 156.0, 124.0, 118.0, 81.0, 78.0, 58.0, 52.0, 56.0, 42.0, 32.0, 28.0, 22.0, 18.0, 15.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.288787841796875, -3.17327880859375, -3.057769775390625, -2.9422607421875, -2.826751708984375, -2.71124267578125, -2.595733642578125, -2.480224609375, -2.364715576171875, -2.24920654296875, -2.133697509765625, -2.0181884765625, -1.902679443359375, -1.78717041015625, -1.671661376953125, -1.55615234375, -1.440643310546875, -1.32513427734375, -1.209625244140625, -1.0941162109375, -0.978607177734375, -0.86309814453125, -0.747589111328125, -0.632080078125, -0.516571044921875, -0.40106201171875, -0.285552978515625, -0.1700439453125, -0.054534912109375, 0.06097412109375, 0.176483154296875, 0.2919921875, 0.407501220703125, 0.52301025390625, 0.638519287109375, 0.7540283203125, 0.869537353515625, 0.98504638671875, 1.100555419921875, 1.216064453125, 1.331573486328125, 1.44708251953125, 1.562591552734375, 1.6781005859375, 1.793609619140625, 1.90911865234375, 2.024627685546875, 2.14013671875, 2.255645751953125, 2.37115478515625, 2.486663818359375, 2.6021728515625, 2.717681884765625, 2.83319091796875, 2.948699951171875, 3.064208984375, 3.179718017578125, 3.29522705078125, 3.410736083984375, 3.5262451171875, 3.641754150390625, 3.75726318359375, 3.872772216796875, 3.98828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 5.0, 6.0, 15.0, 24.0, 23.0, 29.0, 31.0, 38.0, 43.0, 46.0, 36.0, 48.0, 36.0, 61.0, 61.0, 51.0, 58.0, 60.0, 34.0, 53.0, 45.0, 32.0, 26.0, 20.0, 22.0, 8.0, 13.0, 19.0, 11.0, 8.0, 8.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.647902488708496, -8.344167709350586, -8.040433883666992, -7.73669958114624, -7.432965278625488, -7.129230976104736, -6.825496673583984, -6.521762371063232, -6.2180280685424805, -5.9142937660217285, -5.610559463500977, -5.306825160980225, -5.003090858459473, -4.699356555938721, -4.395622253417969, -4.091887950897217, -3.788153648376465, -3.484419345855713, -3.180685043334961, -2.876950740814209, -2.573216438293457, -2.269482135772705, -1.9657478332519531, -1.6620135307312012, -1.3582792282104492, -1.0545449256896973, -0.7508106231689453, -0.44707632064819336, -0.1433420181274414, 0.16039228439331055, 0.4641265869140625, 0.7678608894348145, 1.07159423828125, 1.375328540802002, 1.679062843322754, 1.9827971458435059, 2.286531448364258, 2.5902657508850098, 2.8940000534057617, 3.1977343559265137, 3.5014686584472656, 3.8052029609680176, 4.1089372634887695, 4.4126715660095215, 4.716405868530273, 5.020140171051025, 5.323874473571777, 5.627608776092529, 5.931343078613281, 6.235077381134033, 6.538811683654785, 6.842545986175537, 7.146280288696289, 7.450014591217041, 7.753748893737793, 8.057483673095703, 8.361217498779297, 8.66495132446289, 8.9686861038208, 9.272420883178711, 9.576154708862305, 9.879888534545898, 10.183623313903809, 10.487358093261719, 10.791091918945312]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 10.0, 8.0, 14.0, 13.0, 15.0, 23.0, 11.0, 21.0, 21.0, 18.0, 32.0, 26.0, 45.0, 27.0, 47.0, 42.0, 41.0, 36.0, 37.0, 44.0, 33.0, 46.0, 34.0, 42.0, 27.0, 30.0, 39.0, 23.0, 22.0, 30.0, 26.0, 19.0, 11.0, 16.0, 10.0, 17.0, 6.0, 6.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.788745880126953, -9.474998474121094, -9.16125202178955, -8.847504615783691, -8.533757209777832, -8.220010757446289, -7.90626335144043, -7.5925164222717285, -7.278769493103027, -6.965022563934326, -6.651275157928467, -6.337528228759766, -6.0237812995910645, -5.710034370422363, -5.396286964416504, -5.082540035247803, -4.768792629241943, -4.455045700073242, -4.141298294067383, -3.8275513648986816, -3.5138044357299805, -3.2000572681427, -2.88631010055542, -2.5725631713867188, -2.2588160037994385, -1.9450689554214478, -1.631321907043457, -1.3175747394561768, -1.003827691078186, -0.6900806427001953, -0.37633347511291504, -0.06258654594421387, 0.2511606216430664, 0.5649076700210571, 0.8786547780036926, 1.1924018859863281, 1.5061489343643188, 1.8198959827423096, 2.13364315032959, 2.447390079498291, 2.7611372470855713, 3.0748844146728516, 3.3886313438415527, 3.702378511428833, 4.016125679016113, 4.3298726081848145, 4.643619537353516, 4.957366943359375, 5.271113872528076, 5.584860801696777, 5.898608207702637, 6.212355136871338, 6.526102066040039, 6.839849472045898, 7.1535964012146, 7.467343330383301, 7.78109073638916, 8.09483814239502, 8.408584594726562, 8.722332000732422, 9.036079406738281, 9.349825859069824, 9.663573265075684, 9.977319717407227, 10.291067123413086]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 15.0, 13.0, 31.0, 58.0, 49.0, 95.0, 141.0, 251.0, 390.0, 626.0, 1193.0, 2145.0, 3789.0, 7014.0, 13742.0, 26449.0, 49966.0, 89756.0, 143126.0, 186615.0, 185772.0, 141499.0, 89736.0, 50146.0, 26577.0, 13748.0, 6987.0, 3782.0, 2031.0, 1090.0, 666.0, 387.0, 221.0, 157.0, 74.0, 56.0, 53.0, 19.0, 23.0, 19.0, 6.0, 12.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.009765625, -2.921234130859375, -2.83270263671875, -2.744171142578125, -2.6556396484375, -2.567108154296875, -2.47857666015625, -2.390045166015625, -2.301513671875, -2.212982177734375, -2.12445068359375, -2.035919189453125, -1.9473876953125, -1.858856201171875, -1.77032470703125, -1.681793212890625, -1.59326171875, -1.504730224609375, -1.41619873046875, -1.327667236328125, -1.2391357421875, -1.150604248046875, -1.06207275390625, -0.973541259765625, -0.885009765625, -0.796478271484375, -0.70794677734375, -0.619415283203125, -0.5308837890625, -0.442352294921875, -0.35382080078125, -0.265289306640625, -0.1767578125, -0.088226318359375, 0.00030517578125, 0.088836669921875, 0.1773681640625, 0.265899658203125, 0.35443115234375, 0.442962646484375, 0.531494140625, 0.620025634765625, 0.70855712890625, 0.797088623046875, 0.8856201171875, 0.974151611328125, 1.06268310546875, 1.151214599609375, 1.23974609375, 1.328277587890625, 1.41680908203125, 1.505340576171875, 1.5938720703125, 1.682403564453125, 1.77093505859375, 1.859466552734375, 1.947998046875, 2.036529541015625, 2.12506103515625, 2.213592529296875, 2.3021240234375, 2.390655517578125, 2.47918701171875, 2.567718505859375, 2.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 11.0, 7.0, 11.0, 8.0, 19.0, 16.0, 18.0, 22.0, 14.0, 25.0, 32.0, 37.0, 43.0, 42.0, 37.0, 40.0, 38.0, 42.0, 41.0, 59.0, 47.0, 36.0, 29.0, 38.0, 28.0, 29.0, 35.0, 41.0, 21.0, 17.0, 27.0, 14.0, 10.0, 15.0, 8.0, 11.0, 8.0, 6.0, 7.0, 2.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.4765625, -10.135009765625, -9.79345703125, -9.451904296875, -9.1103515625, -8.768798828125, -8.42724609375, -8.085693359375, -7.744140625, -7.402587890625, -7.06103515625, -6.719482421875, -6.3779296875, -6.036376953125, -5.69482421875, -5.353271484375, -5.01171875, -4.670166015625, -4.32861328125, -3.987060546875, -3.6455078125, -3.303955078125, -2.96240234375, -2.620849609375, -2.279296875, -1.937744140625, -1.59619140625, -1.254638671875, -0.9130859375, -0.571533203125, -0.22998046875, 0.111572265625, 0.453125, 0.794677734375, 1.13623046875, 1.477783203125, 1.8193359375, 2.160888671875, 2.50244140625, 2.843994140625, 3.185546875, 3.527099609375, 3.86865234375, 4.210205078125, 4.5517578125, 4.893310546875, 5.23486328125, 5.576416015625, 5.91796875, 6.259521484375, 6.60107421875, 6.942626953125, 7.2841796875, 7.625732421875, 7.96728515625, 8.308837890625, 8.650390625, 8.991943359375, 9.33349609375, 9.675048828125, 10.0166015625, 10.358154296875, 10.69970703125, 11.041259765625, 11.3828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 5.0, 10.0, 9.0, 26.0, 37.0, 30.0, 43.0, 63.0, 109.0, 140.0, 221.0, 374.0, 665.0, 1058.0, 1912.0, 3541.0, 7007.0, 13698.0, 29104.0, 61752.0, 122791.0, 202701.0, 234135.0, 176051.0, 99174.0, 48258.0, 22643.0, 10810.0, 5440.0, 2747.0, 1538.0, 950.0, 552.0, 341.0, 178.0, 137.0, 77.0, 52.0, 55.0, 31.0, 28.0, 11.0, 7.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0], "bins": [-3.44140625, -3.338165283203125, -3.23492431640625, -3.131683349609375, -3.0284423828125, -2.925201416015625, -2.82196044921875, -2.718719482421875, -2.615478515625, -2.512237548828125, -2.40899658203125, -2.305755615234375, -2.2025146484375, -2.099273681640625, -1.99603271484375, -1.892791748046875, -1.78955078125, -1.686309814453125, -1.58306884765625, -1.479827880859375, -1.3765869140625, -1.273345947265625, -1.17010498046875, -1.066864013671875, -0.963623046875, -0.860382080078125, -0.75714111328125, -0.653900146484375, -0.5506591796875, -0.447418212890625, -0.34417724609375, -0.240936279296875, -0.1376953125, -0.034454345703125, 0.06878662109375, 0.172027587890625, 0.2752685546875, 0.378509521484375, 0.48175048828125, 0.584991455078125, 0.688232421875, 0.791473388671875, 0.89471435546875, 0.997955322265625, 1.1011962890625, 1.204437255859375, 1.30767822265625, 1.410919189453125, 1.51416015625, 1.617401123046875, 1.72064208984375, 1.823883056640625, 1.9271240234375, 2.030364990234375, 2.13360595703125, 2.236846923828125, 2.340087890625, 2.443328857421875, 2.54656982421875, 2.649810791015625, 2.7530517578125, 2.856292724609375, 2.95953369140625, 3.062774658203125, 3.166015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 5.0, 15.0, 16.0, 7.0, 15.0, 23.0, 20.0, 24.0, 36.0, 32.0, 30.0, 35.0, 41.0, 35.0, 45.0, 41.0, 42.0, 42.0, 40.0, 34.0, 32.0, 46.0, 45.0, 21.0, 34.0, 32.0, 24.0, 23.0, 26.0, 25.0, 24.0, 16.0, 11.0, 12.0, 9.0, 5.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.23907470703125, -6.0172119140625, -5.79534912109375, -5.573486328125, -5.35162353515625, -5.1297607421875, -4.90789794921875, -4.68603515625, -4.46417236328125, -4.2423095703125, -4.02044677734375, -3.798583984375, -3.57672119140625, -3.3548583984375, -3.13299560546875, -2.9111328125, -2.68927001953125, -2.4674072265625, -2.24554443359375, -2.023681640625, -1.80181884765625, -1.5799560546875, -1.35809326171875, -1.13623046875, -0.91436767578125, -0.6925048828125, -0.47064208984375, -0.248779296875, -0.02691650390625, 0.1949462890625, 0.41680908203125, 0.638671875, 0.86053466796875, 1.0823974609375, 1.30426025390625, 1.526123046875, 1.74798583984375, 1.9698486328125, 2.19171142578125, 2.41357421875, 2.63543701171875, 2.8572998046875, 3.07916259765625, 3.301025390625, 3.52288818359375, 3.7447509765625, 3.96661376953125, 4.1884765625, 4.41033935546875, 4.6322021484375, 4.85406494140625, 5.075927734375, 5.29779052734375, 5.5196533203125, 5.74151611328125, 5.96337890625, 6.18524169921875, 6.4071044921875, 6.62896728515625, 6.850830078125, 7.07269287109375, 7.2945556640625, 7.51641845703125, 7.73828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 11.0, 15.0, 15.0, 17.0, 29.0, 24.0, 52.0, 61.0, 72.0, 95.0, 123.0, 179.0, 213.0, 302.0, 474.0, 637.0, 998.0, 1590.0, 2787.0, 5366.0, 13709.0, 50453.0, 282161.0, 522074.0, 122570.0, 25602.0, 8492.0, 3970.0, 2252.0, 1298.0, 767.0, 611.0, 387.0, 275.0, 220.0, 134.0, 133.0, 92.0, 63.0, 55.0, 27.0, 41.0, 20.0, 23.0, 18.0, 14.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0], "bins": [-2.1953125, -2.125091552734375, -2.05487060546875, -1.984649658203125, -1.9144287109375, -1.844207763671875, -1.77398681640625, -1.703765869140625, -1.633544921875, -1.563323974609375, -1.49310302734375, -1.422882080078125, -1.3526611328125, -1.282440185546875, -1.21221923828125, -1.141998291015625, -1.07177734375, -1.001556396484375, -0.93133544921875, -0.861114501953125, -0.7908935546875, -0.720672607421875, -0.65045166015625, -0.580230712890625, -0.510009765625, -0.439788818359375, -0.36956787109375, -0.299346923828125, -0.2291259765625, -0.158905029296875, -0.08868408203125, -0.018463134765625, 0.0517578125, 0.121978759765625, 0.19219970703125, 0.262420654296875, 0.3326416015625, 0.402862548828125, 0.47308349609375, 0.543304443359375, 0.613525390625, 0.683746337890625, 0.75396728515625, 0.824188232421875, 0.8944091796875, 0.964630126953125, 1.03485107421875, 1.105072021484375, 1.17529296875, 1.245513916015625, 1.31573486328125, 1.385955810546875, 1.4561767578125, 1.526397705078125, 1.59661865234375, 1.666839599609375, 1.737060546875, 1.807281494140625, 1.87750244140625, 1.947723388671875, 2.0179443359375, 2.088165283203125, 2.15838623046875, 2.228607177734375, 2.298828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 7.0, 5.0, 8.0, 8.0, 23.0, 27.0, 44.0, 63.0, 81.0, 97.0, 116.0, 92.0, 107.0, 100.0, 71.0, 52.0, 35.0, 23.0, 26.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011605024337768555, -0.00011232215911149979, -0.00010859407484531403, -0.00010486599057912827, -0.0001011379063129425, -9.740982204675674e-05, -9.368173778057098e-05, -8.995365351438522e-05, -8.622556924819946e-05, -8.24974849820137e-05, -7.876940071582794e-05, -7.504131644964218e-05, -7.131323218345642e-05, -6.758514791727066e-05, -6.38570636510849e-05, -6.012897938489914e-05, -5.640089511871338e-05, -5.267281085252762e-05, -4.894472658634186e-05, -4.52166423201561e-05, -4.148855805397034e-05, -3.7760473787784576e-05, -3.4032389521598816e-05, -3.0304305255413055e-05, -2.6576220989227295e-05, -2.2848136723041534e-05, -1.9120052456855774e-05, -1.5391968190670013e-05, -1.1663883924484253e-05, -7.935799658298492e-06, -4.207715392112732e-06, -4.796311259269714e-07, 3.248453140258789e-06, 6.9765374064445496e-06, 1.070462167263031e-05, 1.443270593881607e-05, 1.816079020500183e-05, 2.188887447118759e-05, 2.5616958737373352e-05, 2.9345043003559113e-05, 3.307312726974487e-05, 3.6801211535930634e-05, 4.0529295802116394e-05, 4.4257380068302155e-05, 4.7985464334487915e-05, 5.1713548600673676e-05, 5.5441632866859436e-05, 5.9169717133045197e-05, 6.289780139923096e-05, 6.662588566541672e-05, 7.035396993160248e-05, 7.408205419778824e-05, 7.7810138463974e-05, 8.153822273015976e-05, 8.526630699634552e-05, 8.899439126253128e-05, 9.272247552871704e-05, 9.64505597949028e-05, 0.00010017864406108856, 0.00010390672832727432, 0.00010763481259346008, 0.00011136289685964584, 0.0001150909811258316, 0.00011881906539201736, 0.00012254714965820312]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 8.0, 17.0, 12.0, 30.0, 58.0, 82.0, 113.0, 173.0, 263.0, 442.0, 676.0, 1116.0, 1965.0, 3617.0, 7638.0, 18702.0, 56913.0, 187302.0, 385359.0, 255618.0, 82383.0, 26036.0, 9647.0, 4575.0, 2373.0, 1355.0, 810.0, 452.0, 287.0, 193.0, 119.0, 67.0, 49.0, 31.0, 18.0, 22.0, 9.0, 7.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.822265625, -1.7586669921875, -1.695068359375, -1.6314697265625, -1.56787109375, -1.5042724609375, -1.440673828125, -1.3770751953125, -1.3134765625, -1.2498779296875, -1.186279296875, -1.1226806640625, -1.05908203125, -0.9954833984375, -0.931884765625, -0.8682861328125, -0.8046875, -0.7410888671875, -0.677490234375, -0.6138916015625, -0.55029296875, -0.4866943359375, -0.423095703125, -0.3594970703125, -0.2958984375, -0.2322998046875, -0.168701171875, -0.1051025390625, -0.04150390625, 0.0220947265625, 0.085693359375, 0.1492919921875, 0.212890625, 0.2764892578125, 0.340087890625, 0.4036865234375, 0.46728515625, 0.5308837890625, 0.594482421875, 0.6580810546875, 0.7216796875, 0.7852783203125, 0.848876953125, 0.9124755859375, 0.97607421875, 1.0396728515625, 1.103271484375, 1.1668701171875, 1.23046875, 1.2940673828125, 1.357666015625, 1.4212646484375, 1.48486328125, 1.5484619140625, 1.612060546875, 1.6756591796875, 1.7392578125, 1.8028564453125, 1.866455078125, 1.9300537109375, 1.99365234375, 2.0572509765625, 2.120849609375, 2.1844482421875, 2.248046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 8.0, 9.0, 17.0, 9.0, 22.0, 24.0, 38.0, 45.0, 64.0, 77.0, 98.0, 104.0, 89.0, 88.0, 63.0, 45.0, 47.0, 38.0, 24.0, 15.0, 9.0, 10.0, 5.0, 4.0, 8.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6284713745117188, -0.6055755615234375, -0.5826797485351562, -0.559783935546875, -0.5368881225585938, -0.5139923095703125, -0.49109649658203125, -0.46820068359375, -0.44530487060546875, -0.4224090576171875, -0.39951324462890625, -0.376617431640625, -0.35372161865234375, -0.3308258056640625, -0.30792999267578125, -0.2850341796875, -0.26213836669921875, -0.2392425537109375, -0.21634674072265625, -0.193450927734375, -0.17055511474609375, -0.1476593017578125, -0.12476348876953125, -0.10186767578125, -0.07897186279296875, -0.0560760498046875, -0.03318023681640625, -0.010284423828125, 0.01261138916015625, 0.0355072021484375, 0.05840301513671875, 0.081298828125, 0.10419464111328125, 0.1270904541015625, 0.14998626708984375, 0.172882080078125, 0.19577789306640625, 0.2186737060546875, 0.24156951904296875, 0.26446533203125, 0.28736114501953125, 0.3102569580078125, 0.33315277099609375, 0.356048583984375, 0.37894439697265625, 0.4018402099609375, 0.42473602294921875, 0.4476318359375, 0.47052764892578125, 0.4934234619140625, 0.5163192749023438, 0.539215087890625, 0.5621109008789062, 0.5850067138671875, 0.6079025268554688, 0.63079833984375, 0.6536941528320312, 0.6765899658203125, 0.6994857788085938, 0.722381591796875, 0.7452774047851562, 0.7681732177734375, 0.7910690307617188, 0.81396484375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 13.0, 23.0, 26.0, 26.0, 36.0, 39.0, 41.0, 46.0, 35.0, 41.0, 52.0, 49.0, 55.0, 55.0, 55.0, 58.0, 52.0, 37.0, 38.0, 33.0, 36.0, 19.0, 14.0, 17.0, 15.0, 11.0, 15.0, 11.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.820603370666504, -8.522157669067383, -8.223711967468262, -7.925266265869141, -7.6268205642700195, -7.328374862670898, -7.029928684234619, -6.731482982635498, -6.433037281036377, -6.134591579437256, -5.836145877838135, -5.537700176239014, -5.239253997802734, -4.940808296203613, -4.642362594604492, -4.343916893005371, -4.04547119140625, -3.747025489807129, -3.448579788208008, -3.1501338481903076, -2.8516881465911865, -2.5532424449920654, -2.2547965049743652, -1.9563508033752441, -1.657905101776123, -1.359459400177002, -1.0610135793685913, -0.7625678181648254, -0.46412205696105957, -0.16567635536193848, 0.13276946544647217, 0.4312152862548828, 0.7296619415283203, 1.0281076431274414, 1.326553463935852, 1.6249992847442627, 1.9234449863433838, 2.221890687942505, 2.520336627960205, 2.818782329559326, 3.1172280311584473, 3.4156737327575684, 3.7141194343566895, 4.0125651359558105, 4.31101131439209, 4.609457015991211, 4.907902717590332, 5.206348419189453, 5.504794120788574, 5.803239822387695, 6.101685523986816, 6.4001312255859375, 6.698576927185059, 6.99702262878418, 7.295468807220459, 7.59391450881958, 7.892360210418701, 8.19080638885498, 8.489252090454102, 8.787697792053223, 9.086143493652344, 9.384589195251465, 9.683034896850586, 9.981480598449707, 10.279926300048828]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 6.0, 8.0, 18.0, 14.0, 14.0, 21.0, 17.0, 21.0, 18.0, 25.0, 29.0, 28.0, 44.0, 40.0, 41.0, 33.0, 45.0, 34.0, 42.0, 41.0, 34.0, 46.0, 32.0, 35.0, 33.0, 36.0, 29.0, 26.0, 27.0, 26.0, 23.0, 12.0, 18.0, 13.0, 7.0, 14.0, 6.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.933987617492676, -9.621888160705566, -9.30978775024414, -8.997688293457031, -8.685588836669922, -8.373489379882812, -8.061388969421387, -7.749289512634277, -7.43718957901001, -7.125089645385742, -6.812990188598633, -6.500890254974365, -6.188790321350098, -5.876690864562988, -5.564590930938721, -5.252490997314453, -4.940391540527344, -4.628291606903076, -4.316192150115967, -4.004092216491699, -3.6919925212860107, -3.3798928260803223, -3.0677928924560547, -2.755693197250366, -2.4435935020446777, -2.1314938068389893, -1.8193939924240112, -1.5072941780090332, -1.1951944828033447, -0.8830947875976562, -0.5709949731826782, -0.2588951587677002, 0.05320453643798828, 0.36530429124832153, 0.6774040460586548, 0.989503800868988, 1.3016035556793213, 1.6137032508850098, 1.9258030652999878, 2.237902879714966, 2.5500025749206543, 2.8621022701263428, 3.1742019653320312, 3.486301898956299, 3.7984015941619873, 4.110501289367676, 4.422601222991943, 4.734701156616211, 5.04680061340332, 5.358900547027588, 5.671000003814697, 5.983099937438965, 6.295199394226074, 6.607299327850342, 6.919399261474609, 7.231498718261719, 7.543598651885986, 7.855698585510254, 8.167798042297363, 8.479897499084473, 8.791997909545898, 9.104097366333008, 9.416196823120117, 9.728297233581543, 10.040396690368652]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 13.0, 25.0, 39.0, 40.0, 51.0, 117.0, 163.0, 247.0, 403.0, 628.0, 891.0, 1420.0, 2253.0, 3377.0, 5218.0, 7514.0, 11417.0, 16708.0, 23581.0, 33346.0, 44648.0, 58229.0, 71745.0, 83886.0, 93430.0, 97412.0, 95609.0, 87645.0, 76068.0, 62729.0, 49007.0, 36824.0, 26734.0, 18739.0, 12747.0, 8833.0, 5671.0, 3875.0, 2545.0, 1651.0, 1050.0, 710.0, 442.0, 328.0, 191.0, 135.0, 69.0, 51.0, 38.0, 22.0, 15.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.9921875, -4.83453369140625, -4.6768798828125, -4.51922607421875, -4.361572265625, -4.20391845703125, -4.0462646484375, -3.88861083984375, -3.73095703125, -3.57330322265625, -3.4156494140625, -3.25799560546875, -3.100341796875, -2.94268798828125, -2.7850341796875, -2.62738037109375, -2.4697265625, -2.31207275390625, -2.1544189453125, -1.99676513671875, -1.839111328125, -1.68145751953125, -1.5238037109375, -1.36614990234375, -1.20849609375, -1.05084228515625, -0.8931884765625, -0.73553466796875, -0.577880859375, -0.42022705078125, -0.2625732421875, -0.10491943359375, 0.052734375, 0.21038818359375, 0.3680419921875, 0.52569580078125, 0.683349609375, 0.84100341796875, 0.9986572265625, 1.15631103515625, 1.31396484375, 1.47161865234375, 1.6292724609375, 1.78692626953125, 1.944580078125, 2.10223388671875, 2.2598876953125, 2.41754150390625, 2.5751953125, 2.73284912109375, 2.8905029296875, 3.04815673828125, 3.205810546875, 3.36346435546875, 3.5211181640625, 3.67877197265625, 3.83642578125, 3.99407958984375, 4.1517333984375, 4.30938720703125, 4.467041015625, 4.62469482421875, 4.7823486328125, 4.94000244140625, 5.09765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 5.0, 12.0, 16.0, 14.0, 18.0, 14.0, 17.0, 16.0, 24.0, 28.0, 30.0, 35.0, 42.0, 39.0, 34.0, 40.0, 34.0, 30.0, 41.0, 38.0, 30.0, 30.0, 42.0, 32.0, 42.0, 38.0, 29.0, 28.0, 17.0, 27.0, 21.0, 15.0, 14.0, 15.0, 17.0, 16.0, 7.0, 5.0, 6.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.5234375, -8.226318359375, -7.92919921875, -7.632080078125, -7.3349609375, -7.037841796875, -6.74072265625, -6.443603515625, -6.146484375, -5.849365234375, -5.55224609375, -5.255126953125, -4.9580078125, -4.660888671875, -4.36376953125, -4.066650390625, -3.76953125, -3.472412109375, -3.17529296875, -2.878173828125, -2.5810546875, -2.283935546875, -1.98681640625, -1.689697265625, -1.392578125, -1.095458984375, -0.79833984375, -0.501220703125, -0.2041015625, 0.093017578125, 0.39013671875, 0.687255859375, 0.984375, 1.281494140625, 1.57861328125, 1.875732421875, 2.1728515625, 2.469970703125, 2.76708984375, 3.064208984375, 3.361328125, 3.658447265625, 3.95556640625, 4.252685546875, 4.5498046875, 4.846923828125, 5.14404296875, 5.441162109375, 5.73828125, 6.035400390625, 6.33251953125, 6.629638671875, 6.9267578125, 7.223876953125, 7.52099609375, 7.818115234375, 8.115234375, 8.412353515625, 8.70947265625, 9.006591796875, 9.3037109375, 9.600830078125, 9.89794921875, 10.195068359375, 10.4921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 23.0, 15.0, 28.0, 55.0, 55.0, 85.0, 152.0, 224.0, 312.0, 504.0, 758.0, 1126.0, 1687.0, 2639.0, 4084.0, 5923.0, 9116.0, 13429.0, 19764.0, 27888.0, 38762.0, 51732.0, 66129.0, 80016.0, 91609.0, 98645.0, 99042.0, 93129.0, 83129.0, 68652.0, 54455.0, 40917.0, 29885.0, 20967.0, 14526.0, 9779.0, 6548.0, 4265.0, 3014.0, 1830.0, 1261.0, 851.0, 565.0, 362.0, 202.0, 159.0, 88.0, 48.0, 41.0, 23.0, 28.0, 9.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.28125, -5.11669921875, -4.9521484375, -4.78759765625, -4.623046875, -4.45849609375, -4.2939453125, -4.12939453125, -3.96484375, -3.80029296875, -3.6357421875, -3.47119140625, -3.306640625, -3.14208984375, -2.9775390625, -2.81298828125, -2.6484375, -2.48388671875, -2.3193359375, -2.15478515625, -1.990234375, -1.82568359375, -1.6611328125, -1.49658203125, -1.33203125, -1.16748046875, -1.0029296875, -0.83837890625, -0.673828125, -0.50927734375, -0.3447265625, -0.18017578125, -0.015625, 0.14892578125, 0.3134765625, 0.47802734375, 0.642578125, 0.80712890625, 0.9716796875, 1.13623046875, 1.30078125, 1.46533203125, 1.6298828125, 1.79443359375, 1.958984375, 2.12353515625, 2.2880859375, 2.45263671875, 2.6171875, 2.78173828125, 2.9462890625, 3.11083984375, 3.275390625, 3.43994140625, 3.6044921875, 3.76904296875, 3.93359375, 4.09814453125, 4.2626953125, 4.42724609375, 4.591796875, 4.75634765625, 4.9208984375, 5.08544921875, 5.25]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 10.0, 15.0, 7.0, 15.0, 22.0, 10.0, 18.0, 28.0, 25.0, 22.0, 30.0, 38.0, 20.0, 39.0, 39.0, 28.0, 28.0, 49.0, 37.0, 37.0, 53.0, 36.0, 34.0, 34.0, 31.0, 41.0, 25.0, 19.0, 37.0, 21.0, 26.0, 24.0, 12.0, 11.0, 10.0, 10.0, 7.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.83624267578125, -5.6451416015625, -5.45404052734375, -5.262939453125, -5.07183837890625, -4.8807373046875, -4.68963623046875, -4.49853515625, -4.30743408203125, -4.1163330078125, -3.92523193359375, -3.734130859375, -3.54302978515625, -3.3519287109375, -3.16082763671875, -2.9697265625, -2.77862548828125, -2.5875244140625, -2.39642333984375, -2.205322265625, -2.01422119140625, -1.8231201171875, -1.63201904296875, -1.44091796875, -1.24981689453125, -1.0587158203125, -0.86761474609375, -0.676513671875, -0.48541259765625, -0.2943115234375, -0.10321044921875, 0.087890625, 0.27899169921875, 0.4700927734375, 0.66119384765625, 0.852294921875, 1.04339599609375, 1.2344970703125, 1.42559814453125, 1.61669921875, 1.80780029296875, 1.9989013671875, 2.19000244140625, 2.381103515625, 2.57220458984375, 2.7633056640625, 2.95440673828125, 3.1455078125, 3.33660888671875, 3.5277099609375, 3.71881103515625, 3.909912109375, 4.10101318359375, 4.2921142578125, 4.48321533203125, 4.67431640625, 4.86541748046875, 5.0565185546875, 5.24761962890625, 5.438720703125, 5.62982177734375, 5.8209228515625, 6.01202392578125, 6.203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 11.0, 15.0, 23.0, 33.0, 45.0, 75.0, 94.0, 129.0, 209.0, 345.0, 537.0, 892.0, 1568.0, 2818.0, 5354.0, 10747.0, 22444.0, 45260.0, 87500.0, 145148.0, 193538.0, 195023.0, 148997.0, 91528.0, 48146.0, 23820.0, 11450.0, 5634.0, 2991.0, 1648.0, 927.0, 551.0, 325.0, 234.0, 169.0, 95.0, 72.0, 44.0, 34.0, 18.0, 13.0, 16.0, 7.0, 7.0, 6.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.666015625, -3.543975830078125, -3.42193603515625, -3.299896240234375, -3.1778564453125, -3.055816650390625, -2.93377685546875, -2.811737060546875, -2.689697265625, -2.567657470703125, -2.44561767578125, -2.323577880859375, -2.2015380859375, -2.079498291015625, -1.95745849609375, -1.835418701171875, -1.71337890625, -1.591339111328125, -1.46929931640625, -1.347259521484375, -1.2252197265625, -1.103179931640625, -0.98114013671875, -0.859100341796875, -0.737060546875, -0.615020751953125, -0.49298095703125, -0.370941162109375, -0.2489013671875, -0.126861572265625, -0.00482177734375, 0.117218017578125, 0.2392578125, 0.361297607421875, 0.48333740234375, 0.605377197265625, 0.7274169921875, 0.849456787109375, 0.97149658203125, 1.093536376953125, 1.215576171875, 1.337615966796875, 1.45965576171875, 1.581695556640625, 1.7037353515625, 1.825775146484375, 1.94781494140625, 2.069854736328125, 2.19189453125, 2.313934326171875, 2.43597412109375, 2.558013916015625, 2.6800537109375, 2.802093505859375, 2.92413330078125, 3.046173095703125, 3.168212890625, 3.290252685546875, 3.41229248046875, 3.534332275390625, 3.6563720703125, 3.778411865234375, 3.90045166015625, 4.022491455078125, 4.14453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 1.0, 6.0, 3.0, 4.0, 11.0, 18.0, 18.0, 19.0, 15.0, 15.0, 18.0, 33.0, 35.0, 36.0, 41.0, 41.0, 45.0, 47.0, 45.0, 50.0, 44.0, 41.0, 46.0, 40.0, 36.0, 52.0, 44.0, 29.0, 20.0, 28.0, 22.0, 17.0, 13.0, 8.0, 13.0, 14.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00028514862060546875, -0.00027682632207870483, -0.0002685040235519409, -0.000260181725025177, -0.0002518594264984131, -0.00024353712797164917, -0.00023521482944488525, -0.00022689253091812134, -0.00021857023239135742, -0.0002102479338645935, -0.0002019256353378296, -0.00019360333681106567, -0.00018528103828430176, -0.00017695873975753784, -0.00016863644123077393, -0.00016031414270401, -0.0001519918441772461, -0.00014366954565048218, -0.00013534724712371826, -0.00012702494859695435, -0.00011870265007019043, -0.00011038035154342651, -0.0001020580530166626, -9.373575448989868e-05, -8.541345596313477e-05, -7.709115743637085e-05, -6.876885890960693e-05, -6.044656038284302e-05, -5.21242618560791e-05, -4.3801963329315186e-05, -3.547966480255127e-05, -2.7157366275787354e-05, -1.8835067749023438e-05, -1.0512769222259521e-05, -2.1904706954956055e-06, 6.1318278312683105e-06, 1.4454126358032227e-05, 2.2776424884796143e-05, 3.109872341156006e-05, 3.9421021938323975e-05, 4.774332046508789e-05, 5.606561899185181e-05, 6.438791751861572e-05, 7.271021604537964e-05, 8.103251457214355e-05, 8.935481309890747e-05, 9.767711162567139e-05, 0.0001059994101524353, 0.00011432170867919922, 0.00012264400720596313, 0.00013096630573272705, 0.00013928860425949097, 0.00014761090278625488, 0.0001559332013130188, 0.00016425549983978271, 0.00017257779836654663, 0.00018090009689331055, 0.00018922239542007446, 0.00019754469394683838, 0.0002058669924736023, 0.0002141892910003662, 0.00022251158952713013, 0.00023083388805389404, 0.00023915618658065796, 0.0002474784851074219]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 12.0, 28.0, 33.0, 41.0, 65.0, 97.0, 123.0, 192.0, 328.0, 472.0, 812.0, 1372.0, 2344.0, 4496.0, 9239.0, 20183.0, 45803.0, 95761.0, 170972.0, 224397.0, 205772.0, 135631.0, 69822.0, 31825.0, 14068.0, 6642.0, 3350.0, 1759.0, 1034.0, 649.0, 434.0, 259.0, 173.0, 125.0, 80.0, 48.0, 42.0, 19.0, 16.0, 13.0, 8.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.23828125, -5.09185791015625, -4.9454345703125, -4.79901123046875, -4.652587890625, -4.50616455078125, -4.3597412109375, -4.21331787109375, -4.06689453125, -3.92047119140625, -3.7740478515625, -3.62762451171875, -3.481201171875, -3.33477783203125, -3.1883544921875, -3.04193115234375, -2.8955078125, -2.74908447265625, -2.6026611328125, -2.45623779296875, -2.309814453125, -2.16339111328125, -2.0169677734375, -1.87054443359375, -1.72412109375, -1.57769775390625, -1.4312744140625, -1.28485107421875, -1.138427734375, -0.99200439453125, -0.8455810546875, -0.69915771484375, -0.552734375, -0.40631103515625, -0.2598876953125, -0.11346435546875, 0.032958984375, 0.17938232421875, 0.3258056640625, 0.47222900390625, 0.61865234375, 0.76507568359375, 0.9114990234375, 1.05792236328125, 1.204345703125, 1.35076904296875, 1.4971923828125, 1.64361572265625, 1.7900390625, 1.93646240234375, 2.0828857421875, 2.22930908203125, 2.375732421875, 2.52215576171875, 2.6685791015625, 2.81500244140625, 2.96142578125, 3.10784912109375, 3.2542724609375, 3.40069580078125, 3.547119140625, 3.69354248046875, 3.8399658203125, 3.98638916015625, 4.1328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 7.0, 8.0, 9.0, 12.0, 25.0, 20.0, 22.0, 33.0, 41.0, 57.0, 74.0, 66.0, 58.0, 54.0, 69.0, 71.0, 59.0, 41.0, 40.0, 30.0, 29.0, 28.0, 30.0, 22.0, 13.0, 10.0, 8.0, 6.0, 6.0, 7.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6806640625, -1.623626708984375, -1.56658935546875, -1.509552001953125, -1.4525146484375, -1.395477294921875, -1.33843994140625, -1.281402587890625, -1.224365234375, -1.167327880859375, -1.11029052734375, -1.053253173828125, -0.9962158203125, -0.939178466796875, -0.88214111328125, -0.825103759765625, -0.76806640625, -0.711029052734375, -0.65399169921875, -0.596954345703125, -0.5399169921875, -0.482879638671875, -0.42584228515625, -0.368804931640625, -0.311767578125, -0.254730224609375, -0.19769287109375, -0.140655517578125, -0.0836181640625, -0.026580810546875, 0.03045654296875, 0.087493896484375, 0.14453125, 0.201568603515625, 0.25860595703125, 0.315643310546875, 0.3726806640625, 0.429718017578125, 0.48675537109375, 0.543792724609375, 0.600830078125, 0.657867431640625, 0.71490478515625, 0.771942138671875, 0.8289794921875, 0.886016845703125, 0.94305419921875, 1.000091552734375, 1.05712890625, 1.114166259765625, 1.17120361328125, 1.228240966796875, 1.2852783203125, 1.342315673828125, 1.39935302734375, 1.456390380859375, 1.513427734375, 1.570465087890625, 1.62750244140625, 1.684539794921875, 1.7415771484375, 1.798614501953125, 1.85565185546875, 1.912689208984375, 1.9697265625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 2.0, 11.0, 7.0, 11.0, 14.0, 14.0, 23.0, 29.0, 22.0, 30.0, 35.0, 36.0, 36.0, 37.0, 42.0, 53.0, 42.0, 48.0, 37.0, 41.0, 41.0, 59.0, 62.0, 31.0, 28.0, 29.0, 30.0, 25.0, 19.0, 9.0, 20.0, 12.0, 13.0, 13.0, 7.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.932397365570068, -7.667779922485352, -7.403162956237793, -7.138545989990234, -6.873928546905518, -6.609311103820801, -6.344694137573242, -6.080077171325684, -5.815459728240967, -5.55084228515625, -5.286225318908691, -5.021608352661133, -4.756990909576416, -4.492373466491699, -4.227756500244141, -3.963139295578003, -3.6985220909118652, -3.4339048862457275, -3.16928768157959, -2.904670476913452, -2.6400532722473145, -2.3754360675811768, -2.110818862915039, -1.8462016582489014, -1.5815844535827637, -1.316967248916626, -1.0523500442504883, -0.7877328395843506, -0.5231156349182129, -0.2584984302520752, 0.0061187744140625, 0.2707359790802002, 0.5353527069091797, 0.7999699115753174, 1.064587116241455, 1.3292043209075928, 1.5938215255737305, 1.8584387302398682, 2.123055934906006, 2.3876731395721436, 2.6522903442382812, 2.916907548904419, 3.1815247535705566, 3.4461419582366943, 3.710759162902832, 3.9753763675689697, 4.239993572235107, 4.504611015319824, 4.769227981567383, 5.033844947814941, 5.298462390899658, 5.563079833984375, 5.827696800231934, 6.092313766479492, 6.356931209564209, 6.621548652648926, 6.886165618896484, 7.150782585144043, 7.41540002822876, 7.680017471313477, 7.944634437561035, 8.209251403808594, 8.473869323730469, 8.738486289978027, 9.003103256225586]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 13.0, 10.0, 10.0, 9.0, 22.0, 15.0, 33.0, 25.0, 42.0, 31.0, 34.0, 32.0, 38.0, 49.0, 47.0, 49.0, 44.0, 39.0, 34.0, 33.0, 39.0, 41.0, 42.0, 37.0, 29.0, 39.0, 29.0, 20.0, 19.0, 20.0, 13.0, 10.0, 11.0, 7.0, 5.0, 5.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.678979873657227, -11.324647903442383, -10.970315933227539, -10.615984916687012, -10.261652946472168, -9.907320976257324, -9.55298900604248, -9.198657989501953, -8.84432601928711, -8.489994049072266, -8.135662078857422, -7.781330585479736, -7.426999092102051, -7.072667121887207, -6.718335151672363, -6.364003658294678, -6.009671688079834, -5.65533971786499, -5.301008224487305, -4.946676254272461, -4.592344760894775, -4.238012790679932, -3.883681058883667, -3.5293493270874023, -3.1750175952911377, -2.820685863494873, -2.4663541316986084, -2.1120223999023438, -1.7576905488967896, -1.403358817100525, -1.0490269660949707, -0.694695234298706, -0.3403635025024414, 0.01396825909614563, 0.36830002069473267, 0.7226318120956421, 1.0769635438919067, 1.4312952756881714, 1.7856271266937256, 2.1399588584899902, 2.494290590286255, 2.8486223220825195, 3.202954053878784, 3.557285785675049, 3.9116177558898926, 4.265949249267578, 4.620281219482422, 4.974613189697266, 5.328944683074951, 5.683276653289795, 6.0376081466674805, 6.391940116882324, 6.74627161026001, 7.1006035804748535, 7.454935073852539, 7.809267044067383, 8.163599014282227, 8.51793098449707, 8.872262954711914, 9.226593971252441, 9.580925941467285, 9.935257911682129, 10.289589881896973, 10.6439208984375, 10.998252868652344]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 5.0, 15.0, 18.0, 24.0, 31.0, 49.0, 86.0, 158.0, 261.0, 354.0, 639.0, 1031.0, 1692.0, 2777.0, 4473.0, 7537.0, 12511.0, 19781.0, 32176.0, 51376.0, 78722.0, 120260.0, 178700.0, 252484.0, 333567.0, 411400.0, 464256.0, 477694.0, 442369.0, 374792.0, 291628.0, 214331.0, 148122.0, 98770.0, 63898.0, 40561.0, 25556.0, 15873.0, 9963.0, 6204.0, 3755.0, 2400.0, 1457.0, 921.0, 593.0, 389.0, 222.0, 145.0, 106.0, 52.0, 35.0, 28.0, 22.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.9609375, -5.763916015625, -5.56689453125, -5.369873046875, -5.1728515625, -4.975830078125, -4.77880859375, -4.581787109375, -4.384765625, -4.187744140625, -3.99072265625, -3.793701171875, -3.5966796875, -3.399658203125, -3.20263671875, -3.005615234375, -2.80859375, -2.611572265625, -2.41455078125, -2.217529296875, -2.0205078125, -1.823486328125, -1.62646484375, -1.429443359375, -1.232421875, -1.035400390625, -0.83837890625, -0.641357421875, -0.4443359375, -0.247314453125, -0.05029296875, 0.146728515625, 0.34375, 0.540771484375, 0.73779296875, 0.934814453125, 1.1318359375, 1.328857421875, 1.52587890625, 1.722900390625, 1.919921875, 2.116943359375, 2.31396484375, 2.510986328125, 2.7080078125, 2.905029296875, 3.10205078125, 3.299072265625, 3.49609375, 3.693115234375, 3.89013671875, 4.087158203125, 4.2841796875, 4.481201171875, 4.67822265625, 4.875244140625, 5.072265625, 5.269287109375, 5.46630859375, 5.663330078125, 5.8603515625, 6.057373046875, 6.25439453125, 6.451416015625, 6.6484375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 11.0, 10.0, 16.0, 20.0, 16.0, 28.0, 34.0, 39.0, 34.0, 37.0, 28.0, 40.0, 39.0, 53.0, 39.0, 40.0, 48.0, 44.0, 36.0, 35.0, 30.0, 38.0, 40.0, 34.0, 24.0, 29.0, 28.0, 16.0, 21.0, 12.0, 13.0, 8.0, 10.0, 5.0, 6.0, 2.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.7940673828125, -8.510009765625, -8.2259521484375, -7.94189453125, -7.6578369140625, -7.373779296875, -7.0897216796875, -6.8056640625, -6.5216064453125, -6.237548828125, -5.9534912109375, -5.66943359375, -5.3853759765625, -5.101318359375, -4.8172607421875, -4.533203125, -4.2491455078125, -3.965087890625, -3.6810302734375, -3.39697265625, -3.1129150390625, -2.828857421875, -2.5447998046875, -2.2607421875, -1.9766845703125, -1.692626953125, -1.4085693359375, -1.12451171875, -0.8404541015625, -0.556396484375, -0.2723388671875, 0.01171875, 0.2957763671875, 0.579833984375, 0.8638916015625, 1.14794921875, 1.4320068359375, 1.716064453125, 2.0001220703125, 2.2841796875, 2.5682373046875, 2.852294921875, 3.1363525390625, 3.42041015625, 3.7044677734375, 3.988525390625, 4.2725830078125, 4.556640625, 4.8406982421875, 5.124755859375, 5.4088134765625, 5.69287109375, 5.9769287109375, 6.260986328125, 6.5450439453125, 6.8291015625, 7.1131591796875, 7.397216796875, 7.6812744140625, 7.96533203125, 8.2493896484375, 8.533447265625, 8.8175048828125, 9.1015625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 11.0, 18.0, 26.0, 60.0, 94.0, 161.0, 298.0, 491.0, 869.0, 1520.0, 2671.0, 4555.0, 7220.0, 12314.0, 19881.0, 31850.0, 50271.0, 75743.0, 112892.0, 161889.0, 220474.0, 285313.0, 348332.0, 395992.0, 422439.0, 419330.0, 385377.0, 331249.0, 266643.0, 203419.0, 146965.0, 101799.0, 68221.0, 44021.0, 27854.0, 17415.0, 10742.0, 6430.0, 3926.0, 2226.0, 1396.0, 779.0, 454.0, 288.0, 154.0, 93.0, 60.0, 30.0, 23.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.640625, -6.44451904296875, -6.2484130859375, -6.05230712890625, -5.856201171875, -5.66009521484375, -5.4639892578125, -5.26788330078125, -5.07177734375, -4.87567138671875, -4.6795654296875, -4.48345947265625, -4.287353515625, -4.09124755859375, -3.8951416015625, -3.69903564453125, -3.5029296875, -3.30682373046875, -3.1107177734375, -2.91461181640625, -2.718505859375, -2.52239990234375, -2.3262939453125, -2.13018798828125, -1.93408203125, -1.73797607421875, -1.5418701171875, -1.34576416015625, -1.149658203125, -0.95355224609375, -0.7574462890625, -0.56134033203125, -0.365234375, -0.16912841796875, 0.0269775390625, 0.22308349609375, 0.419189453125, 0.61529541015625, 0.8114013671875, 1.00750732421875, 1.20361328125, 1.39971923828125, 1.5958251953125, 1.79193115234375, 1.988037109375, 2.18414306640625, 2.3802490234375, 2.57635498046875, 2.7724609375, 2.96856689453125, 3.1646728515625, 3.36077880859375, 3.556884765625, 3.75299072265625, 3.9490966796875, 4.14520263671875, 4.34130859375, 4.53741455078125, 4.7335205078125, 4.92962646484375, 5.125732421875, 5.32183837890625, 5.5179443359375, 5.71405029296875, 5.91015625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 12.0, 10.0, 17.0, 23.0, 28.0, 33.0, 36.0, 61.0, 60.0, 67.0, 95.0, 108.0, 117.0, 134.0, 149.0, 163.0, 196.0, 204.0, 210.0, 199.0, 225.0, 199.0, 196.0, 177.0, 195.0, 159.0, 150.0, 139.0, 105.0, 97.0, 96.0, 83.0, 67.0, 57.0, 35.0, 32.0, 30.0, 28.0, 20.0, 17.0, 4.0, 7.0, 8.0, 6.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.765625, -3.645599365234375, -3.52557373046875, -3.405548095703125, -3.2855224609375, -3.165496826171875, -3.04547119140625, -2.925445556640625, -2.805419921875, -2.685394287109375, -2.56536865234375, -2.445343017578125, -2.3253173828125, -2.205291748046875, -2.08526611328125, -1.965240478515625, -1.84521484375, -1.725189208984375, -1.60516357421875, -1.485137939453125, -1.3651123046875, -1.245086669921875, -1.12506103515625, -1.005035400390625, -0.885009765625, -0.764984130859375, -0.64495849609375, -0.524932861328125, -0.4049072265625, -0.284881591796875, -0.16485595703125, -0.044830322265625, 0.0751953125, 0.195220947265625, 0.31524658203125, 0.435272216796875, 0.5552978515625, 0.675323486328125, 0.79534912109375, 0.915374755859375, 1.035400390625, 1.155426025390625, 1.27545166015625, 1.395477294921875, 1.5155029296875, 1.635528564453125, 1.75555419921875, 1.875579833984375, 1.99560546875, 2.115631103515625, 2.23565673828125, 2.355682373046875, 2.4757080078125, 2.595733642578125, 2.71575927734375, 2.835784912109375, 2.955810546875, 3.075836181640625, 3.19586181640625, 3.315887451171875, 3.4359130859375, 3.555938720703125, 3.67596435546875, 3.795989990234375, 3.916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 9.0, 14.0, 14.0, 14.0, 23.0, 22.0, 21.0, 38.0, 28.0, 38.0, 45.0, 49.0, 49.0, 47.0, 53.0, 39.0, 46.0, 49.0, 43.0, 38.0, 36.0, 37.0, 40.0, 22.0, 30.0, 27.0, 22.0, 13.0, 12.0, 10.0, 9.0, 8.0, 3.0, 4.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.935565948486328, -8.657419204711914, -8.379273414611816, -8.101126670837402, -7.822979927062988, -7.544833660125732, -7.266687393188477, -6.9885406494140625, -6.710393905639648, -6.432247638702393, -6.1541008949279785, -5.875954627990723, -5.597807884216309, -5.319661617279053, -5.041515350341797, -4.763368606567383, -4.485222339630127, -4.207076072692871, -3.928929328918457, -3.650783061981201, -3.372636318206787, -3.0944900512695312, -2.8163435459136963, -2.5381970405578613, -2.2600505352020264, -1.9819040298461914, -1.7037575244903564, -1.425611138343811, -1.147464632987976, -0.8693181276321411, -0.5911717414855957, -0.31302523612976074, -0.03487873077392578, 0.2432677447795868, 0.5214142203330994, 0.7995606660842896, 1.0777071714401245, 1.3558536767959595, 1.6340000629425049, 1.9121465682983398, 2.190293073654175, 2.4684395790100098, 2.7465860843658447, 3.0247325897216797, 3.3028788566589355, 3.5810256004333496, 3.8591718673706055, 4.1373186111450195, 4.415464878082275, 4.693611145019531, 4.971757888793945, 5.249904155731201, 5.528050899505615, 5.806197166442871, 6.084343910217285, 6.362490177154541, 6.640636444091797, 6.918782711029053, 7.196929454803467, 7.475075721740723, 7.753222465515137, 8.03136920928955, 8.309514999389648, 8.587661743164062, 8.865808486938477]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 4.0, 5.0, 8.0, 8.0, 14.0, 18.0, 11.0, 19.0, 19.0, 30.0, 28.0, 22.0, 35.0, 33.0, 25.0, 35.0, 35.0, 47.0, 48.0, 37.0, 44.0, 35.0, 41.0, 37.0, 37.0, 41.0, 36.0, 24.0, 26.0, 35.0, 15.0, 20.0, 20.0, 15.0, 14.0, 11.0, 14.0, 8.0, 9.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-10.641361236572266, -10.323243141174316, -10.005125045776367, -9.687006950378418, -9.368888854980469, -9.05077075958252, -8.73265266418457, -8.414533615112305, -8.096416473388672, -7.778298377990723, -7.460180282592773, -7.142062187194824, -6.823944091796875, -6.505825996398926, -6.187707424163818, -5.869589328765869, -5.551470756530762, -5.2333526611328125, -4.915234565734863, -4.597116470336914, -4.278998374938965, -3.9608800411224365, -3.642761707305908, -3.324643611907959, -3.0065255165100098, -2.6884074211120605, -2.3702893257141113, -2.052170991897583, -1.7340528964996338, -1.4159348011016846, -1.0978165864944458, -0.779698371887207, -0.4615802764892578, -0.14346212148666382, 0.17465603351593018, 0.49277418851852417, 0.8108923435211182, 1.1290104389190674, 1.4471286535263062, 1.765246868133545, 2.083364963531494, 2.4014830589294434, 2.7196011543273926, 3.037719488143921, 3.35583758354187, 3.6739556789398193, 3.9920740127563477, 4.310192108154297, 4.628310203552246, 4.946428298950195, 5.2645463943481445, 5.582664489746094, 5.900782585144043, 6.218900680541992, 6.5370192527771, 6.855137348175049, 7.173255443572998, 7.491373538970947, 7.8094916343688965, 8.127610206604004, 8.445728302001953, 8.763846397399902, 9.081964492797852, 9.4000825881958, 9.71820068359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 9.0, 16.0, 16.0, 32.0, 39.0, 52.0, 94.0, 142.0, 242.0, 391.0, 655.0, 977.0, 1626.0, 2499.0, 4171.0, 6729.0, 10500.0, 16763.0, 26098.0, 39839.0, 58897.0, 82100.0, 106103.0, 125909.0, 130666.0, 119105.0, 97501.0, 72625.0, 51024.0, 34070.0, 21912.0, 14345.0, 8842.0, 5466.0, 3490.0, 2144.0, 1288.0, 823.0, 514.0, 324.0, 186.0, 104.0, 95.0, 45.0, 35.0, 21.0, 15.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.6449432373046875, -1.590667724609375, -1.5363922119140625, -1.48211669921875, -1.4278411865234375, -1.373565673828125, -1.3192901611328125, -1.2650146484375, -1.2107391357421875, -1.156463623046875, -1.1021881103515625, -1.04791259765625, -0.9936370849609375, -0.939361572265625, -0.8850860595703125, -0.830810546875, -0.7765350341796875, -0.722259521484375, -0.6679840087890625, -0.61370849609375, -0.5594329833984375, -0.505157470703125, -0.4508819580078125, -0.3966064453125, -0.3423309326171875, -0.288055419921875, -0.2337799072265625, -0.17950439453125, -0.1252288818359375, -0.070953369140625, -0.0166778564453125, 0.03759765625, 0.0918731689453125, 0.146148681640625, 0.2004241943359375, 0.25469970703125, 0.3089752197265625, 0.363250732421875, 0.4175262451171875, 0.4718017578125, 0.5260772705078125, 0.580352783203125, 0.6346282958984375, 0.68890380859375, 0.7431793212890625, 0.797454833984375, 0.8517303466796875, 0.906005859375, 0.9602813720703125, 1.014556884765625, 1.0688323974609375, 1.12310791015625, 1.1773834228515625, 1.231658935546875, 1.2859344482421875, 1.3402099609375, 1.3944854736328125, 1.448760986328125, 1.5030364990234375, 1.55731201171875, 1.6115875244140625, 1.665863037109375, 1.7201385498046875, 1.7744140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 5.0, 6.0, 9.0, 8.0, 11.0, 10.0, 11.0, 17.0, 19.0, 26.0, 21.0, 24.0, 30.0, 37.0, 34.0, 34.0, 40.0, 37.0, 34.0, 45.0, 59.0, 50.0, 46.0, 29.0, 42.0, 41.0, 30.0, 28.0, 33.0, 30.0, 21.0, 21.0, 23.0, 18.0, 13.0, 11.0, 12.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.1646728515625, -10.821533203125, -10.4783935546875, -10.13525390625, -9.7921142578125, -9.448974609375, -9.1058349609375, -8.7626953125, -8.4195556640625, -8.076416015625, -7.7332763671875, -7.39013671875, -7.0469970703125, -6.703857421875, -6.3607177734375, -6.017578125, -5.6744384765625, -5.331298828125, -4.9881591796875, -4.64501953125, -4.3018798828125, -3.958740234375, -3.6156005859375, -3.2724609375, -2.9293212890625, -2.586181640625, -2.2430419921875, -1.89990234375, -1.5567626953125, -1.213623046875, -0.8704833984375, -0.52734375, -0.1842041015625, 0.158935546875, 0.5020751953125, 0.84521484375, 1.1883544921875, 1.531494140625, 1.8746337890625, 2.2177734375, 2.5609130859375, 2.904052734375, 3.2471923828125, 3.59033203125, 3.9334716796875, 4.276611328125, 4.6197509765625, 4.962890625, 5.3060302734375, 5.649169921875, 5.9923095703125, 6.33544921875, 6.6785888671875, 7.021728515625, 7.3648681640625, 7.7080078125, 8.0511474609375, 8.394287109375, 8.7374267578125, 9.08056640625, 9.4237060546875, 9.766845703125, 10.1099853515625, 10.453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 12.0, 16.0, 19.0, 31.0, 18.0, 48.0, 73.0, 111.0, 144.0, 215.0, 325.0, 500.0, 701.0, 1088.0, 1755.0, 2750.0, 4483.0, 7601.0, 12889.0, 22075.0, 39078.0, 65713.0, 105901.0, 150584.0, 174859.0, 159650.0, 116840.0, 74379.0, 44156.0, 25617.0, 14796.0, 8555.0, 5005.0, 3148.0, 1884.0, 1196.0, 742.0, 516.0, 360.0, 221.0, 146.0, 115.0, 78.0, 49.0, 30.0, 20.0, 11.0, 15.0, 6.0, 4.0, 7.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0], "bins": [-2.2109375, -2.13873291015625, -2.0665283203125, -1.99432373046875, -1.922119140625, -1.84991455078125, -1.7777099609375, -1.70550537109375, -1.63330078125, -1.56109619140625, -1.4888916015625, -1.41668701171875, -1.344482421875, -1.27227783203125, -1.2000732421875, -1.12786865234375, -1.0556640625, -0.98345947265625, -0.9112548828125, -0.83905029296875, -0.766845703125, -0.69464111328125, -0.6224365234375, -0.55023193359375, -0.47802734375, -0.40582275390625, -0.3336181640625, -0.26141357421875, -0.189208984375, -0.11700439453125, -0.0447998046875, 0.02740478515625, 0.099609375, 0.17181396484375, 0.2440185546875, 0.31622314453125, 0.388427734375, 0.46063232421875, 0.5328369140625, 0.60504150390625, 0.67724609375, 0.74945068359375, 0.8216552734375, 0.89385986328125, 0.966064453125, 1.03826904296875, 1.1104736328125, 1.18267822265625, 1.2548828125, 1.32708740234375, 1.3992919921875, 1.47149658203125, 1.543701171875, 1.61590576171875, 1.6881103515625, 1.76031494140625, 1.83251953125, 1.90472412109375, 1.9769287109375, 2.04913330078125, 2.121337890625, 2.19354248046875, 2.2657470703125, 2.33795166015625, 2.41015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 3.0, 7.0, 6.0, 16.0, 13.0, 13.0, 16.0, 24.0, 33.0, 29.0, 29.0, 34.0, 50.0, 33.0, 43.0, 36.0, 37.0, 53.0, 39.0, 32.0, 38.0, 46.0, 32.0, 34.0, 36.0, 34.0, 32.0, 24.0, 33.0, 27.0, 23.0, 15.0, 12.0, 11.0, 11.0, 11.0, 5.0, 4.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2901611328125, -6.072509765625, -5.8548583984375, -5.63720703125, -5.4195556640625, -5.201904296875, -4.9842529296875, -4.7666015625, -4.5489501953125, -4.331298828125, -4.1136474609375, -3.89599609375, -3.6783447265625, -3.460693359375, -3.2430419921875, -3.025390625, -2.8077392578125, -2.590087890625, -2.3724365234375, -2.15478515625, -1.9371337890625, -1.719482421875, -1.5018310546875, -1.2841796875, -1.0665283203125, -0.848876953125, -0.6312255859375, -0.41357421875, -0.1959228515625, 0.021728515625, 0.2393798828125, 0.45703125, 0.6746826171875, 0.892333984375, 1.1099853515625, 1.32763671875, 1.5452880859375, 1.762939453125, 1.9805908203125, 2.1982421875, 2.4158935546875, 2.633544921875, 2.8511962890625, 3.06884765625, 3.2864990234375, 3.504150390625, 3.7218017578125, 3.939453125, 4.1571044921875, 4.374755859375, 4.5924072265625, 4.81005859375, 5.0277099609375, 5.245361328125, 5.4630126953125, 5.6806640625, 5.8983154296875, 6.115966796875, 6.3336181640625, 6.55126953125, 6.7689208984375, 6.986572265625, 7.2042236328125, 7.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 10.0, 9.0, 10.0, 13.0, 22.0, 22.0, 34.0, 35.0, 50.0, 80.0, 116.0, 147.0, 227.0, 321.0, 439.0, 746.0, 1237.0, 2403.0, 6197.0, 29839.0, 251289.0, 616164.0, 113743.0, 15607.0, 4315.0, 1991.0, 1123.0, 768.0, 468.0, 318.0, 209.0, 165.0, 101.0, 88.0, 61.0, 33.0, 39.0, 33.0, 18.0, 12.0, 12.0, 10.0, 2.0, 3.0, 6.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.513671875, -2.438232421875, -2.36279296875, -2.287353515625, -2.2119140625, -2.136474609375, -2.06103515625, -1.985595703125, -1.91015625, -1.834716796875, -1.75927734375, -1.683837890625, -1.6083984375, -1.532958984375, -1.45751953125, -1.382080078125, -1.306640625, -1.231201171875, -1.15576171875, -1.080322265625, -1.0048828125, -0.929443359375, -0.85400390625, -0.778564453125, -0.703125, -0.627685546875, -0.55224609375, -0.476806640625, -0.4013671875, -0.325927734375, -0.25048828125, -0.175048828125, -0.099609375, -0.024169921875, 0.05126953125, 0.126708984375, 0.2021484375, 0.277587890625, 0.35302734375, 0.428466796875, 0.50390625, 0.579345703125, 0.65478515625, 0.730224609375, 0.8056640625, 0.881103515625, 0.95654296875, 1.031982421875, 1.107421875, 1.182861328125, 1.25830078125, 1.333740234375, 1.4091796875, 1.484619140625, 1.56005859375, 1.635498046875, 1.7109375, 1.786376953125, 1.86181640625, 1.937255859375, 2.0126953125, 2.088134765625, 2.16357421875, 2.239013671875, 2.314453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 9.0, 26.0, 31.0, 41.0, 65.0, 93.0, 124.0, 120.0, 139.0, 111.0, 80.0, 60.0, 25.0, 25.0, 9.0, 11.0, 7.0, 9.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.386373519897461e-05, -8.032936602830887e-05, -7.679499685764313e-05, -7.326062768697739e-05, -6.972625851631165e-05, -6.61918893456459e-05, -6.265752017498016e-05, -5.912315100431442e-05, -5.558878183364868e-05, -5.205441266298294e-05, -4.85200434923172e-05, -4.498567432165146e-05, -4.145130515098572e-05, -3.791693598031998e-05, -3.4382566809654236e-05, -3.0848197638988495e-05, -2.7313828468322754e-05, -2.3779459297657013e-05, -2.0245090126991272e-05, -1.671072095632553e-05, -1.317635178565979e-05, -9.641982614994049e-06, -6.107613444328308e-06, -2.573244273662567e-06, 9.611248970031738e-07, 4.495494067668915e-06, 8.029863238334656e-06, 1.1564232409000397e-05, 1.5098601579666138e-05, 1.863297075033188e-05, 2.216733992099762e-05, 2.570170909166336e-05, 2.92360782623291e-05, 3.277044743299484e-05, 3.6304816603660583e-05, 3.9839185774326324e-05, 4.3373554944992065e-05, 4.6907924115657806e-05, 5.044229328632355e-05, 5.397666245698929e-05, 5.751103162765503e-05, 6.104540079832077e-05, 6.457976996898651e-05, 6.811413913965225e-05, 7.164850831031799e-05, 7.518287748098373e-05, 7.871724665164948e-05, 8.225161582231522e-05, 8.578598499298096e-05, 8.93203541636467e-05, 9.285472333431244e-05, 9.638909250497818e-05, 9.992346167564392e-05, 0.00010345783084630966, 0.0001069922000169754, 0.00011052656918764114, 0.00011406093835830688, 0.00011759530752897263, 0.00012112967669963837, 0.0001246640458703041, 0.00012819841504096985, 0.0001317327842116356, 0.00013526715338230133, 0.00013880152255296707, 0.0001423358917236328]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 7.0, 7.0, 10.0, 13.0, 20.0, 22.0, 25.0, 49.0, 44.0, 74.0, 92.0, 114.0, 175.0, 228.0, 268.0, 430.0, 663.0, 882.0, 1570.0, 2693.0, 5230.0, 10902.0, 24672.0, 55253.0, 119139.0, 214021.0, 257338.0, 181716.0, 92974.0, 42411.0, 18538.0, 8603.0, 4176.0, 2151.0, 1258.0, 766.0, 525.0, 385.0, 293.0, 202.0, 174.0, 109.0, 97.0, 51.0, 39.0, 51.0, 29.0, 23.0, 13.0, 15.0, 5.0, 7.0, 3.0, 2.0, 4.0], "bins": [-1.2841796875, -1.247833251953125, -1.21148681640625, -1.175140380859375, -1.1387939453125, -1.102447509765625, -1.06610107421875, -1.029754638671875, -0.993408203125, -0.957061767578125, -0.92071533203125, -0.884368896484375, -0.8480224609375, -0.811676025390625, -0.77532958984375, -0.738983154296875, -0.70263671875, -0.666290283203125, -0.62994384765625, -0.593597412109375, -0.5572509765625, -0.520904541015625, -0.48455810546875, -0.448211669921875, -0.411865234375, -0.375518798828125, -0.33917236328125, -0.302825927734375, -0.2664794921875, -0.230133056640625, -0.19378662109375, -0.157440185546875, -0.12109375, -0.084747314453125, -0.04840087890625, -0.012054443359375, 0.0242919921875, 0.060638427734375, 0.09698486328125, 0.133331298828125, 0.169677734375, 0.206024169921875, 0.24237060546875, 0.278717041015625, 0.3150634765625, 0.351409912109375, 0.38775634765625, 0.424102783203125, 0.46044921875, 0.496795654296875, 0.53314208984375, 0.569488525390625, 0.6058349609375, 0.642181396484375, 0.67852783203125, 0.714874267578125, 0.751220703125, 0.787567138671875, 0.82391357421875, 0.860260009765625, 0.8966064453125, 0.932952880859375, 0.96929931640625, 1.005645751953125, 1.0419921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 8.0, 25.0, 22.0, 32.0, 49.0, 63.0, 74.0, 88.0, 110.0, 103.0, 86.0, 76.0, 57.0, 54.0, 43.0, 31.0, 20.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201171875, -0.600128173828125, -0.58013916015625, -0.560150146484375, -0.5401611328125, -0.520172119140625, -0.50018310546875, -0.480194091796875, -0.460205078125, -0.440216064453125, -0.42022705078125, -0.400238037109375, -0.3802490234375, -0.360260009765625, -0.34027099609375, -0.320281982421875, -0.30029296875, -0.280303955078125, -0.26031494140625, -0.240325927734375, -0.2203369140625, -0.200347900390625, -0.18035888671875, -0.160369873046875, -0.140380859375, -0.120391845703125, -0.10040283203125, -0.080413818359375, -0.0604248046875, -0.040435791015625, -0.02044677734375, -0.000457763671875, 0.01953125, 0.039520263671875, 0.05950927734375, 0.079498291015625, 0.0994873046875, 0.119476318359375, 0.13946533203125, 0.159454345703125, 0.179443359375, 0.199432373046875, 0.21942138671875, 0.239410400390625, 0.2593994140625, 0.279388427734375, 0.29937744140625, 0.319366455078125, 0.33935546875, 0.359344482421875, 0.37933349609375, 0.399322509765625, 0.4193115234375, 0.439300537109375, 0.45928955078125, 0.479278564453125, 0.499267578125, 0.519256591796875, 0.53924560546875, 0.559234619140625, 0.5792236328125, 0.599212646484375, 0.61920166015625, 0.639190673828125, 0.6591796875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 5.0, 9.0, 11.0, 11.0, 20.0, 14.0, 15.0, 21.0, 23.0, 29.0, 29.0, 41.0, 47.0, 39.0, 49.0, 55.0, 43.0, 54.0, 40.0, 47.0, 45.0, 39.0, 35.0, 39.0, 39.0, 26.0, 29.0, 26.0, 19.0, 18.0, 18.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.91954517364502, -8.644757270812988, -8.369969367980957, -8.095181465148926, -7.820393085479736, -7.545605182647705, -7.270816802978516, -6.996028900146484, -6.721240997314453, -6.446453094482422, -6.171665191650391, -5.896876811981201, -5.62208890914917, -5.347301006317139, -5.072512626647949, -4.797724723815918, -4.522936820983887, -4.2481489181518555, -3.973360776901245, -3.6985726356506348, -3.4237847328186035, -3.1489968299865723, -2.874208688735962, -2.5994205474853516, -2.3246326446533203, -2.049844741821289, -1.7750566005706787, -1.500268578529358, -1.225480556488037, -0.9506925344467163, -0.6759045124053955, -0.4011164903640747, -0.1263275146484375, 0.1484605073928833, 0.4232485294342041, 0.6980365514755249, 0.9728245735168457, 1.2476125955581665, 1.5224006175994873, 1.797188639640808, 2.071976661682129, 2.34676456451416, 2.6215527057647705, 2.896340847015381, 3.171128749847412, 3.4459166526794434, 3.7207047939300537, 3.995492935180664, 4.270280838012695, 4.545068740844727, 4.819856643676758, 5.094645023345947, 5.3694329261779785, 5.64422082901001, 5.919009208679199, 6.1937971115112305, 6.468585014343262, 6.743372917175293, 7.018160820007324, 7.292949199676514, 7.567737102508545, 7.842525005340576, 8.117313385009766, 8.392101287841797, 8.666889190673828]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 6.0, 2.0, 4.0, 8.0, 10.0, 11.0, 19.0, 13.0, 15.0, 16.0, 31.0, 29.0, 25.0, 33.0, 35.0, 26.0, 28.0, 41.0, 36.0, 47.0, 51.0, 40.0, 37.0, 43.0, 34.0, 34.0, 44.0, 36.0, 20.0, 34.0, 25.0, 22.0, 26.0, 17.0, 14.0, 15.0, 11.0, 15.0, 8.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.669568061828613, -10.350547790527344, -10.031526565551758, -9.712505340576172, -9.393485069274902, -9.074464797973633, -8.755443572998047, -8.436422348022461, -8.117402076721191, -7.798381328582764, -7.479360580444336, -7.160339832305908, -6.8413190841674805, -6.522298336029053, -6.203277587890625, -5.884256839752197, -5.5652360916137695, -5.246215343475342, -4.927194595336914, -4.608173847198486, -4.289153099060059, -3.970132350921631, -3.651111602783203, -3.3320908546447754, -3.0130701065063477, -2.69404935836792, -2.375028610229492, -2.0560078620910645, -1.7369871139526367, -1.417966365814209, -1.0989456176757812, -0.7799248695373535, -0.4609041213989258, -0.14188337326049805, 0.1771373748779297, 0.4961581230163574, 0.8151788711547852, 1.134199619293213, 1.4532203674316406, 1.7722411155700684, 2.091261863708496, 2.410282611846924, 2.7293033599853516, 3.0483241081237793, 3.367344856262207, 3.6863656044006348, 4.0053863525390625, 4.32440710067749, 4.643427848815918, 4.962448596954346, 5.281469345092773, 5.600490093231201, 5.919510841369629, 6.238531589508057, 6.557552337646484, 6.876573085784912, 7.19559383392334, 7.514614582061768, 7.833635330200195, 8.152656555175781, 8.47167682647705, 8.79069709777832, 9.109718322753906, 9.428739547729492, 9.747759819030762]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 16.0, 21.0, 21.0, 45.0, 64.0, 129.0, 175.0, 277.0, 470.0, 704.0, 1163.0, 1755.0, 2822.0, 4354.0, 6764.0, 10309.0, 15112.0, 22166.0, 31183.0, 43139.0, 56560.0, 70455.0, 84055.0, 94244.0, 99151.0, 98183.0, 90127.0, 78393.0, 65022.0, 50775.0, 37916.0, 27057.0, 18886.0, 12837.0, 8538.0, 5619.0, 3692.0, 2319.0, 1481.0, 941.0, 600.0, 384.0, 221.0, 137.0, 84.0, 63.0, 48.0, 31.0, 18.0, 8.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.81640625, -4.65997314453125, -4.5035400390625, -4.34710693359375, -4.190673828125, -4.03424072265625, -3.8778076171875, -3.72137451171875, -3.56494140625, -3.40850830078125, -3.2520751953125, -3.09564208984375, -2.939208984375, -2.78277587890625, -2.6263427734375, -2.46990966796875, -2.3134765625, -2.15704345703125, -2.0006103515625, -1.84417724609375, -1.687744140625, -1.53131103515625, -1.3748779296875, -1.21844482421875, -1.06201171875, -0.90557861328125, -0.7491455078125, -0.59271240234375, -0.436279296875, -0.27984619140625, -0.1234130859375, 0.03302001953125, 0.189453125, 0.34588623046875, 0.5023193359375, 0.65875244140625, 0.815185546875, 0.97161865234375, 1.1280517578125, 1.28448486328125, 1.44091796875, 1.59735107421875, 1.7537841796875, 1.91021728515625, 2.066650390625, 2.22308349609375, 2.3795166015625, 2.53594970703125, 2.6923828125, 2.84881591796875, 3.0052490234375, 3.16168212890625, 3.318115234375, 3.47454833984375, 3.6309814453125, 3.78741455078125, 3.94384765625, 4.10028076171875, 4.2567138671875, 4.41314697265625, 4.569580078125, 4.72601318359375, 4.8824462890625, 5.03887939453125, 5.1953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 7.0, 5.0, 18.0, 14.0, 16.0, 13.0, 15.0, 18.0, 31.0, 27.0, 30.0, 36.0, 28.0, 38.0, 36.0, 45.0, 38.0, 41.0, 43.0, 52.0, 45.0, 41.0, 31.0, 40.0, 32.0, 44.0, 35.0, 16.0, 21.0, 26.0, 17.0, 18.0, 16.0, 9.0, 12.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.359375, -11.0216064453125, -10.683837890625, -10.3460693359375, -10.00830078125, -9.6705322265625, -9.332763671875, -8.9949951171875, -8.6572265625, -8.3194580078125, -7.981689453125, -7.6439208984375, -7.30615234375, -6.9683837890625, -6.630615234375, -6.2928466796875, -5.955078125, -5.6173095703125, -5.279541015625, -4.9417724609375, -4.60400390625, -4.2662353515625, -3.928466796875, -3.5906982421875, -3.2529296875, -2.9151611328125, -2.577392578125, -2.2396240234375, -1.90185546875, -1.5640869140625, -1.226318359375, -0.8885498046875, -0.55078125, -0.2130126953125, 0.124755859375, 0.4625244140625, 0.80029296875, 1.1380615234375, 1.475830078125, 1.8135986328125, 2.1513671875, 2.4891357421875, 2.826904296875, 3.1646728515625, 3.50244140625, 3.8402099609375, 4.177978515625, 4.5157470703125, 4.853515625, 5.1912841796875, 5.529052734375, 5.8668212890625, 6.20458984375, 6.5423583984375, 6.880126953125, 7.2178955078125, 7.5556640625, 7.8934326171875, 8.231201171875, 8.5689697265625, 8.90673828125, 9.2445068359375, 9.582275390625, 9.9200439453125, 10.2578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 4.0, 15.0, 17.0, 30.0, 51.0, 89.0, 119.0, 211.0, 329.0, 555.0, 886.0, 1380.0, 2255.0, 3542.0, 5375.0, 8446.0, 12944.0, 19296.0, 27914.0, 39016.0, 52845.0, 67954.0, 82877.0, 95953.0, 102032.0, 102330.0, 95413.0, 83155.0, 68313.0, 52759.0, 39248.0, 27544.0, 19201.0, 12926.0, 8558.0, 5502.0, 3539.0, 2255.0, 1428.0, 884.0, 532.0, 328.0, 205.0, 116.0, 61.0, 56.0, 25.0, 23.0, 15.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375, 5.5107421875, 5.677734375, 5.8447265625, 6.01171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 14.0, 11.0, 8.0, 14.0, 16.0, 14.0, 24.0, 35.0, 27.0, 25.0, 22.0, 28.0, 34.0, 25.0, 41.0, 29.0, 22.0, 25.0, 42.0, 27.0, 31.0, 35.0, 39.0, 31.0, 28.0, 32.0, 36.0, 30.0, 23.0, 18.0, 27.0, 24.0, 17.0, 20.0, 15.0, 12.0, 15.0, 11.0, 8.0, 13.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.65234375, -5.472412109375, -5.29248046875, -5.112548828125, -4.9326171875, -4.752685546875, -4.57275390625, -4.392822265625, -4.212890625, -4.032958984375, -3.85302734375, -3.673095703125, -3.4931640625, -3.313232421875, -3.13330078125, -2.953369140625, -2.7734375, -2.593505859375, -2.41357421875, -2.233642578125, -2.0537109375, -1.873779296875, -1.69384765625, -1.513916015625, -1.333984375, -1.154052734375, -0.97412109375, -0.794189453125, -0.6142578125, -0.434326171875, -0.25439453125, -0.074462890625, 0.10546875, 0.285400390625, 0.46533203125, 0.645263671875, 0.8251953125, 1.005126953125, 1.18505859375, 1.364990234375, 1.544921875, 1.724853515625, 1.90478515625, 2.084716796875, 2.2646484375, 2.444580078125, 2.62451171875, 2.804443359375, 2.984375, 3.164306640625, 3.34423828125, 3.524169921875, 3.7041015625, 3.884033203125, 4.06396484375, 4.243896484375, 4.423828125, 4.603759765625, 4.78369140625, 4.963623046875, 5.1435546875, 5.323486328125, 5.50341796875, 5.683349609375, 5.86328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 3.0, 8.0, 13.0, 8.0, 15.0, 33.0, 56.0, 71.0, 122.0, 193.0, 305.0, 503.0, 757.0, 1269.0, 2056.0, 3212.0, 5462.0, 8709.0, 14531.0, 22919.0, 35728.0, 54251.0, 76470.0, 99609.0, 118520.0, 127481.0, 121657.0, 105292.0, 82477.0, 59276.0, 39683.0, 26150.0, 16016.0, 10072.0, 5943.0, 3592.0, 2326.0, 1410.0, 905.0, 517.0, 341.0, 214.0, 123.0, 104.0, 61.0, 33.0, 22.0, 15.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.22235107421875, -2.1497802734375, -2.07720947265625, -2.004638671875, -1.93206787109375, -1.8594970703125, -1.78692626953125, -1.71435546875, -1.64178466796875, -1.5692138671875, -1.49664306640625, -1.424072265625, -1.35150146484375, -1.2789306640625, -1.20635986328125, -1.1337890625, -1.06121826171875, -0.9886474609375, -0.91607666015625, -0.843505859375, -0.77093505859375, -0.6983642578125, -0.62579345703125, -0.55322265625, -0.48065185546875, -0.4080810546875, -0.33551025390625, -0.262939453125, -0.19036865234375, -0.1177978515625, -0.04522705078125, 0.02734375, 0.09991455078125, 0.1724853515625, 0.24505615234375, 0.317626953125, 0.39019775390625, 0.4627685546875, 0.53533935546875, 0.60791015625, 0.68048095703125, 0.7530517578125, 0.82562255859375, 0.898193359375, 0.97076416015625, 1.0433349609375, 1.11590576171875, 1.1884765625, 1.26104736328125, 1.3336181640625, 1.40618896484375, 1.478759765625, 1.55133056640625, 1.6239013671875, 1.69647216796875, 1.76904296875, 1.84161376953125, 1.9141845703125, 1.98675537109375, 2.059326171875, 2.13189697265625, 2.2044677734375, 2.27703857421875, 2.349609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 5.0, 6.0, 2.0, 5.0, 5.0, 6.0, 9.0, 13.0, 6.0, 10.0, 15.0, 28.0, 25.0, 28.0, 27.0, 38.0, 40.0, 48.0, 47.0, 58.0, 48.0, 46.0, 48.0, 48.0, 49.0, 45.0, 41.0, 34.0, 42.0, 27.0, 35.0, 21.0, 15.0, 17.0, 13.0, 10.0, 16.0, 8.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020842626690864563, -0.00020060688257217407, -0.00019278749823570251, -0.00018496811389923096, -0.0001771487295627594, -0.00016932934522628784, -0.00016150996088981628, -0.00015369057655334473, -0.00014587119221687317, -0.0001380518078804016, -0.00013023242354393005, -0.0001224130392074585, -0.00011459365487098694, -0.00010677427053451538, -9.895488619804382e-05, -9.113550186157227e-05, -8.331611752510071e-05, -7.549673318862915e-05, -6.767734885215759e-05, -5.9857964515686035e-05, -5.203858017921448e-05, -4.421919584274292e-05, -3.639981150627136e-05, -2.8580427169799805e-05, -2.0761042833328247e-05, -1.294165849685669e-05, -5.122274160385132e-06, 2.6971101760864258e-06, 1.0516494512557983e-05, 1.833587884902954e-05, 2.61552631855011e-05, 3.3974647521972656e-05, 4.1794031858444214e-05, 4.961341619491577e-05, 5.743280053138733e-05, 6.525218486785889e-05, 7.307156920433044e-05, 8.0890953540802e-05, 8.871033787727356e-05, 9.652972221374512e-05, 0.00010434910655021667, 0.00011216849088668823, 0.00011998787522315979, 0.00012780725955963135, 0.0001356266438961029, 0.00014344602823257446, 0.00015126541256904602, 0.00015908479690551758, 0.00016690418124198914, 0.0001747235655784607, 0.00018254294991493225, 0.0001903623342514038, 0.00019818171858787537, 0.00020600110292434692, 0.00021382048726081848, 0.00022163987159729004, 0.0002294592559337616, 0.00023727864027023315, 0.0002450980246067047, 0.00025291740894317627, 0.00026073679327964783, 0.0002685561776161194, 0.00027637556195259094, 0.0002841949462890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 22.0, 30.0, 48.0, 58.0, 77.0, 134.0, 187.0, 323.0, 535.0, 865.0, 1563.0, 2886.0, 5648.0, 10931.0, 21927.0, 42400.0, 76229.0, 122808.0, 166206.0, 182072.0, 157755.0, 111690.0, 68133.0, 36554.0, 19283.0, 9414.0, 4766.0, 2580.0, 1319.0, 770.0, 491.0, 283.0, 162.0, 100.0, 77.0, 55.0, 36.0, 28.0, 23.0, 10.0, 8.0, 11.0, 5.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.365234375, -3.250732421875, -3.13623046875, -3.021728515625, -2.9072265625, -2.792724609375, -2.67822265625, -2.563720703125, -2.44921875, -2.334716796875, -2.22021484375, -2.105712890625, -1.9912109375, -1.876708984375, -1.76220703125, -1.647705078125, -1.533203125, -1.418701171875, -1.30419921875, -1.189697265625, -1.0751953125, -0.960693359375, -0.84619140625, -0.731689453125, -0.6171875, -0.502685546875, -0.38818359375, -0.273681640625, -0.1591796875, -0.044677734375, 0.06982421875, 0.184326171875, 0.298828125, 0.413330078125, 0.52783203125, 0.642333984375, 0.7568359375, 0.871337890625, 0.98583984375, 1.100341796875, 1.21484375, 1.329345703125, 1.44384765625, 1.558349609375, 1.6728515625, 1.787353515625, 1.90185546875, 2.016357421875, 2.130859375, 2.245361328125, 2.35986328125, 2.474365234375, 2.5888671875, 2.703369140625, 2.81787109375, 2.932373046875, 3.046875, 3.161376953125, 3.27587890625, 3.390380859375, 3.5048828125, 3.619384765625, 3.73388671875, 3.848388671875, 3.962890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 11.0, 9.0, 6.0, 17.0, 16.0, 22.0, 20.0, 35.0, 32.0, 37.0, 36.0, 53.0, 52.0, 60.0, 71.0, 47.0, 59.0, 50.0, 51.0, 55.0, 49.0, 39.0, 28.0, 27.0, 29.0, 19.0, 14.0, 13.0, 6.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.475616455078125, -1.42584228515625, -1.376068115234375, -1.3262939453125, -1.276519775390625, -1.22674560546875, -1.176971435546875, -1.127197265625, -1.077423095703125, -1.02764892578125, -0.977874755859375, -0.9281005859375, -0.878326416015625, -0.82855224609375, -0.778778076171875, -0.72900390625, -0.679229736328125, -0.62945556640625, -0.579681396484375, -0.5299072265625, -0.480133056640625, -0.43035888671875, -0.380584716796875, -0.330810546875, -0.281036376953125, -0.23126220703125, -0.181488037109375, -0.1317138671875, -0.081939697265625, -0.03216552734375, 0.017608642578125, 0.0673828125, 0.117156982421875, 0.16693115234375, 0.216705322265625, 0.2664794921875, 0.316253662109375, 0.36602783203125, 0.415802001953125, 0.465576171875, 0.515350341796875, 0.56512451171875, 0.614898681640625, 0.6646728515625, 0.714447021484375, 0.76422119140625, 0.813995361328125, 0.86376953125, 0.913543701171875, 0.96331787109375, 1.013092041015625, 1.0628662109375, 1.112640380859375, 1.16241455078125, 1.212188720703125, 1.261962890625, 1.311737060546875, 1.36151123046875, 1.411285400390625, 1.4610595703125, 1.510833740234375, 1.56060791015625, 1.610382080078125, 1.66015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 15.0, 22.0, 14.0, 18.0, 25.0, 23.0, 30.0, 24.0, 33.0, 31.0, 43.0, 39.0, 44.0, 53.0, 42.0, 44.0, 42.0, 49.0, 44.0, 36.0, 41.0, 32.0, 35.0, 32.0, 28.0, 26.0, 14.0, 20.0, 12.0, 16.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.190849304199219, -8.923033714294434, -8.655219078063965, -8.38740348815918, -8.119587898254395, -7.851773262023926, -7.583957672119141, -7.316142559051514, -7.048327445983887, -6.78051233291626, -6.512696743011475, -6.244881629943848, -5.977066516876221, -5.709251403808594, -5.441435813903809, -5.173620700836182, -4.9058051109313965, -4.6379899978637695, -4.370174407958984, -4.102359294891357, -3.8345441818237305, -3.5667288303375244, -3.2989134788513184, -3.0310983657836914, -2.7632830142974854, -2.4954676628112793, -2.2276525497436523, -1.9598371982574463, -1.6920219659805298, -1.4242067337036133, -1.1563913822174072, -0.8885761499404907, -0.6207613945007324, -0.35294613242149353, -0.08513087034225464, 0.18268442153930664, 0.45049965381622314, 0.7183148860931396, 0.9861302375793457, 1.2539454698562622, 1.5217607021331787, 1.7895759344100952, 2.0573911666870117, 2.3252065181732178, 2.593021869659424, 2.860836982727051, 3.128652334213257, 3.396467685699463, 3.66428279876709, 3.932098150253296, 4.199913501739502, 4.467728614807129, 4.735543727874756, 5.003358840942383, 5.271174430847168, 5.538989543914795, 5.806804656982422, 6.074619770050049, 6.342435359954834, 6.610250473022461, 6.878065586090088, 7.145880699157715, 7.4136962890625, 7.681511402130127, 7.949326992034912]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 7.0, 4.0, 5.0, 9.0, 9.0, 18.0, 20.0, 23.0, 23.0, 31.0, 29.0, 33.0, 35.0, 39.0, 49.0, 35.0, 35.0, 43.0, 42.0, 40.0, 36.0, 42.0, 41.0, 43.0, 37.0, 32.0, 30.0, 35.0, 23.0, 25.0, 27.0, 14.0, 16.0, 13.0, 11.0, 10.0, 12.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.988386154174805, -11.627701759338379, -11.26701831817627, -10.906333923339844, -10.545650482177734, -10.184966087341309, -9.824281692504883, -9.463598251342773, -9.102913856506348, -8.742229461669922, -8.381546020507812, -8.020861625671387, -7.660177707672119, -7.299493789672852, -6.938809394836426, -6.578125476837158, -6.217441558837891, -5.856757640838623, -5.4960737228393555, -5.13538932800293, -4.774705410003662, -4.4140214920043945, -4.053337097167969, -3.692653179168701, -3.3319692611694336, -2.971285343170166, -2.6106011867523193, -2.2499170303344727, -1.889233112335205, -1.528549075126648, -1.1678650379180908, -0.8071808815002441, -0.44649600982666016, -0.08581197261810303, 0.2748720645904541, 0.6355561017990112, 0.9962401390075684, 1.3569241762161255, 1.7176082134246826, 2.0782923698425293, 2.438976287841797, 2.7996602058410645, 3.160344362258911, 3.521028518676758, 3.8817124366760254, 4.242396354675293, 4.603080749511719, 4.963764667510986, 5.324448585510254, 5.6851325035095215, 6.045816421508789, 6.406500816345215, 6.767184734344482, 7.12786865234375, 7.488553047180176, 7.849236965179443, 8.209920883178711, 8.570605278015137, 8.931288719177246, 9.291973114013672, 9.652656555175781, 10.013340950012207, 10.374025344848633, 10.734708786010742, 11.095393180847168]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 17.0, 26.0, 31.0, 57.0, 75.0, 121.0, 239.0, 384.0, 603.0, 978.0, 1685.0, 2845.0, 4768.0, 8060.0, 13042.0, 21736.0, 35209.0, 56573.0, 86420.0, 130632.0, 187596.0, 257338.0, 334152.0, 401070.0, 445558.0, 455735.0, 425844.0, 366810.0, 292456.0, 219695.0, 155311.0, 105264.0, 69063.0, 44033.0, 27416.0, 16913.0, 10461.0, 6222.0, 3758.0, 2345.0, 1454.0, 900.0, 493.0, 328.0, 197.0, 137.0, 80.0, 62.0, 40.0, 17.0, 17.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0], "bins": [-6.8203125, -6.60870361328125, -6.3970947265625, -6.18548583984375, -5.973876953125, -5.76226806640625, -5.5506591796875, -5.33905029296875, -5.12744140625, -4.91583251953125, -4.7042236328125, -4.49261474609375, -4.281005859375, -4.06939697265625, -3.8577880859375, -3.64617919921875, -3.4345703125, -3.22296142578125, -3.0113525390625, -2.79974365234375, -2.588134765625, -2.37652587890625, -2.1649169921875, -1.95330810546875, -1.74169921875, -1.53009033203125, -1.3184814453125, -1.10687255859375, -0.895263671875, -0.68365478515625, -0.4720458984375, -0.26043701171875, -0.048828125, 0.16278076171875, 0.3743896484375, 0.58599853515625, 0.797607421875, 1.00921630859375, 1.2208251953125, 1.43243408203125, 1.64404296875, 1.85565185546875, 2.0672607421875, 2.27886962890625, 2.490478515625, 2.70208740234375, 2.9136962890625, 3.12530517578125, 3.3369140625, 3.54852294921875, 3.7601318359375, 3.97174072265625, 4.183349609375, 4.39495849609375, 4.6065673828125, 4.81817626953125, 5.02978515625, 5.24139404296875, 5.4530029296875, 5.66461181640625, 5.876220703125, 6.08782958984375, 6.2994384765625, 6.51104736328125, 6.72265625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 4.0, 6.0, 2.0, 12.0, 14.0, 16.0, 18.0, 19.0, 26.0, 31.0, 23.0, 31.0, 32.0, 31.0, 29.0, 42.0, 45.0, 40.0, 39.0, 46.0, 45.0, 45.0, 42.0, 31.0, 42.0, 28.0, 28.0, 37.0, 33.0, 24.0, 25.0, 17.0, 18.0, 10.0, 13.0, 16.0, 5.0, 8.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0703125, -8.773193359375, -8.47607421875, -8.178955078125, -7.8818359375, -7.584716796875, -7.28759765625, -6.990478515625, -6.693359375, -6.396240234375, -6.09912109375, -5.802001953125, -5.5048828125, -5.207763671875, -4.91064453125, -4.613525390625, -4.31640625, -4.019287109375, -3.72216796875, -3.425048828125, -3.1279296875, -2.830810546875, -2.53369140625, -2.236572265625, -1.939453125, -1.642333984375, -1.34521484375, -1.048095703125, -0.7509765625, -0.453857421875, -0.15673828125, 0.140380859375, 0.4375, 0.734619140625, 1.03173828125, 1.328857421875, 1.6259765625, 1.923095703125, 2.22021484375, 2.517333984375, 2.814453125, 3.111572265625, 3.40869140625, 3.705810546875, 4.0029296875, 4.300048828125, 4.59716796875, 4.894287109375, 5.19140625, 5.488525390625, 5.78564453125, 6.082763671875, 6.3798828125, 6.677001953125, 6.97412109375, 7.271240234375, 7.568359375, 7.865478515625, 8.16259765625, 8.459716796875, 8.7568359375, 9.053955078125, 9.35107421875, 9.648193359375, 9.9453125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 8.0, 8.0, 12.0, 29.0, 46.0, 79.0, 138.0, 207.0, 353.0, 610.0, 1022.0, 1711.0, 2926.0, 4707.0, 7612.0, 12322.0, 19705.0, 31401.0, 47578.0, 71165.0, 102914.0, 143940.0, 192390.0, 246629.0, 299493.0, 346904.0, 378401.0, 388616.0, 377253.0, 344360.0, 297824.0, 243649.0, 190164.0, 141461.0, 100548.0, 70024.0, 46901.0, 30476.0, 19634.0, 12093.0, 7413.0, 4544.0, 2790.0, 1675.0, 997.0, 620.0, 382.0, 220.0, 150.0, 69.0, 46.0, 20.0, 22.0, 11.0, 9.0, 3.0, 6.0, 2.0, 1.0], "bins": [-6.40234375, -6.2052001953125, -6.008056640625, -5.8109130859375, -5.61376953125, -5.4166259765625, -5.219482421875, -5.0223388671875, -4.8251953125, -4.6280517578125, -4.430908203125, -4.2337646484375, -4.03662109375, -3.8394775390625, -3.642333984375, -3.4451904296875, -3.248046875, -3.0509033203125, -2.853759765625, -2.6566162109375, -2.45947265625, -2.2623291015625, -2.065185546875, -1.8680419921875, -1.6708984375, -1.4737548828125, -1.276611328125, -1.0794677734375, -0.88232421875, -0.6851806640625, -0.488037109375, -0.2908935546875, -0.09375, 0.1033935546875, 0.300537109375, 0.4976806640625, 0.69482421875, 0.8919677734375, 1.089111328125, 1.2862548828125, 1.4833984375, 1.6805419921875, 1.877685546875, 2.0748291015625, 2.27197265625, 2.4691162109375, 2.666259765625, 2.8634033203125, 3.060546875, 3.2576904296875, 3.454833984375, 3.6519775390625, 3.84912109375, 4.0462646484375, 4.243408203125, 4.4405517578125, 4.6376953125, 4.8348388671875, 5.031982421875, 5.2291259765625, 5.42626953125, 5.6234130859375, 5.820556640625, 6.0177001953125, 6.21484375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 11.0, 12.0, 19.0, 18.0, 21.0, 36.0, 50.0, 56.0, 69.0, 75.0, 100.0, 103.0, 114.0, 152.0, 155.0, 201.0, 211.0, 184.0, 224.0, 233.0, 241.0, 238.0, 217.0, 182.0, 173.0, 155.0, 134.0, 121.0, 114.0, 90.0, 78.0, 50.0, 42.0, 42.0, 34.0, 27.0, 21.0, 19.0, 15.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.12890625, -3.99005126953125, -3.8511962890625, -3.71234130859375, -3.573486328125, -3.43463134765625, -3.2957763671875, -3.15692138671875, -3.01806640625, -2.87921142578125, -2.7403564453125, -2.60150146484375, -2.462646484375, -2.32379150390625, -2.1849365234375, -2.04608154296875, -1.9072265625, -1.76837158203125, -1.6295166015625, -1.49066162109375, -1.351806640625, -1.21295166015625, -1.0740966796875, -0.93524169921875, -0.79638671875, -0.65753173828125, -0.5186767578125, -0.37982177734375, -0.240966796875, -0.10211181640625, 0.0367431640625, 0.17559814453125, 0.314453125, 0.45330810546875, 0.5921630859375, 0.73101806640625, 0.869873046875, 1.00872802734375, 1.1475830078125, 1.28643798828125, 1.42529296875, 1.56414794921875, 1.7030029296875, 1.84185791015625, 1.980712890625, 2.11956787109375, 2.2584228515625, 2.39727783203125, 2.5361328125, 2.67498779296875, 2.8138427734375, 2.95269775390625, 3.091552734375, 3.23040771484375, 3.3692626953125, 3.50811767578125, 3.64697265625, 3.78582763671875, 3.9246826171875, 4.06353759765625, 4.202392578125, 4.34124755859375, 4.4801025390625, 4.61895751953125, 4.7578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 2.0, 8.0, 8.0, 10.0, 10.0, 11.0, 17.0, 19.0, 25.0, 18.0, 35.0, 29.0, 41.0, 44.0, 42.0, 37.0, 40.0, 46.0, 60.0, 52.0, 55.0, 37.0, 37.0, 40.0, 35.0, 31.0, 30.0, 32.0, 23.0, 25.0, 19.0, 18.0, 11.0, 8.0, 8.0, 3.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.394795417785645, -8.1011962890625, -7.807596206665039, -7.5139970779418945, -7.220397472381592, -6.926797866821289, -6.6331987380981445, -6.339599132537842, -6.045999526977539, -5.752399921417236, -5.458800315856934, -5.165201187133789, -4.871601581573486, -4.578001976013184, -4.284402847290039, -3.9908032417297363, -3.6972036361694336, -3.403604030609131, -3.1100046634674072, -2.8164052963256836, -2.522805690765381, -2.229206085205078, -1.9356067180633545, -1.6420073509216309, -1.3484077453613281, -1.054808259010315, -0.7612087726593018, -0.4676092863082886, -0.1740097999572754, 0.11958968639373779, 0.413189172744751, 0.7067885398864746, 1.0003881454467773, 1.2939876317977905, 1.5875871181488037, 1.881186604499817, 2.17478609085083, 2.468385696411133, 2.7619850635528564, 3.05558443069458, 3.349184036254883, 3.6427836418151855, 3.936383008956909, 4.229982376098633, 4.5235819816589355, 4.817181587219238, 5.110780715942383, 5.4043803215026855, 5.697979927062988, 5.991579532623291, 6.285179138183594, 6.578778266906738, 6.872377872467041, 7.165977478027344, 7.459576606750488, 7.753176212310791, 8.046775817871094, 8.340374946594238, 8.6339750289917, 8.927574157714844, 9.221174240112305, 9.51477336883545, 9.808372497558594, 10.101972579956055, 10.3955717086792]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 10.0, 13.0, 22.0, 22.0, 27.0, 21.0, 21.0, 30.0, 33.0, 43.0, 28.0, 36.0, 41.0, 41.0, 55.0, 36.0, 55.0, 34.0, 54.0, 32.0, 34.0, 44.0, 29.0, 33.0, 27.0, 33.0, 20.0, 12.0, 22.0, 11.0, 14.0, 15.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.127070426940918, -10.750505447387695, -10.373941421508789, -9.997376441955566, -9.620811462402344, -9.244247436523438, -8.867682456970215, -8.491117477416992, -8.114553451538086, -7.7379889488220215, -7.361424446105957, -6.984859466552734, -6.60829496383667, -6.2317304611206055, -5.855165481567383, -5.478600978851318, -5.102036476135254, -4.7254719734191895, -4.348907470703125, -3.9723424911499023, -3.595777988433838, -3.2192134857177734, -2.84264874458313, -2.4660840034484863, -2.089519500732422, -1.7129548788070679, -1.3363902568817139, -0.9598256349563599, -0.5832610130310059, -0.20669639110565186, 0.16986823081970215, 0.5464329719543457, 0.9229974746704102, 1.2995620965957642, 1.6761267185211182, 2.0526914596557617, 2.429255962371826, 2.8058204650878906, 3.182385206222534, 3.5589499473571777, 3.935514450073242, 4.312078952789307, 4.688643455505371, 5.065208435058594, 5.441772937774658, 5.818337440490723, 6.194902420043945, 6.57146692276001, 6.948031425476074, 7.324595928192139, 7.701160430908203, 8.077725410461426, 8.454290390014648, 8.830854415893555, 9.207419395446777, 9.583984375, 9.960548400878906, 10.337113380432129, 10.713677406311035, 11.090242385864258, 11.466806411743164, 11.843371391296387, 12.21993637084961, 12.596500396728516, 12.973065376281738]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 7.0, 14.0, 13.0, 20.0, 23.0, 44.0, 66.0, 92.0, 173.0, 268.0, 400.0, 677.0, 1191.0, 2128.0, 3721.0, 6478.0, 11320.0, 20373.0, 35571.0, 59872.0, 94611.0, 134323.0, 164540.0, 161495.0, 129235.0, 89351.0, 56147.0, 32913.0, 18777.0, 10701.0, 5956.0, 3350.0, 1909.0, 1114.0, 640.0, 385.0, 251.0, 144.0, 99.0, 44.0, 37.0, 25.0, 14.0, 13.0, 13.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.198455810546875, -2.12738037109375, -2.056304931640625, -1.9852294921875, -1.914154052734375, -1.84307861328125, -1.772003173828125, -1.700927734375, -1.629852294921875, -1.55877685546875, -1.487701416015625, -1.4166259765625, -1.345550537109375, -1.27447509765625, -1.203399658203125, -1.13232421875, -1.061248779296875, -0.99017333984375, -0.919097900390625, -0.8480224609375, -0.776947021484375, -0.70587158203125, -0.634796142578125, -0.563720703125, -0.492645263671875, -0.42156982421875, -0.350494384765625, -0.2794189453125, -0.208343505859375, -0.13726806640625, -0.066192626953125, 0.0048828125, 0.075958251953125, 0.14703369140625, 0.218109130859375, 0.2891845703125, 0.360260009765625, 0.43133544921875, 0.502410888671875, 0.573486328125, 0.644561767578125, 0.71563720703125, 0.786712646484375, 0.8577880859375, 0.928863525390625, 0.99993896484375, 1.071014404296875, 1.14208984375, 1.213165283203125, 1.28424072265625, 1.355316162109375, 1.4263916015625, 1.497467041015625, 1.56854248046875, 1.639617919921875, 1.710693359375, 1.781768798828125, 1.85284423828125, 1.923919677734375, 1.9949951171875, 2.066070556640625, 2.13714599609375, 2.208221435546875, 2.279296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 5.0, 11.0, 13.0, 15.0, 14.0, 8.0, 27.0, 35.0, 28.0, 27.0, 31.0, 35.0, 42.0, 44.0, 52.0, 36.0, 54.0, 54.0, 41.0, 46.0, 48.0, 43.0, 40.0, 39.0, 31.0, 23.0, 30.0, 19.0, 24.0, 9.0, 16.0, 13.0, 7.0, 9.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.265625, -12.8536376953125, -12.441650390625, -12.0296630859375, -11.61767578125, -11.2056884765625, -10.793701171875, -10.3817138671875, -9.9697265625, -9.5577392578125, -9.145751953125, -8.7337646484375, -8.32177734375, -7.9097900390625, -7.497802734375, -7.0858154296875, -6.673828125, -6.2618408203125, -5.849853515625, -5.4378662109375, -5.02587890625, -4.6138916015625, -4.201904296875, -3.7899169921875, -3.3779296875, -2.9659423828125, -2.553955078125, -2.1419677734375, -1.72998046875, -1.3179931640625, -0.906005859375, -0.4940185546875, -0.08203125, 0.3299560546875, 0.741943359375, 1.1539306640625, 1.56591796875, 1.9779052734375, 2.389892578125, 2.8018798828125, 3.2138671875, 3.6258544921875, 4.037841796875, 4.4498291015625, 4.86181640625, 5.2738037109375, 5.685791015625, 6.0977783203125, 6.509765625, 6.9217529296875, 7.333740234375, 7.7457275390625, 8.15771484375, 8.5697021484375, 8.981689453125, 9.3936767578125, 9.8056640625, 10.2176513671875, 10.629638671875, 11.0416259765625, 11.45361328125, 11.8656005859375, 12.277587890625, 12.6895751953125, 13.1015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 2.0, 10.0, 11.0, 14.0, 25.0, 44.0, 56.0, 67.0, 99.0, 191.0, 316.0, 545.0, 950.0, 1763.0, 3325.0, 6752.0, 13948.0, 30061.0, 64612.0, 130856.0, 214789.0, 238521.0, 169889.0, 89773.0, 42824.0, 19870.0, 9321.0, 4480.0, 2391.0, 1261.0, 690.0, 428.0, 224.0, 133.0, 97.0, 74.0, 42.0, 38.0, 12.0, 13.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.935546875, -2.83154296875, -2.7275390625, -2.62353515625, -2.51953125, -2.41552734375, -2.3115234375, -2.20751953125, -2.103515625, -1.99951171875, -1.8955078125, -1.79150390625, -1.6875, -1.58349609375, -1.4794921875, -1.37548828125, -1.271484375, -1.16748046875, -1.0634765625, -0.95947265625, -0.85546875, -0.75146484375, -0.6474609375, -0.54345703125, -0.439453125, -0.33544921875, -0.2314453125, -0.12744140625, -0.0234375, 0.08056640625, 0.1845703125, 0.28857421875, 0.392578125, 0.49658203125, 0.6005859375, 0.70458984375, 0.80859375, 0.91259765625, 1.0166015625, 1.12060546875, 1.224609375, 1.32861328125, 1.4326171875, 1.53662109375, 1.640625, 1.74462890625, 1.8486328125, 1.95263671875, 2.056640625, 2.16064453125, 2.2646484375, 2.36865234375, 2.47265625, 2.57666015625, 2.6806640625, 2.78466796875, 2.888671875, 2.99267578125, 3.0966796875, 3.20068359375, 3.3046875, 3.40869140625, 3.5126953125, 3.61669921875, 3.720703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 7.0, 14.0, 9.0, 15.0, 17.0, 20.0, 21.0, 21.0, 43.0, 28.0, 26.0, 30.0, 39.0, 41.0, 40.0, 44.0, 46.0, 47.0, 39.0, 30.0, 41.0, 32.0, 30.0, 28.0, 32.0, 30.0, 39.0, 25.0, 27.0, 22.0, 16.0, 22.0, 15.0, 17.0, 12.0, 9.0, 3.0, 4.0, 2.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0], "bins": [-8.0546875, -7.83135986328125, -7.6080322265625, -7.38470458984375, -7.161376953125, -6.93804931640625, -6.7147216796875, -6.49139404296875, -6.26806640625, -6.04473876953125, -5.8214111328125, -5.59808349609375, -5.374755859375, -5.15142822265625, -4.9281005859375, -4.70477294921875, -4.4814453125, -4.25811767578125, -4.0347900390625, -3.81146240234375, -3.588134765625, -3.36480712890625, -3.1414794921875, -2.91815185546875, -2.69482421875, -2.47149658203125, -2.2481689453125, -2.02484130859375, -1.801513671875, -1.57818603515625, -1.3548583984375, -1.13153076171875, -0.908203125, -0.68487548828125, -0.4615478515625, -0.23822021484375, -0.014892578125, 0.20843505859375, 0.4317626953125, 0.65509033203125, 0.87841796875, 1.10174560546875, 1.3250732421875, 1.54840087890625, 1.771728515625, 1.99505615234375, 2.2183837890625, 2.44171142578125, 2.6650390625, 2.88836669921875, 3.1116943359375, 3.33502197265625, 3.558349609375, 3.78167724609375, 4.0050048828125, 4.22833251953125, 4.45166015625, 4.67498779296875, 4.8983154296875, 5.12164306640625, 5.344970703125, 5.56829833984375, 5.7916259765625, 6.01495361328125, 6.23828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 7.0, 9.0, 4.0, 7.0, 15.0, 21.0, 32.0, 35.0, 46.0, 47.0, 86.0, 110.0, 169.0, 237.0, 321.0, 481.0, 730.0, 1405.0, 3134.0, 11671.0, 69903.0, 418915.0, 443487.0, 77857.0, 12749.0, 3266.0, 1432.0, 775.0, 468.0, 330.0, 220.0, 182.0, 97.0, 75.0, 58.0, 52.0, 32.0, 24.0, 18.0, 9.0, 13.0, 4.0, 7.0, 4.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.193359375, -2.1307373046875, -2.068115234375, -2.0054931640625, -1.94287109375, -1.8802490234375, -1.817626953125, -1.7550048828125, -1.6923828125, -1.6297607421875, -1.567138671875, -1.5045166015625, -1.44189453125, -1.3792724609375, -1.316650390625, -1.2540283203125, -1.19140625, -1.1287841796875, -1.066162109375, -1.0035400390625, -0.94091796875, -0.8782958984375, -0.815673828125, -0.7530517578125, -0.6904296875, -0.6278076171875, -0.565185546875, -0.5025634765625, -0.43994140625, -0.3773193359375, -0.314697265625, -0.2520751953125, -0.189453125, -0.1268310546875, -0.064208984375, -0.0015869140625, 0.06103515625, 0.1236572265625, 0.186279296875, 0.2489013671875, 0.3115234375, 0.3741455078125, 0.436767578125, 0.4993896484375, 0.56201171875, 0.6246337890625, 0.687255859375, 0.7498779296875, 0.8125, 0.8751220703125, 0.937744140625, 1.0003662109375, 1.06298828125, 1.1256103515625, 1.188232421875, 1.2508544921875, 1.3134765625, 1.3760986328125, 1.438720703125, 1.5013427734375, 1.56396484375, 1.6265869140625, 1.689208984375, 1.7518310546875, 1.814453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 15.0, 17.0, 34.0, 40.0, 48.0, 51.0, 62.0, 85.0, 103.0, 66.0, 81.0, 73.0, 60.0, 60.0, 41.0, 37.0, 25.0, 27.0, 10.0, 12.0, 5.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16312026977539e-05, -5.952548235654831e-05, -5.741976201534271e-05, -5.5314041674137115e-05, -5.320832133293152e-05, -5.110260099172592e-05, -4.8996880650520325e-05, -4.689116030931473e-05, -4.478543996810913e-05, -4.2679719626903534e-05, -4.057399928569794e-05, -3.846827894449234e-05, -3.636255860328674e-05, -3.4256838262081146e-05, -3.215111792087555e-05, -3.0045397579669952e-05, -2.7939677238464355e-05, -2.583395689725876e-05, -2.372823655605316e-05, -2.1622516214847565e-05, -1.9516795873641968e-05, -1.741107553243637e-05, -1.5305355191230774e-05, -1.3199634850025177e-05, -1.109391450881958e-05, -8.988194167613983e-06, -6.882473826408386e-06, -4.776753485202789e-06, -2.6710331439971924e-06, -5.653128027915955e-07, 1.5404075384140015e-06, 3.6461278796195984e-06, 5.751848220825195e-06, 7.857568562030792e-06, 9.96328890323639e-06, 1.2069009244441986e-05, 1.4174729585647583e-05, 1.628044992685318e-05, 1.8386170268058777e-05, 2.0491890609264374e-05, 2.259761095046997e-05, 2.4703331291675568e-05, 2.6809051632881165e-05, 2.891477197408676e-05, 3.102049231529236e-05, 3.3126212656497955e-05, 3.523193299770355e-05, 3.733765333890915e-05, 3.9443373680114746e-05, 4.154909402132034e-05, 4.365481436252594e-05, 4.576053470373154e-05, 4.7866255044937134e-05, 4.997197538614273e-05, 5.207769572734833e-05, 5.4183416068553925e-05, 5.628913640975952e-05, 5.839485675096512e-05, 6.0500577092170715e-05, 6.260629743337631e-05, 6.471201777458191e-05, 6.68177381157875e-05, 6.89234584569931e-05, 7.10291787981987e-05, 7.31348991394043e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 8.0, 19.0, 15.0, 25.0, 34.0, 46.0, 80.0, 130.0, 161.0, 212.0, 338.0, 576.0, 1062.0, 1889.0, 3836.0, 8716.0, 20746.0, 50000.0, 119888.0, 237176.0, 284162.0, 179582.0, 80624.0, 33149.0, 13841.0, 5909.0, 2792.0, 1419.0, 778.0, 461.0, 263.0, 188.0, 133.0, 89.0, 66.0, 42.0, 25.0, 19.0, 17.0, 8.0, 9.0, 4.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2978515625, -1.25762939453125, -1.2174072265625, -1.17718505859375, -1.136962890625, -1.09674072265625, -1.0565185546875, -1.01629638671875, -0.97607421875, -0.93585205078125, -0.8956298828125, -0.85540771484375, -0.815185546875, -0.77496337890625, -0.7347412109375, -0.69451904296875, -0.654296875, -0.61407470703125, -0.5738525390625, -0.53363037109375, -0.493408203125, -0.45318603515625, -0.4129638671875, -0.37274169921875, -0.33251953125, -0.29229736328125, -0.2520751953125, -0.21185302734375, -0.171630859375, -0.13140869140625, -0.0911865234375, -0.05096435546875, -0.0107421875, 0.02947998046875, 0.0697021484375, 0.10992431640625, 0.150146484375, 0.19036865234375, 0.2305908203125, 0.27081298828125, 0.31103515625, 0.35125732421875, 0.3914794921875, 0.43170166015625, 0.471923828125, 0.51214599609375, 0.5523681640625, 0.59259033203125, 0.6328125, 0.67303466796875, 0.7132568359375, 0.75347900390625, 0.793701171875, 0.83392333984375, 0.8741455078125, 0.91436767578125, 0.95458984375, 0.99481201171875, 1.0350341796875, 1.07525634765625, 1.115478515625, 1.15570068359375, 1.1959228515625, 1.23614501953125, 1.2763671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 15.0, 17.0, 29.0, 31.0, 52.0, 63.0, 71.0, 101.0, 95.0, 117.0, 98.0, 82.0, 70.0, 48.0, 30.0, 24.0, 15.0, 8.0, 9.0, 7.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6154937744140625, -0.596221923828125, -0.5769500732421875, -0.55767822265625, -0.5384063720703125, -0.519134521484375, -0.4998626708984375, -0.4805908203125, -0.4613189697265625, -0.442047119140625, -0.4227752685546875, -0.40350341796875, -0.3842315673828125, -0.364959716796875, -0.3456878662109375, -0.326416015625, -0.3071441650390625, -0.287872314453125, -0.2686004638671875, -0.24932861328125, -0.2300567626953125, -0.210784912109375, -0.1915130615234375, -0.1722412109375, -0.1529693603515625, -0.133697509765625, -0.1144256591796875, -0.09515380859375, -0.0758819580078125, -0.056610107421875, -0.0373382568359375, -0.01806640625, 0.0012054443359375, 0.020477294921875, 0.0397491455078125, 0.05902099609375, 0.0782928466796875, 0.097564697265625, 0.1168365478515625, 0.1361083984375, 0.1553802490234375, 0.174652099609375, 0.1939239501953125, 0.21319580078125, 0.2324676513671875, 0.251739501953125, 0.2710113525390625, 0.290283203125, 0.3095550537109375, 0.328826904296875, 0.3480987548828125, 0.36737060546875, 0.3866424560546875, 0.405914306640625, 0.4251861572265625, 0.4444580078125, 0.4637298583984375, 0.483001708984375, 0.5022735595703125, 0.52154541015625, 0.5408172607421875, 0.560089111328125, 0.5793609619140625, 0.5986328125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 10.0, 5.0, 2.0, 8.0, 13.0, 9.0, 10.0, 17.0, 12.0, 19.0, 29.0, 26.0, 33.0, 30.0, 48.0, 41.0, 37.0, 46.0, 41.0, 55.0, 47.0, 60.0, 40.0, 43.0, 38.0, 48.0, 30.0, 27.0, 28.0, 29.0, 25.0, 23.0, 22.0, 12.0, 5.0, 8.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.342551231384277, -8.045703887939453, -7.748857498168945, -7.452010631561279, -7.155163764953613, -6.858316898345947, -6.561470031738281, -6.264623165130615, -5.967776298522949, -5.670929431915283, -5.374082565307617, -5.077235698699951, -4.780388832092285, -4.483541965484619, -4.186695098876953, -3.889848232269287, -3.593001365661621, -3.296154499053955, -2.999307632446289, -2.702460765838623, -2.405613899230957, -2.108767032623291, -1.811920166015625, -1.515073299407959, -1.218226432800293, -0.921379566192627, -0.6245326995849609, -0.3276858329772949, -0.030838966369628906, 0.2660079002380371, 0.5628547668457031, 0.8597016334533691, 1.1565475463867188, 1.4533944129943848, 1.7502412796020508, 2.047088146209717, 2.343935012817383, 2.640781879425049, 2.937628746032715, 3.234475612640381, 3.531322479248047, 3.828169345855713, 4.125016212463379, 4.421863079071045, 4.718709945678711, 5.015556812286377, 5.312403678894043, 5.609250545501709, 5.906097412109375, 6.202944278717041, 6.499791145324707, 6.796638011932373, 7.093484878540039, 7.390331745147705, 7.687178611755371, 7.984025478363037, 8.280872344970703, 8.577718734741211, 8.874566078186035, 9.17141342163086, 9.468259811401367, 9.765106201171875, 10.0619535446167, 10.358800888061523, 10.655647277832031]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 1.0, 7.0, 4.0, 6.0, 12.0, 7.0, 17.0, 19.0, 22.0, 26.0, 23.0, 22.0, 31.0, 33.0, 42.0, 29.0, 36.0, 42.0, 38.0, 55.0, 42.0, 48.0, 39.0, 52.0, 33.0, 31.0, 43.0, 27.0, 36.0, 26.0, 31.0, 22.0, 14.0, 23.0, 9.0, 15.0, 13.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.096552848815918, -10.721324920654297, -10.34609603881836, -9.970868110656738, -9.595640182495117, -9.22041130065918, -8.845183372497559, -8.469955444335938, -8.0947265625, -7.719498157501221, -7.344269752502441, -6.96904182434082, -6.593813419342041, -6.218585014343262, -5.843357086181641, -5.468128681182861, -5.092900276184082, -4.717671871185303, -4.342443466186523, -3.9672155380249023, -3.591987133026123, -3.2167587280273438, -2.8415305614471436, -2.4663023948669434, -2.091073989868164, -1.7158457040786743, -1.3406174182891846, -0.9653891324996948, -0.5901608467102051, -0.21493256092071533, 0.16029572486877441, 0.5355238914489746, 0.9107522964477539, 1.2859805822372437, 1.6612088680267334, 2.0364370346069336, 2.411665439605713, 2.786893844604492, 3.1621220111846924, 3.5373501777648926, 3.912578582763672, 4.287806987762451, 4.6630353927612305, 5.038263320922852, 5.413491725921631, 5.78872013092041, 6.163948059082031, 6.5391764640808105, 6.91440486907959, 7.289633274078369, 7.664861679077148, 8.04008960723877, 8.41531753540039, 8.790546417236328, 9.16577434539795, 9.54100227355957, 9.916231155395508, 10.291459083557129, 10.666687965393066, 11.041915893554688, 11.417144775390625, 11.792372703552246, 12.167600631713867, 12.542829513549805, 12.918057441711426]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 18.0, 17.0, 33.0, 57.0, 106.0, 130.0, 243.0, 409.0, 689.0, 1087.0, 1864.0, 2869.0, 4654.0, 7140.0, 11019.0, 16846.0, 24688.0, 34758.0, 47658.0, 61375.0, 76558.0, 88965.0, 97742.0, 101265.0, 97401.0, 88160.0, 74338.0, 60149.0, 45556.0, 33259.0, 23828.0, 16335.0, 10625.0, 7086.0, 4453.0, 2755.0, 1654.0, 1050.0, 686.0, 402.0, 235.0, 135.0, 93.0, 58.0, 42.0, 17.0, 18.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-5.31640625, -5.157470703125, -4.99853515625, -4.839599609375, -4.6806640625, -4.521728515625, -4.36279296875, -4.203857421875, -4.044921875, -3.885986328125, -3.72705078125, -3.568115234375, -3.4091796875, -3.250244140625, -3.09130859375, -2.932373046875, -2.7734375, -2.614501953125, -2.45556640625, -2.296630859375, -2.1376953125, -1.978759765625, -1.81982421875, -1.660888671875, -1.501953125, -1.343017578125, -1.18408203125, -1.025146484375, -0.8662109375, -0.707275390625, -0.54833984375, -0.389404296875, -0.23046875, -0.071533203125, 0.08740234375, 0.246337890625, 0.4052734375, 0.564208984375, 0.72314453125, 0.882080078125, 1.041015625, 1.199951171875, 1.35888671875, 1.517822265625, 1.6767578125, 1.835693359375, 1.99462890625, 2.153564453125, 2.3125, 2.471435546875, 2.63037109375, 2.789306640625, 2.9482421875, 3.107177734375, 3.26611328125, 3.425048828125, 3.583984375, 3.742919921875, 3.90185546875, 4.060791015625, 4.2197265625, 4.378662109375, 4.53759765625, 4.696533203125, 4.85546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 4.0, 10.0, 5.0, 7.0, 13.0, 14.0, 14.0, 22.0, 23.0, 26.0, 33.0, 29.0, 30.0, 32.0, 28.0, 38.0, 34.0, 49.0, 36.0, 47.0, 46.0, 39.0, 53.0, 45.0, 33.0, 34.0, 25.0, 36.0, 25.0, 22.0, 23.0, 25.0, 20.0, 13.0, 9.0, 13.0, 9.0, 5.0, 5.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.6309814453125, -10.269775390625, -9.9085693359375, -9.54736328125, -9.1861572265625, -8.824951171875, -8.4637451171875, -8.1025390625, -7.7413330078125, -7.380126953125, -7.0189208984375, -6.65771484375, -6.2965087890625, -5.935302734375, -5.5740966796875, -5.212890625, -4.8516845703125, -4.490478515625, -4.1292724609375, -3.76806640625, -3.4068603515625, -3.045654296875, -2.6844482421875, -2.3232421875, -1.9620361328125, -1.600830078125, -1.2396240234375, -0.87841796875, -0.5172119140625, -0.156005859375, 0.2052001953125, 0.56640625, 0.9276123046875, 1.288818359375, 1.6500244140625, 2.01123046875, 2.3724365234375, 2.733642578125, 3.0948486328125, 3.4560546875, 3.8172607421875, 4.178466796875, 4.5396728515625, 4.90087890625, 5.2620849609375, 5.623291015625, 5.9844970703125, 6.345703125, 6.7069091796875, 7.068115234375, 7.4293212890625, 7.79052734375, 8.1517333984375, 8.512939453125, 8.8741455078125, 9.2353515625, 9.5965576171875, 9.957763671875, 10.3189697265625, 10.68017578125, 11.0413818359375, 11.402587890625, 11.7637939453125, 12.125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 12.0, 15.0, 23.0, 41.0, 68.0, 134.0, 213.0, 381.0, 622.0, 1120.0, 1719.0, 2651.0, 4335.0, 7031.0, 10926.0, 16758.0, 25170.0, 36215.0, 50102.0, 66164.0, 82182.0, 96103.0, 104882.0, 106286.0, 99668.0, 87481.0, 71629.0, 54673.0, 40332.0, 28313.0, 19321.0, 12610.0, 8089.0, 5187.0, 3145.0, 1977.0, 1176.0, 718.0, 439.0, 274.0, 160.0, 114.0, 45.0, 18.0, 16.0, 7.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.1875, -5.0155029296875, -4.843505859375, -4.6715087890625, -4.49951171875, -4.3275146484375, -4.155517578125, -3.9835205078125, -3.8115234375, -3.6395263671875, -3.467529296875, -3.2955322265625, -3.12353515625, -2.9515380859375, -2.779541015625, -2.6075439453125, -2.435546875, -2.2635498046875, -2.091552734375, -1.9195556640625, -1.74755859375, -1.5755615234375, -1.403564453125, -1.2315673828125, -1.0595703125, -0.8875732421875, -0.715576171875, -0.5435791015625, -0.37158203125, -0.1995849609375, -0.027587890625, 0.1444091796875, 0.31640625, 0.4884033203125, 0.660400390625, 0.8323974609375, 1.00439453125, 1.1763916015625, 1.348388671875, 1.5203857421875, 1.6923828125, 1.8643798828125, 2.036376953125, 2.2083740234375, 2.38037109375, 2.5523681640625, 2.724365234375, 2.8963623046875, 3.068359375, 3.2403564453125, 3.412353515625, 3.5843505859375, 3.75634765625, 3.9283447265625, 4.100341796875, 4.2723388671875, 4.4443359375, 4.6163330078125, 4.788330078125, 4.9603271484375, 5.13232421875, 5.3043212890625, 5.476318359375, 5.6483154296875, 5.8203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 11.0, 3.0, 15.0, 9.0, 19.0, 19.0, 20.0, 34.0, 33.0, 37.0, 32.0, 36.0, 37.0, 33.0, 36.0, 47.0, 37.0, 40.0, 48.0, 33.0, 48.0, 37.0, 32.0, 42.0, 34.0, 31.0, 32.0, 31.0, 20.0, 17.0, 15.0, 11.0, 19.0, 11.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.484375, -8.24700927734375, -8.0096435546875, -7.77227783203125, -7.534912109375, -7.29754638671875, -7.0601806640625, -6.82281494140625, -6.58544921875, -6.34808349609375, -6.1107177734375, -5.87335205078125, -5.635986328125, -5.39862060546875, -5.1612548828125, -4.92388916015625, -4.6865234375, -4.44915771484375, -4.2117919921875, -3.97442626953125, -3.737060546875, -3.49969482421875, -3.2623291015625, -3.02496337890625, -2.78759765625, -2.55023193359375, -2.3128662109375, -2.07550048828125, -1.838134765625, -1.60076904296875, -1.3634033203125, -1.12603759765625, -0.888671875, -0.65130615234375, -0.4139404296875, -0.17657470703125, 0.060791015625, 0.29815673828125, 0.5355224609375, 0.77288818359375, 1.01025390625, 1.24761962890625, 1.4849853515625, 1.72235107421875, 1.959716796875, 2.19708251953125, 2.4344482421875, 2.67181396484375, 2.9091796875, 3.14654541015625, 3.3839111328125, 3.62127685546875, 3.858642578125, 4.09600830078125, 4.3333740234375, 4.57073974609375, 4.80810546875, 5.04547119140625, 5.2828369140625, 5.52020263671875, 5.757568359375, 5.99493408203125, 6.2322998046875, 6.46966552734375, 6.70703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 16.0, 20.0, 32.0, 47.0, 79.0, 136.0, 166.0, 309.0, 489.0, 757.0, 1194.0, 1880.0, 3069.0, 4739.0, 7285.0, 11132.0, 16495.0, 24347.0, 34176.0, 46675.0, 61061.0, 75226.0, 88290.0, 96779.0, 100432.0, 97168.0, 87741.0, 74841.0, 60814.0, 46917.0, 34137.0, 24439.0, 16632.0, 11005.0, 7364.0, 4582.0, 2991.0, 1850.0, 1211.0, 755.0, 419.0, 283.0, 208.0, 138.0, 92.0, 49.0, 29.0, 18.0, 11.0, 14.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.703125, -1.64727783203125, -1.5914306640625, -1.53558349609375, -1.479736328125, -1.42388916015625, -1.3680419921875, -1.31219482421875, -1.25634765625, -1.20050048828125, -1.1446533203125, -1.08880615234375, -1.032958984375, -0.97711181640625, -0.9212646484375, -0.86541748046875, -0.8095703125, -0.75372314453125, -0.6978759765625, -0.64202880859375, -0.586181640625, -0.53033447265625, -0.4744873046875, -0.41864013671875, -0.36279296875, -0.30694580078125, -0.2510986328125, -0.19525146484375, -0.139404296875, -0.08355712890625, -0.0277099609375, 0.02813720703125, 0.083984375, 0.13983154296875, 0.1956787109375, 0.25152587890625, 0.307373046875, 0.36322021484375, 0.4190673828125, 0.47491455078125, 0.53076171875, 0.58660888671875, 0.6424560546875, 0.69830322265625, 0.754150390625, 0.80999755859375, 0.8658447265625, 0.92169189453125, 0.9775390625, 1.03338623046875, 1.0892333984375, 1.14508056640625, 1.200927734375, 1.25677490234375, 1.3126220703125, 1.36846923828125, 1.42431640625, 1.48016357421875, 1.5360107421875, 1.59185791015625, 1.647705078125, 1.70355224609375, 1.7593994140625, 1.81524658203125, 1.87109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 3.0, 9.0, 15.0, 13.0, 20.0, 20.0, 16.0, 14.0, 29.0, 20.0, 34.0, 35.0, 32.0, 41.0, 40.0, 25.0, 50.0, 53.0, 42.0, 57.0, 42.0, 46.0, 32.0, 41.0, 34.0, 35.0, 32.0, 24.0, 20.0, 17.0, 17.0, 9.0, 15.0, 11.0, 10.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.00023555755615234375, -0.00022867321968078613, -0.00022178888320922852, -0.0002149045467376709, -0.00020802021026611328, -0.00020113587379455566, -0.00019425153732299805, -0.00018736720085144043, -0.0001804828643798828, -0.0001735985279083252, -0.00016671419143676758, -0.00015982985496520996, -0.00015294551849365234, -0.00014606118202209473, -0.0001391768455505371, -0.0001322925090789795, -0.00012540817260742188, -0.00011852383613586426, -0.00011163949966430664, -0.00010475516319274902, -9.78708267211914e-05, -9.098649024963379e-05, -8.410215377807617e-05, -7.721781730651855e-05, -7.033348083496094e-05, -6.344914436340332e-05, -5.65648078918457e-05, -4.9680471420288086e-05, -4.279613494873047e-05, -3.591179847717285e-05, -2.9027462005615234e-05, -2.2143125534057617e-05, -1.52587890625e-05, -8.374452590942383e-06, -1.4901161193847656e-06, 5.3942203521728516e-06, 1.2278556823730469e-05, 1.9162893295288086e-05, 2.6047229766845703e-05, 3.293156623840332e-05, 3.981590270996094e-05, 4.6700239181518555e-05, 5.358457565307617e-05, 6.046891212463379e-05, 6.73532485961914e-05, 7.423758506774902e-05, 8.112192153930664e-05, 8.800625801086426e-05, 9.489059448242188e-05, 0.00010177493095397949, 0.00010865926742553711, 0.00011554360389709473, 0.00012242794036865234, 0.00012931227684020996, 0.00013619661331176758, 0.0001430809497833252, 0.0001499652862548828, 0.00015684962272644043, 0.00016373395919799805, 0.00017061829566955566, 0.00017750263214111328, 0.0001843869686126709, 0.00019127130508422852, 0.00019815564155578613, 0.00020503997802734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 11.0, 26.0, 33.0, 63.0, 97.0, 146.0, 281.0, 406.0, 735.0, 1117.0, 1844.0, 2989.0, 4708.0, 7442.0, 11628.0, 17599.0, 26034.0, 37455.0, 51820.0, 68242.0, 83842.0, 97644.0, 105986.0, 105758.0, 98982.0, 85328.0, 69543.0, 52972.0, 38547.0, 26991.0, 18066.0, 11880.0, 7680.0, 4832.0, 2970.0, 1926.0, 1137.0, 695.0, 414.0, 254.0, 179.0, 85.0, 71.0, 52.0, 22.0, 12.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1328125, -2.0682525634765625, -2.003692626953125, -1.9391326904296875, -1.87457275390625, -1.8100128173828125, -1.745452880859375, -1.6808929443359375, -1.6163330078125, -1.5517730712890625, -1.487213134765625, -1.4226531982421875, -1.35809326171875, -1.2935333251953125, -1.228973388671875, -1.1644134521484375, -1.099853515625, -1.0352935791015625, -0.970733642578125, -0.9061737060546875, -0.84161376953125, -0.7770538330078125, -0.712493896484375, -0.6479339599609375, -0.5833740234375, -0.5188140869140625, -0.454254150390625, -0.3896942138671875, -0.32513427734375, -0.2605743408203125, -0.196014404296875, -0.1314544677734375, -0.06689453125, -0.0023345947265625, 0.062225341796875, 0.1267852783203125, 0.19134521484375, 0.2559051513671875, 0.320465087890625, 0.3850250244140625, 0.4495849609375, 0.5141448974609375, 0.578704833984375, 0.6432647705078125, 0.70782470703125, 0.7723846435546875, 0.836944580078125, 0.9015045166015625, 0.966064453125, 1.0306243896484375, 1.095184326171875, 1.1597442626953125, 1.22430419921875, 1.2888641357421875, 1.353424072265625, 1.4179840087890625, 1.4825439453125, 1.5471038818359375, 1.611663818359375, 1.6762237548828125, 1.74078369140625, 1.8053436279296875, 1.869903564453125, 1.9344635009765625, 1.9990234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 8.0, 6.0, 13.0, 7.0, 13.0, 21.0, 16.0, 27.0, 30.0, 29.0, 38.0, 35.0, 44.0, 45.0, 59.0, 53.0, 43.0, 44.0, 42.0, 39.0, 43.0, 44.0, 34.0, 33.0, 39.0, 21.0, 22.0, 20.0, 15.0, 15.0, 14.0, 8.0, 15.0, 7.0, 6.0, 9.0, 2.0, 7.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.966796875, -0.9356842041015625, -0.904571533203125, -0.8734588623046875, -0.84234619140625, -0.8112335205078125, -0.780120849609375, -0.7490081787109375, -0.7178955078125, -0.6867828369140625, -0.655670166015625, -0.6245574951171875, -0.59344482421875, -0.5623321533203125, -0.531219482421875, -0.5001068115234375, -0.468994140625, -0.4378814697265625, -0.406768798828125, -0.3756561279296875, -0.34454345703125, -0.3134307861328125, -0.282318115234375, -0.2512054443359375, -0.2200927734375, -0.1889801025390625, -0.157867431640625, -0.1267547607421875, -0.09564208984375, -0.0645294189453125, -0.033416748046875, -0.0023040771484375, 0.02880859375, 0.0599212646484375, 0.091033935546875, 0.1221466064453125, 0.15325927734375, 0.1843719482421875, 0.215484619140625, 0.2465972900390625, 0.2777099609375, 0.3088226318359375, 0.339935302734375, 0.3710479736328125, 0.40216064453125, 0.4332733154296875, 0.464385986328125, 0.4954986572265625, 0.526611328125, 0.5577239990234375, 0.588836669921875, 0.6199493408203125, 0.65106201171875, 0.6821746826171875, 0.713287353515625, 0.7444000244140625, 0.7755126953125, 0.8066253662109375, 0.837738037109375, 0.8688507080078125, 0.89996337890625, 0.9310760498046875, 0.962188720703125, 0.9933013916015625, 1.0244140625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 3.0, 3.0, 10.0, 16.0, 16.0, 14.0, 16.0, 24.0, 22.0, 26.0, 34.0, 33.0, 44.0, 47.0, 39.0, 50.0, 48.0, 56.0, 47.0, 53.0, 50.0, 37.0, 28.0, 45.0, 38.0, 31.0, 30.0, 24.0, 24.0, 18.0, 16.0, 8.0, 10.0, 7.0, 4.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.468103408813477, -8.16162109375, -7.855138778686523, -7.548655986785889, -7.242173671722412, -6.9356913566589355, -6.629208564758301, -6.322726249694824, -6.016243934631348, -5.709761619567871, -5.4032793045043945, -5.09679651260376, -4.790314197540283, -4.483831882476807, -4.177349090576172, -3.8708667755126953, -3.5643844604492188, -3.257902145385742, -2.9514195919036865, -2.644937038421631, -2.3384547233581543, -2.0319724082946777, -1.725489854812622, -1.4190073013305664, -1.1125249862670898, -0.8060425519943237, -0.4995601177215576, -0.1930776834487915, 0.11340475082397461, 0.4198871850967407, 0.7263696193695068, 1.0328521728515625, 1.3393335342407227, 1.6458159685134888, 1.9522984027862549, 2.2587809562683105, 2.565263271331787, 2.8717455863952637, 3.1782281398773193, 3.484710693359375, 3.7911930084228516, 4.097675323486328, 4.404157638549805, 4.7106404304504395, 5.017122745513916, 5.323605060577393, 5.630087852478027, 5.936570167541504, 6.2430524826049805, 6.549534797668457, 6.856017112731934, 7.162499904632568, 7.468982219696045, 7.7754645347595215, 8.081947326660156, 8.388429641723633, 8.69491195678711, 9.001394271850586, 9.307876586914062, 9.614358901977539, 9.920841217041016, 10.227324485778809, 10.533806800842285, 10.840289115905762, 11.146771430969238]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 8.0, 4.0, 5.0, 9.0, 6.0, 13.0, 11.0, 16.0, 21.0, 22.0, 26.0, 22.0, 15.0, 25.0, 33.0, 24.0, 48.0, 36.0, 38.0, 42.0, 39.0, 41.0, 44.0, 30.0, 36.0, 25.0, 38.0, 38.0, 34.0, 28.0, 29.0, 32.0, 24.0, 27.0, 15.0, 21.0, 17.0, 18.0, 5.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-12.381056785583496, -12.007100105285645, -11.633143424987793, -11.259186744689941, -10.885229110717773, -10.511272430419922, -10.13731575012207, -9.763359069824219, -9.389402389526367, -9.015445709228516, -8.641489028930664, -8.267532348632812, -7.893575191497803, -7.519618511199951, -7.145661354064941, -6.77170467376709, -6.397747993469238, -6.023791313171387, -5.649834632873535, -5.275877475738525, -4.901920795440674, -4.527964115142822, -4.1540069580078125, -3.780050277709961, -3.4060935974121094, -3.032136917114258, -2.658179998397827, -2.2842230796813965, -1.910266399383545, -1.5363095998764038, -1.1623528003692627, -0.788395881652832, -0.41443824768066406, -0.04048144817352295, 0.33347535133361816, 0.7074321508407593, 1.0813889503479004, 1.4553457498550415, 1.8293025493621826, 2.2032594680786133, 2.577216148376465, 2.9511728286743164, 3.325129747390747, 3.6990866661071777, 4.073043346405029, 4.447000026702881, 4.820957183837891, 5.194913864135742, 5.568870544433594, 5.942827224731445, 6.316783905029297, 6.690741062164307, 7.064697742462158, 7.43865442276001, 7.8126115798950195, 8.186568260192871, 8.560524940490723, 8.934481620788574, 9.308438301086426, 9.682394981384277, 10.056352615356445, 10.430309295654297, 10.804265975952148, 11.17822265625, 11.552179336547852]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 8.0, 15.0, 25.0, 42.0, 78.0, 119.0, 232.0, 375.0, 649.0, 1126.0, 1799.0, 2926.0, 4761.0, 7958.0, 12844.0, 19646.0, 30764.0, 47324.0, 69809.0, 101899.0, 144192.0, 193412.0, 251207.0, 308679.0, 360544.0, 393790.0, 403929.0, 387131.0, 347753.0, 294071.0, 235395.0, 177961.0, 129884.0, 91060.0, 61392.0, 40916.0, 26244.0, 16926.0, 10550.0, 6621.0, 3982.0, 2455.0, 1526.0, 840.0, 533.0, 363.0, 209.0, 127.0, 74.0, 49.0, 33.0, 26.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.35382080078125, -6.1373291015625, -5.92083740234375, -5.704345703125, -5.48785400390625, -5.2713623046875, -5.05487060546875, -4.83837890625, -4.62188720703125, -4.4053955078125, -4.18890380859375, -3.972412109375, -3.75592041015625, -3.5394287109375, -3.32293701171875, -3.1064453125, -2.88995361328125, -2.6734619140625, -2.45697021484375, -2.240478515625, -2.02398681640625, -1.8074951171875, -1.59100341796875, -1.37451171875, -1.15802001953125, -0.9415283203125, -0.72503662109375, -0.508544921875, -0.29205322265625, -0.0755615234375, 0.14093017578125, 0.357421875, 0.57391357421875, 0.7904052734375, 1.00689697265625, 1.223388671875, 1.43988037109375, 1.6563720703125, 1.87286376953125, 2.08935546875, 2.30584716796875, 2.5223388671875, 2.73883056640625, 2.955322265625, 3.17181396484375, 3.3883056640625, 3.60479736328125, 3.8212890625, 4.03778076171875, 4.2542724609375, 4.47076416015625, 4.687255859375, 4.90374755859375, 5.1202392578125, 5.33673095703125, 5.55322265625, 5.76971435546875, 5.9862060546875, 6.20269775390625, 6.419189453125, 6.63568115234375, 6.8521728515625, 7.06866455078125, 7.28515625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 13.0, 10.0, 16.0, 19.0, 21.0, 28.0, 26.0, 24.0, 21.0, 32.0, 42.0, 54.0, 36.0, 45.0, 35.0, 37.0, 42.0, 38.0, 43.0, 39.0, 44.0, 31.0, 27.0, 40.0, 30.0, 20.0, 27.0, 30.0, 22.0, 19.0, 13.0, 13.0, 6.0, 9.0, 9.0, 0.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.9921875, -11.640625, -11.2890625, -10.9375, -10.5859375, -10.234375, -9.8828125, -9.53125, -9.1796875, -8.828125, -8.4765625, -8.125, -7.7734375, -7.421875, -7.0703125, -6.71875, -6.3671875, -6.015625, -5.6640625, -5.3125, -4.9609375, -4.609375, -4.2578125, -3.90625, -3.5546875, -3.203125, -2.8515625, -2.5, -2.1484375, -1.796875, -1.4453125, -1.09375, -0.7421875, -0.390625, -0.0390625, 0.3125, 0.6640625, 1.015625, 1.3671875, 1.71875, 2.0703125, 2.421875, 2.7734375, 3.125, 3.4765625, 3.828125, 4.1796875, 4.53125, 4.8828125, 5.234375, 5.5859375, 5.9375, 6.2890625, 6.640625, 6.9921875, 7.34375, 7.6953125, 8.046875, 8.3984375, 8.75, 9.1015625, 9.453125, 9.8046875, 10.15625, 10.5078125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 6.0, 9.0, 15.0, 21.0, 43.0, 69.0, 102.0, 178.0, 292.0, 494.0, 844.0, 1460.0, 2423.0, 4026.0, 6689.0, 11202.0, 17971.0, 28023.0, 43962.0, 65940.0, 95251.0, 133139.0, 177944.0, 230321.0, 282983.0, 329803.0, 366102.0, 382298.0, 375772.0, 351476.0, 310270.0, 259854.0, 207990.0, 158328.0, 115700.0, 81390.0, 55199.0, 36316.0, 23126.0, 14632.0, 9049.0, 5459.0, 3380.0, 1909.0, 1152.0, 711.0, 395.0, 245.0, 143.0, 90.0, 39.0, 23.0, 13.0, 13.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.1640625, -6.93865966796875, -6.7132568359375, -6.48785400390625, -6.262451171875, -6.03704833984375, -5.8116455078125, -5.58624267578125, -5.36083984375, -5.13543701171875, -4.9100341796875, -4.68463134765625, -4.459228515625, -4.23382568359375, -4.0084228515625, -3.78302001953125, -3.5576171875, -3.33221435546875, -3.1068115234375, -2.88140869140625, -2.656005859375, -2.43060302734375, -2.2052001953125, -1.97979736328125, -1.75439453125, -1.52899169921875, -1.3035888671875, -1.07818603515625, -0.852783203125, -0.62738037109375, -0.4019775390625, -0.17657470703125, 0.048828125, 0.27423095703125, 0.4996337890625, 0.72503662109375, 0.950439453125, 1.17584228515625, 1.4012451171875, 1.62664794921875, 1.85205078125, 2.07745361328125, 2.3028564453125, 2.52825927734375, 2.753662109375, 2.97906494140625, 3.2044677734375, 3.42987060546875, 3.6552734375, 3.88067626953125, 4.1060791015625, 4.33148193359375, 4.556884765625, 4.78228759765625, 5.0076904296875, 5.23309326171875, 5.45849609375, 5.68389892578125, 5.9093017578125, 6.13470458984375, 6.360107421875, 6.58551025390625, 6.8109130859375, 7.03631591796875, 7.26171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 25.0, 27.0, 50.0, 52.0, 91.0, 88.0, 132.0, 136.0, 159.0, 161.0, 199.0, 223.0, 226.0, 243.0, 246.0, 232.0, 236.0, 253.0, 214.0, 219.0, 167.0, 134.0, 109.0, 101.0, 75.0, 71.0, 49.0, 37.0, 33.0, 18.0, 16.0, 8.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.8892822265625, -5.696533203125, -5.5037841796875, -5.31103515625, -5.1182861328125, -4.925537109375, -4.7327880859375, -4.5400390625, -4.3472900390625, -4.154541015625, -3.9617919921875, -3.76904296875, -3.5762939453125, -3.383544921875, -3.1907958984375, -2.998046875, -2.8052978515625, -2.612548828125, -2.4197998046875, -2.22705078125, -2.0343017578125, -1.841552734375, -1.6488037109375, -1.4560546875, -1.2633056640625, -1.070556640625, -0.8778076171875, -0.68505859375, -0.4923095703125, -0.299560546875, -0.1068115234375, 0.0859375, 0.2786865234375, 0.471435546875, 0.6641845703125, 0.85693359375, 1.0496826171875, 1.242431640625, 1.4351806640625, 1.6279296875, 1.8206787109375, 2.013427734375, 2.2061767578125, 2.39892578125, 2.5916748046875, 2.784423828125, 2.9771728515625, 3.169921875, 3.3626708984375, 3.555419921875, 3.7481689453125, 3.94091796875, 4.1336669921875, 4.326416015625, 4.5191650390625, 4.7119140625, 4.9046630859375, 5.097412109375, 5.2901611328125, 5.48291015625, 5.6756591796875, 5.868408203125, 6.0611572265625, 6.25390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 5.0, 6.0, 10.0, 15.0, 15.0, 17.0, 20.0, 25.0, 29.0, 42.0, 40.0, 42.0, 42.0, 46.0, 39.0, 52.0, 50.0, 46.0, 51.0, 33.0, 50.0, 49.0, 33.0, 36.0, 33.0, 23.0, 20.0, 24.0, 23.0, 14.0, 15.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.095524787902832, -11.7366361618042, -11.37774658203125, -11.018857955932617, -10.659968376159668, -10.301079750061035, -9.942190170288086, -9.583301544189453, -9.22441291809082, -8.865524291992188, -8.506634712219238, -8.147746086120605, -7.788856506347656, -7.429967880249023, -7.071078777313232, -6.712189674377441, -6.353300094604492, -5.994410991668701, -5.63552188873291, -5.276633262634277, -4.917743682861328, -4.558855056762695, -4.199965953826904, -3.8410768508911133, -3.4821877479553223, -3.1232986450195312, -2.7644095420837402, -2.4055206775665283, -2.0466315746307373, -1.6877424716949463, -1.3288536071777344, -0.9699645042419434, -0.6110763549804688, -0.2521873116493225, 0.10670173168182373, 0.4655907154083252, 0.8244798183441162, 1.1833689212799072, 1.5422577857971191, 1.9011468887329102, 2.260035991668701, 2.618925094604492, 2.977814197540283, 3.336703062057495, 3.695592164993286, 4.054481506347656, 4.413370132446289, 4.77225923538208, 5.131148338317871, 5.490037441253662, 5.848926544189453, 6.207815170288086, 6.566704750061035, 6.925593376159668, 7.284482479095459, 7.64337158203125, 8.002260208129883, 8.361148834228516, 8.720038414001465, 9.078927040100098, 9.437816619873047, 9.79670524597168, 10.155593872070312, 10.514483451843262, 10.873373031616211]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 6.0, 7.0, 12.0, 14.0, 23.0, 19.0, 23.0, 31.0, 21.0, 25.0, 32.0, 24.0, 31.0, 37.0, 54.0, 37.0, 40.0, 41.0, 45.0, 28.0, 45.0, 39.0, 45.0, 36.0, 26.0, 30.0, 34.0, 18.0, 22.0, 26.0, 19.0, 20.0, 21.0, 9.0, 9.0, 7.0, 7.0, 5.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.103611946105957, -13.663763046264648, -13.22391414642334, -12.784065246582031, -12.344216346740723, -11.904367446899414, -11.464519500732422, -11.024669647216797, -10.584821701049805, -10.144972801208496, -9.705123901367188, -9.265275001525879, -8.82542610168457, -8.385577201843262, -7.945728778839111, -7.505879878997803, -7.066030502319336, -6.626181602478027, -6.186332702636719, -5.74648380279541, -5.306634902954102, -4.866786003112793, -4.426937580108643, -3.987088680267334, -3.5472397804260254, -3.107390880584717, -2.667541980743408, -2.2276933193206787, -1.7878444194793701, -1.3479955196380615, -0.908146858215332, -0.46829795837402344, -0.028448104858398438, 0.4114007353782654, 0.8512495756149292, 1.2910983562469482, 1.7309472560882568, 2.1707961559295654, 2.610644817352295, 3.0504937171936035, 3.490342617034912, 3.9301915168762207, 4.370040416717529, 4.80988883972168, 5.249737739562988, 5.689586639404297, 6.1294355392456055, 6.569284439086914, 7.009133338928223, 7.448982238769531, 7.88883113861084, 8.328680038452148, 8.768528938293457, 9.208377838134766, 9.648225784301758, 10.088075637817383, 10.527923583984375, 10.967772483825684, 11.407621383666992, 11.8474702835083, 12.28731918334961, 12.727168083190918, 13.167016983032227, 13.606864929199219, 14.046714782714844]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 11.0, 23.0, 25.0, 36.0, 56.0, 76.0, 114.0, 196.0, 267.0, 433.0, 676.0, 1167.0, 1741.0, 2972.0, 4857.0, 7897.0, 13241.0, 21825.0, 35808.0, 57004.0, 84854.0, 116669.0, 142046.0, 147537.0, 129651.0, 98616.0, 67654.0, 43820.0, 27144.0, 16509.0, 9997.0, 5929.0, 3698.0, 2243.0, 1334.0, 869.0, 553.0, 361.0, 238.0, 138.0, 100.0, 50.0, 33.0, 31.0, 20.0, 15.0, 5.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.3515625, -2.28076171875, -2.2099609375, -2.13916015625, -2.068359375, -1.99755859375, -1.9267578125, -1.85595703125, -1.78515625, -1.71435546875, -1.6435546875, -1.57275390625, -1.501953125, -1.43115234375, -1.3603515625, -1.28955078125, -1.21875, -1.14794921875, -1.0771484375, -1.00634765625, -0.935546875, -0.86474609375, -0.7939453125, -0.72314453125, -0.65234375, -0.58154296875, -0.5107421875, -0.43994140625, -0.369140625, -0.29833984375, -0.2275390625, -0.15673828125, -0.0859375, -0.01513671875, 0.0556640625, 0.12646484375, 0.197265625, 0.26806640625, 0.3388671875, 0.40966796875, 0.48046875, 0.55126953125, 0.6220703125, 0.69287109375, 0.763671875, 0.83447265625, 0.9052734375, 0.97607421875, 1.046875, 1.11767578125, 1.1884765625, 1.25927734375, 1.330078125, 1.40087890625, 1.4716796875, 1.54248046875, 1.61328125, 1.68408203125, 1.7548828125, 1.82568359375, 1.896484375, 1.96728515625, 2.0380859375, 2.10888671875, 2.1796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 12.0, 8.0, 10.0, 13.0, 14.0, 17.0, 20.0, 24.0, 23.0, 24.0, 22.0, 27.0, 31.0, 29.0, 39.0, 45.0, 38.0, 50.0, 34.0, 45.0, 40.0, 40.0, 49.0, 39.0, 40.0, 37.0, 31.0, 33.0, 24.0, 17.0, 11.0, 19.0, 21.0, 18.0, 11.0, 9.0, 9.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.1103515625, -12.642578125, -12.1748046875, -11.70703125, -11.2392578125, -10.771484375, -10.3037109375, -9.8359375, -9.3681640625, -8.900390625, -8.4326171875, -7.96484375, -7.4970703125, -7.029296875, -6.5615234375, -6.09375, -5.6259765625, -5.158203125, -4.6904296875, -4.22265625, -3.7548828125, -3.287109375, -2.8193359375, -2.3515625, -1.8837890625, -1.416015625, -0.9482421875, -0.48046875, -0.0126953125, 0.455078125, 0.9228515625, 1.390625, 1.8583984375, 2.326171875, 2.7939453125, 3.26171875, 3.7294921875, 4.197265625, 4.6650390625, 5.1328125, 5.6005859375, 6.068359375, 6.5361328125, 7.00390625, 7.4716796875, 7.939453125, 8.4072265625, 8.875, 9.3427734375, 9.810546875, 10.2783203125, 10.74609375, 11.2138671875, 11.681640625, 12.1494140625, 12.6171875, 13.0849609375, 13.552734375, 14.0205078125, 14.48828125, 14.9560546875, 15.423828125, 15.8916015625, 16.359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 9.0, 17.0, 16.0, 18.0, 29.0, 52.0, 57.0, 95.0, 146.0, 259.0, 316.0, 475.0, 770.0, 1232.0, 1953.0, 3061.0, 5038.0, 8429.0, 14353.0, 24401.0, 41300.0, 68701.0, 106848.0, 147187.0, 167704.0, 153355.0, 115125.0, 75414.0, 45351.0, 26965.0, 15758.0, 9245.0, 5661.0, 3379.0, 1999.0, 1347.0, 834.0, 560.0, 350.0, 233.0, 171.0, 96.0, 76.0, 61.0, 39.0, 17.0, 11.0, 10.0, 8.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.51922607421875, -2.4368896484375, -2.35455322265625, -2.272216796875, -2.18988037109375, -2.1075439453125, -2.02520751953125, -1.94287109375, -1.86053466796875, -1.7781982421875, -1.69586181640625, -1.613525390625, -1.53118896484375, -1.4488525390625, -1.36651611328125, -1.2841796875, -1.20184326171875, -1.1195068359375, -1.03717041015625, -0.954833984375, -0.87249755859375, -0.7901611328125, -0.70782470703125, -0.62548828125, -0.54315185546875, -0.4608154296875, -0.37847900390625, -0.296142578125, -0.21380615234375, -0.1314697265625, -0.04913330078125, 0.033203125, 0.11553955078125, 0.1978759765625, 0.28021240234375, 0.362548828125, 0.44488525390625, 0.5272216796875, 0.60955810546875, 0.69189453125, 0.77423095703125, 0.8565673828125, 0.93890380859375, 1.021240234375, 1.10357666015625, 1.1859130859375, 1.26824951171875, 1.3505859375, 1.43292236328125, 1.5152587890625, 1.59759521484375, 1.679931640625, 1.76226806640625, 1.8446044921875, 1.92694091796875, 2.00927734375, 2.09161376953125, 2.1739501953125, 2.25628662109375, 2.338623046875, 2.42095947265625, 2.5032958984375, 2.58563232421875, 2.66796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 8.0, 7.0, 12.0, 16.0, 16.0, 14.0, 18.0, 25.0, 27.0, 28.0, 28.0, 26.0, 39.0, 34.0, 40.0, 34.0, 40.0, 43.0, 39.0, 34.0, 38.0, 33.0, 32.0, 33.0, 38.0, 38.0, 27.0, 27.0, 28.0, 27.0, 25.0, 21.0, 8.0, 17.0, 13.0, 10.0, 13.0, 7.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.96875, -7.708251953125, -7.44775390625, -7.187255859375, -6.9267578125, -6.666259765625, -6.40576171875, -6.145263671875, -5.884765625, -5.624267578125, -5.36376953125, -5.103271484375, -4.8427734375, -4.582275390625, -4.32177734375, -4.061279296875, -3.80078125, -3.540283203125, -3.27978515625, -3.019287109375, -2.7587890625, -2.498291015625, -2.23779296875, -1.977294921875, -1.716796875, -1.456298828125, -1.19580078125, -0.935302734375, -0.6748046875, -0.414306640625, -0.15380859375, 0.106689453125, 0.3671875, 0.627685546875, 0.88818359375, 1.148681640625, 1.4091796875, 1.669677734375, 1.93017578125, 2.190673828125, 2.451171875, 2.711669921875, 2.97216796875, 3.232666015625, 3.4931640625, 3.753662109375, 4.01416015625, 4.274658203125, 4.53515625, 4.795654296875, 5.05615234375, 5.316650390625, 5.5771484375, 5.837646484375, 6.09814453125, 6.358642578125, 6.619140625, 6.879638671875, 7.14013671875, 7.400634765625, 7.6611328125, 7.921630859375, 8.18212890625, 8.442626953125, 8.703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 7.0, 20.0, 18.0, 18.0, 35.0, 44.0, 69.0, 105.0, 151.0, 192.0, 304.0, 498.0, 647.0, 969.0, 1373.0, 1979.0, 3130.0, 4593.0, 6877.0, 10133.0, 15354.0, 22677.0, 34032.0, 49916.0, 69611.0, 93927.0, 116595.0, 128202.0, 123456.0, 104338.0, 79828.0, 57560.0, 39760.0, 27213.0, 17945.0, 12156.0, 8088.0, 5388.0, 3708.0, 2477.0, 1624.0, 1164.0, 753.0, 520.0, 352.0, 239.0, 178.0, 102.0, 76.0, 50.0, 38.0, 22.0, 19.0, 9.0, 10.0, 6.0, 3.0, 0.0, 3.0, 5.0], "bins": [-0.40869140625, -0.3958015441894531, -0.38291168212890625, -0.3700218200683594, -0.3571319580078125, -0.3442420959472656, -0.33135223388671875, -0.3184623718261719, -0.305572509765625, -0.2926826477050781, -0.27979278564453125, -0.2669029235839844, -0.2540130615234375, -0.24112319946289062, -0.22823333740234375, -0.21534347534179688, -0.20245361328125, -0.18956375122070312, -0.17667388916015625, -0.16378402709960938, -0.1508941650390625, -0.13800430297851562, -0.12511444091796875, -0.11222457885742188, -0.099334716796875, -0.08644485473632812, -0.07355499267578125, -0.060665130615234375, -0.0477752685546875, -0.034885406494140625, -0.02199554443359375, -0.009105682373046875, 0.0037841796875, 0.016674041748046875, 0.02956390380859375, 0.042453765869140625, 0.0553436279296875, 0.06823348999023438, 0.08112335205078125, 0.09401321411132812, 0.106903076171875, 0.11979293823242188, 0.13268280029296875, 0.14557266235351562, 0.1584625244140625, 0.17135238647460938, 0.18424224853515625, 0.19713211059570312, 0.21002197265625, 0.22291183471679688, 0.23580169677734375, 0.24869155883789062, 0.2615814208984375, 0.2744712829589844, 0.28736114501953125, 0.3002510070800781, 0.313140869140625, 0.3260307312011719, 0.33892059326171875, 0.3518104553222656, 0.3647003173828125, 0.3775901794433594, 0.39048004150390625, 0.4033699035644531, 0.416259765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 8.0, 2.0, 5.0, 6.0, 12.0, 8.0, 8.0, 7.0, 12.0, 14.0, 19.0, 26.0, 18.0, 33.0, 28.0, 44.0, 42.0, 40.0, 35.0, 45.0, 54.0, 34.0, 31.0, 38.0, 38.0, 45.0, 37.0, 28.0, 38.0, 42.0, 18.0, 39.0, 31.0, 18.0, 26.0, 14.0, 12.0, 10.0, 9.0, 8.0, 6.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.435555845499039e-05, -3.318674862384796e-05, -3.2017938792705536e-05, -3.084912896156311e-05, -2.9680319130420685e-05, -2.851150929927826e-05, -2.7342699468135834e-05, -2.6173889636993408e-05, -2.5005079805850983e-05, -2.3836269974708557e-05, -2.266746014356613e-05, -2.1498650312423706e-05, -2.032984048128128e-05, -1.9161030650138855e-05, -1.799222081899643e-05, -1.6823410987854004e-05, -1.565460115671158e-05, -1.4485791325569153e-05, -1.3316981494426727e-05, -1.2148171663284302e-05, -1.0979361832141876e-05, -9.81055200099945e-06, -8.641742169857025e-06, -7.4729323387146e-06, -6.304122507572174e-06, -5.1353126764297485e-06, -3.966502845287323e-06, -2.7976930141448975e-06, -1.628883183002472e-06, -4.600733518600464e-07, 7.087364792823792e-07, 1.8775463104248047e-06, 3.0463561415672302e-06, 4.215165972709656e-06, 5.383975803852081e-06, 6.552785634994507e-06, 7.721595466136932e-06, 8.890405297279358e-06, 1.0059215128421783e-05, 1.1228024959564209e-05, 1.2396834790706635e-05, 1.356564462184906e-05, 1.4734454452991486e-05, 1.590326428413391e-05, 1.7072074115276337e-05, 1.8240883946418762e-05, 1.9409693777561188e-05, 2.0578503608703613e-05, 2.174731343984604e-05, 2.2916123270988464e-05, 2.408493310213089e-05, 2.5253742933273315e-05, 2.642255276441574e-05, 2.7591362595558167e-05, 2.8760172426700592e-05, 2.9928982257843018e-05, 3.109779208898544e-05, 3.226660192012787e-05, 3.3435411751270294e-05, 3.460422158241272e-05, 3.5773031413555145e-05, 3.694184124469757e-05, 3.8110651075839996e-05, 3.927946090698242e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 7.0, 6.0, 17.0, 20.0, 40.0, 58.0, 84.0, 133.0, 211.0, 333.0, 507.0, 798.0, 1247.0, 1908.0, 3070.0, 4542.0, 6884.0, 10608.0, 16167.0, 23955.0, 35545.0, 51442.0, 71455.0, 94248.0, 113499.0, 123683.0, 119423.0, 103249.0, 80508.0, 59307.0, 41635.0, 28551.0, 19061.0, 12632.0, 8282.0, 5448.0, 3536.0, 2304.0, 1474.0, 919.0, 624.0, 436.0, 243.0, 149.0, 106.0, 76.0, 50.0, 33.0, 20.0, 11.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.5859375, -0.568023681640625, -0.55010986328125, -0.532196044921875, -0.5142822265625, -0.496368408203125, -0.47845458984375, -0.460540771484375, -0.442626953125, -0.424713134765625, -0.40679931640625, -0.388885498046875, -0.3709716796875, -0.353057861328125, -0.33514404296875, -0.317230224609375, -0.29931640625, -0.281402587890625, -0.26348876953125, -0.245574951171875, -0.2276611328125, -0.209747314453125, -0.19183349609375, -0.173919677734375, -0.156005859375, -0.138092041015625, -0.12017822265625, -0.102264404296875, -0.0843505859375, -0.066436767578125, -0.04852294921875, -0.030609130859375, -0.0126953125, 0.005218505859375, 0.02313232421875, 0.041046142578125, 0.0589599609375, 0.076873779296875, 0.09478759765625, 0.112701416015625, 0.130615234375, 0.148529052734375, 0.16644287109375, 0.184356689453125, 0.2022705078125, 0.220184326171875, 0.23809814453125, 0.256011962890625, 0.27392578125, 0.291839599609375, 0.30975341796875, 0.327667236328125, 0.3455810546875, 0.363494873046875, 0.38140869140625, 0.399322509765625, 0.417236328125, 0.435150146484375, 0.45306396484375, 0.470977783203125, 0.4888916015625, 0.506805419921875, 0.52471923828125, 0.542633056640625, 0.560546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 4.0, 7.0, 7.0, 9.0, 17.0, 10.0, 23.0, 22.0, 26.0, 21.0, 51.0, 45.0, 46.0, 63.0, 50.0, 67.0, 70.0, 48.0, 68.0, 48.0, 48.0, 34.0, 40.0, 38.0, 25.0, 20.0, 20.0, 13.0, 9.0, 10.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.326904296875, -0.3171501159667969, -0.30739593505859375, -0.2976417541503906, -0.2878875732421875, -0.2781333923339844, -0.26837921142578125, -0.2586250305175781, -0.248870849609375, -0.23911666870117188, -0.22936248779296875, -0.21960830688476562, -0.2098541259765625, -0.20009994506835938, -0.19034576416015625, -0.18059158325195312, -0.17083740234375, -0.16108322143554688, -0.15132904052734375, -0.14157485961914062, -0.1318206787109375, -0.12206649780273438, -0.11231231689453125, -0.10255813598632812, -0.092803955078125, -0.08304977416992188, -0.07329559326171875, -0.06354141235351562, -0.0537872314453125, -0.044033050537109375, -0.03427886962890625, -0.024524688720703125, -0.0147705078125, -0.005016326904296875, 0.00473785400390625, 0.014492034912109375, 0.0242462158203125, 0.034000396728515625, 0.04375457763671875, 0.053508758544921875, 0.063262939453125, 0.07301712036132812, 0.08277130126953125, 0.09252548217773438, 0.1022796630859375, 0.11203384399414062, 0.12178802490234375, 0.13154220581054688, 0.14129638671875, 0.15105056762695312, 0.16080474853515625, 0.17055892944335938, 0.1803131103515625, 0.19006729125976562, 0.19982147216796875, 0.20957565307617188, 0.219329833984375, 0.22908401489257812, 0.23883819580078125, 0.24859237670898438, 0.2583465576171875, 0.2681007385253906, 0.27785491943359375, 0.2876091003417969, 0.29736328125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 9.0, 10.0, 15.0, 14.0, 21.0, 22.0, 30.0, 32.0, 43.0, 44.0, 51.0, 35.0, 53.0, 40.0, 53.0, 46.0, 46.0, 41.0, 45.0, 50.0, 40.0, 39.0, 25.0, 29.0, 23.0, 20.0, 27.0, 14.0, 14.0, 17.0, 9.0, 7.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.982329368591309, -11.620776176452637, -11.259222984313965, -10.89767074584961, -10.536117553710938, -10.174564361572266, -9.813011169433594, -9.451457977294922, -9.08990478515625, -8.728351593017578, -8.366798400878906, -8.005245208740234, -7.643692493438721, -7.282139778137207, -6.920586585998535, -6.559033393859863, -6.19748067855835, -5.835927486419678, -5.474374771118164, -5.112821578979492, -4.75126838684082, -4.389715194702148, -4.028162479400635, -3.666609287261963, -3.30505633354187, -2.9435033798217773, -2.5819501876831055, -2.2203972339630127, -1.8588441610336304, -1.497291088104248, -1.1357381343841553, -0.7741849422454834, -0.4126319885253906, -0.05107894539833069, 0.31047409772872925, 0.6720271110534668, 1.0335801839828491, 1.3951332569122314, 1.7566862106323242, 2.118239402770996, 2.479792356491089, 2.8413453102111816, 3.2028985023498535, 3.5644514560699463, 3.926004409790039, 4.287557601928711, 4.649110794067383, 5.010663986206055, 5.372216701507568, 5.73376989364624, 6.095322608947754, 6.456875801086426, 6.818428993225098, 7.1799821853637695, 7.541534900665283, 7.903088092803955, 8.264640808105469, 8.62619400024414, 8.987747192382812, 9.349300384521484, 9.71085262298584, 10.072405815124512, 10.433959007263184, 10.795512199401855, 11.157065391540527]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 0.0, 3.0, 5.0, 4.0, 5.0, 8.0, 5.0, 7.0, 11.0, 16.0, 24.0, 15.0, 27.0, 27.0, 24.0, 24.0, 32.0, 25.0, 30.0, 35.0, 52.0, 40.0, 41.0, 40.0, 45.0, 28.0, 41.0, 41.0, 47.0, 36.0, 28.0, 26.0, 35.0, 20.0, 22.0, 28.0, 18.0, 19.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.077337265014648, -13.63789176940918, -13.198446273803711, -12.759000778198242, -12.319555282592773, -11.880109786987305, -11.440664291381836, -11.001218795776367, -10.561773300170898, -10.12232780456543, -9.682882308959961, -9.243436813354492, -8.803991317749023, -8.364545822143555, -7.925100326538086, -7.485654830932617, -7.046209335327148, -6.60676383972168, -6.167318344116211, -5.727872848510742, -5.288427352905273, -4.848981857299805, -4.409536361694336, -3.970090866088867, -3.5306453704833984, -3.0911998748779297, -2.651754379272461, -2.212308883666992, -1.7728633880615234, -1.3334178924560547, -0.8939723968505859, -0.4545269012451172, -0.015081405639648438, 0.4243640899658203, 0.8638095855712891, 1.3032550811767578, 1.7427005767822266, 2.1821460723876953, 2.621591567993164, 3.061037063598633, 3.5004825592041016, 3.9399280548095703, 4.379373550415039, 4.818819046020508, 5.258264541625977, 5.697710037231445, 6.137155532836914, 6.576601028442383, 7.016046524047852, 7.45549201965332, 7.894937515258789, 8.334383010864258, 8.773828506469727, 9.213274002075195, 9.652719497680664, 10.092164993286133, 10.531610488891602, 10.97105598449707, 11.410501480102539, 11.849946975708008, 12.289392471313477, 12.728837966918945, 13.168283462524414, 13.607728958129883, 14.047174453735352]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 10.0, 10.0, 18.0, 29.0, 39.0, 70.0, 114.0, 175.0, 305.0, 503.0, 786.0, 1244.0, 2047.0, 3228.0, 5001.0, 7463.0, 11104.0, 16416.0, 23736.0, 32596.0, 43919.0, 56350.0, 69309.0, 80928.0, 89767.0, 94301.0, 94014.0, 88257.0, 77105.0, 64933.0, 52225.0, 39997.0, 29476.0, 21021.0, 14629.0, 9673.0, 6423.0, 4115.0, 2665.0, 1729.0, 1032.0, 738.0, 401.0, 257.0, 143.0, 107.0, 55.0, 44.0, 24.0, 12.0, 11.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.40625, -5.2415771484375, -5.076904296875, -4.9122314453125, -4.74755859375, -4.5828857421875, -4.418212890625, -4.2535400390625, -4.0888671875, -3.9241943359375, -3.759521484375, -3.5948486328125, -3.43017578125, -3.2655029296875, -3.100830078125, -2.9361572265625, -2.771484375, -2.6068115234375, -2.442138671875, -2.2774658203125, -2.11279296875, -1.9481201171875, -1.783447265625, -1.6187744140625, -1.4541015625, -1.2894287109375, -1.124755859375, -0.9600830078125, -0.79541015625, -0.6307373046875, -0.466064453125, -0.3013916015625, -0.13671875, 0.0279541015625, 0.192626953125, 0.3572998046875, 0.52197265625, 0.6866455078125, 0.851318359375, 1.0159912109375, 1.1806640625, 1.3453369140625, 1.510009765625, 1.6746826171875, 1.83935546875, 2.0040283203125, 2.168701171875, 2.3333740234375, 2.498046875, 2.6627197265625, 2.827392578125, 2.9920654296875, 3.15673828125, 3.3214111328125, 3.486083984375, 3.6507568359375, 3.8154296875, 3.9801025390625, 4.144775390625, 4.3094482421875, 4.47412109375, 4.6387939453125, 4.803466796875, 4.9681396484375, 5.1328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 5.0, 14.0, 9.0, 18.0, 22.0, 23.0, 18.0, 28.0, 27.0, 39.0, 32.0, 52.0, 36.0, 29.0, 59.0, 48.0, 45.0, 54.0, 40.0, 40.0, 36.0, 35.0, 34.0, 34.0, 34.0, 30.0, 30.0, 17.0, 20.0, 19.0, 12.0, 7.0, 12.0, 8.0, 2.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.0, -15.5064697265625, -15.012939453125, -14.5194091796875, -14.02587890625, -13.5323486328125, -13.038818359375, -12.5452880859375, -12.0517578125, -11.5582275390625, -11.064697265625, -10.5711669921875, -10.07763671875, -9.5841064453125, -9.090576171875, -8.5970458984375, -8.103515625, -7.6099853515625, -7.116455078125, -6.6229248046875, -6.12939453125, -5.6358642578125, -5.142333984375, -4.6488037109375, -4.1552734375, -3.6617431640625, -3.168212890625, -2.6746826171875, -2.18115234375, -1.6876220703125, -1.194091796875, -0.7005615234375, -0.20703125, 0.2864990234375, 0.780029296875, 1.2735595703125, 1.76708984375, 2.2606201171875, 2.754150390625, 3.2476806640625, 3.7412109375, 4.2347412109375, 4.728271484375, 5.2218017578125, 5.71533203125, 6.2088623046875, 6.702392578125, 7.1959228515625, 7.689453125, 8.1829833984375, 8.676513671875, 9.1700439453125, 9.66357421875, 10.1571044921875, 10.650634765625, 11.1441650390625, 11.6376953125, 12.1312255859375, 12.624755859375, 13.1182861328125, 13.61181640625, 14.1053466796875, 14.598876953125, 15.0924072265625, 15.5859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 12.0, 13.0, 17.0, 32.0, 53.0, 70.0, 138.0, 202.0, 373.0, 600.0, 1006.0, 1649.0, 2670.0, 4433.0, 6932.0, 11057.0, 16671.0, 25148.0, 36002.0, 49834.0, 65416.0, 81762.0, 95008.0, 103141.0, 104880.0, 98758.0, 87496.0, 72267.0, 56036.0, 41974.0, 29175.0, 20118.0, 13182.0, 8477.0, 5338.0, 3349.0, 2116.0, 1233.0, 786.0, 443.0, 259.0, 183.0, 90.0, 55.0, 34.0, 26.0, 19.0, 16.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6484375, -6.4541015625, -6.259765625, -6.0654296875, -5.87109375, -5.6767578125, -5.482421875, -5.2880859375, -5.09375, -4.8994140625, -4.705078125, -4.5107421875, -4.31640625, -4.1220703125, -3.927734375, -3.7333984375, -3.5390625, -3.3447265625, -3.150390625, -2.9560546875, -2.76171875, -2.5673828125, -2.373046875, -2.1787109375, -1.984375, -1.7900390625, -1.595703125, -1.4013671875, -1.20703125, -1.0126953125, -0.818359375, -0.6240234375, -0.4296875, -0.2353515625, -0.041015625, 0.1533203125, 0.34765625, 0.5419921875, 0.736328125, 0.9306640625, 1.125, 1.3193359375, 1.513671875, 1.7080078125, 1.90234375, 2.0966796875, 2.291015625, 2.4853515625, 2.6796875, 2.8740234375, 3.068359375, 3.2626953125, 3.45703125, 3.6513671875, 3.845703125, 4.0400390625, 4.234375, 4.4287109375, 4.623046875, 4.8173828125, 5.01171875, 5.2060546875, 5.400390625, 5.5947265625, 5.7890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 3.0, 8.0, 8.0, 10.0, 16.0, 8.0, 23.0, 26.0, 27.0, 24.0, 37.0, 25.0, 42.0, 31.0, 41.0, 36.0, 38.0, 46.0, 55.0, 69.0, 45.0, 49.0, 37.0, 31.0, 39.0, 38.0, 31.0, 24.0, 24.0, 22.0, 18.0, 16.0, 16.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.336181640625, -9.01611328125, -8.696044921875, -8.3759765625, -8.055908203125, -7.73583984375, -7.415771484375, -7.095703125, -6.775634765625, -6.45556640625, -6.135498046875, -5.8154296875, -5.495361328125, -5.17529296875, -4.855224609375, -4.53515625, -4.215087890625, -3.89501953125, -3.574951171875, -3.2548828125, -2.934814453125, -2.61474609375, -2.294677734375, -1.974609375, -1.654541015625, -1.33447265625, -1.014404296875, -0.6943359375, -0.374267578125, -0.05419921875, 0.265869140625, 0.5859375, 0.906005859375, 1.22607421875, 1.546142578125, 1.8662109375, 2.186279296875, 2.50634765625, 2.826416015625, 3.146484375, 3.466552734375, 3.78662109375, 4.106689453125, 4.4267578125, 4.746826171875, 5.06689453125, 5.386962890625, 5.70703125, 6.027099609375, 6.34716796875, 6.667236328125, 6.9873046875, 7.307373046875, 7.62744140625, 7.947509765625, 8.267578125, 8.587646484375, 8.90771484375, 9.227783203125, 9.5478515625, 9.867919921875, 10.18798828125, 10.508056640625, 10.828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 15.0, 10.0, 11.0, 17.0, 25.0, 49.0, 58.0, 87.0, 163.0, 257.0, 363.0, 536.0, 928.0, 1466.0, 2422.0, 3978.0, 6640.0, 11105.0, 18240.0, 30193.0, 47029.0, 68327.0, 93820.0, 115564.0, 128649.0, 127969.0, 113981.0, 91683.0, 66486.0, 45227.0, 28656.0, 17443.0, 10732.0, 6347.0, 3814.0, 2325.0, 1379.0, 902.0, 586.0, 369.0, 261.0, 131.0, 114.0, 54.0, 49.0, 25.0, 22.0, 22.0, 13.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.9921875, -2.901397705078125, -2.81060791015625, -2.719818115234375, -2.6290283203125, -2.538238525390625, -2.44744873046875, -2.356658935546875, -2.265869140625, -2.175079345703125, -2.08428955078125, -1.993499755859375, -1.9027099609375, -1.811920166015625, -1.72113037109375, -1.630340576171875, -1.53955078125, -1.448760986328125, -1.35797119140625, -1.267181396484375, -1.1763916015625, -1.085601806640625, -0.99481201171875, -0.904022216796875, -0.813232421875, -0.722442626953125, -0.63165283203125, -0.540863037109375, -0.4500732421875, -0.359283447265625, -0.26849365234375, -0.177703857421875, -0.0869140625, 0.003875732421875, 0.09466552734375, 0.185455322265625, 0.2762451171875, 0.367034912109375, 0.45782470703125, 0.548614501953125, 0.639404296875, 0.730194091796875, 0.82098388671875, 0.911773681640625, 1.0025634765625, 1.093353271484375, 1.18414306640625, 1.274932861328125, 1.36572265625, 1.456512451171875, 1.54730224609375, 1.638092041015625, 1.7288818359375, 1.819671630859375, 1.91046142578125, 2.001251220703125, 2.092041015625, 2.182830810546875, 2.27362060546875, 2.364410400390625, 2.4552001953125, 2.545989990234375, 2.63677978515625, 2.727569580078125, 2.818359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 8.0, 5.0, 6.0, 10.0, 14.0, 23.0, 17.0, 19.0, 35.0, 23.0, 28.0, 38.0, 37.0, 50.0, 49.0, 44.0, 50.0, 42.0, 49.0, 30.0, 48.0, 46.0, 45.0, 41.0, 26.0, 27.0, 29.0, 15.0, 31.0, 22.0, 13.0, 16.0, 13.0, 9.0, 8.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00033664703369140625, -0.0003270655870437622, -0.00031748414039611816, -0.0003079026937484741, -0.0002983212471008301, -0.00028873980045318604, -0.000279158353805542, -0.00026957690715789795, -0.0002599954605102539, -0.00025041401386260986, -0.00024083256721496582, -0.00023125112056732178, -0.00022166967391967773, -0.0002120882272720337, -0.00020250678062438965, -0.0001929253339767456, -0.00018334388732910156, -0.00017376244068145752, -0.00016418099403381348, -0.00015459954738616943, -0.0001450181007385254, -0.00013543665409088135, -0.0001258552074432373, -0.00011627376079559326, -0.00010669231414794922, -9.711086750030518e-05, -8.752942085266113e-05, -7.794797420501709e-05, -6.836652755737305e-05, -5.8785080909729004e-05, -4.920363426208496e-05, -3.962218761444092e-05, -3.0040740966796875e-05, -2.0459294319152832e-05, -1.0877847671508789e-05, -1.296401023864746e-06, 8.285045623779297e-06, 1.786649227142334e-05, 2.7447938919067383e-05, 3.7029385566711426e-05, 4.661083221435547e-05, 5.619227886199951e-05, 6.577372550964355e-05, 7.53551721572876e-05, 8.493661880493164e-05, 9.451806545257568e-05, 0.00010409951210021973, 0.00011368095874786377, 0.0001232624053955078, 0.00013284385204315186, 0.0001424252986907959, 0.00015200674533843994, 0.00016158819198608398, 0.00017116963863372803, 0.00018075108528137207, 0.0001903325319290161, 0.00019991397857666016, 0.0002094954252243042, 0.00021907687187194824, 0.00022865831851959229, 0.00023823976516723633, 0.00024782121181488037, 0.0002574026584625244, 0.00026698410511016846, 0.0002765655517578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 11.0, 8.0, 17.0, 28.0, 46.0, 44.0, 100.0, 135.0, 226.0, 386.0, 614.0, 979.0, 1829.0, 3150.0, 5773.0, 10292.0, 18322.0, 32679.0, 54995.0, 84965.0, 119198.0, 145152.0, 151645.0, 136595.0, 105341.0, 71811.0, 44980.0, 25958.0, 14681.0, 7906.0, 4495.0, 2533.0, 1422.0, 843.0, 555.0, 284.0, 193.0, 110.0, 78.0, 53.0, 33.0, 20.0, 14.0, 10.0, 6.0, 6.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.609375, -3.49761962890625, -3.3858642578125, -3.27410888671875, -3.162353515625, -3.05059814453125, -2.9388427734375, -2.82708740234375, -2.71533203125, -2.60357666015625, -2.4918212890625, -2.38006591796875, -2.268310546875, -2.15655517578125, -2.0447998046875, -1.93304443359375, -1.8212890625, -1.70953369140625, -1.5977783203125, -1.48602294921875, -1.374267578125, -1.26251220703125, -1.1507568359375, -1.03900146484375, -0.92724609375, -0.81549072265625, -0.7037353515625, -0.59197998046875, -0.480224609375, -0.36846923828125, -0.2567138671875, -0.14495849609375, -0.033203125, 0.07855224609375, 0.1903076171875, 0.30206298828125, 0.413818359375, 0.52557373046875, 0.6373291015625, 0.74908447265625, 0.86083984375, 0.97259521484375, 1.0843505859375, 1.19610595703125, 1.307861328125, 1.41961669921875, 1.5313720703125, 1.64312744140625, 1.7548828125, 1.86663818359375, 1.9783935546875, 2.09014892578125, 2.201904296875, 2.31365966796875, 2.4254150390625, 2.53717041015625, 2.64892578125, 2.76068115234375, 2.8724365234375, 2.98419189453125, 3.095947265625, 3.20770263671875, 3.3194580078125, 3.43121337890625, 3.54296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 7.0, 12.0, 11.0, 10.0, 20.0, 16.0, 18.0, 20.0, 22.0, 32.0, 31.0, 26.0, 33.0, 37.0, 33.0, 57.0, 50.0, 44.0, 49.0, 40.0, 32.0, 34.0, 29.0, 40.0, 28.0, 37.0, 31.0, 24.0, 27.0, 25.0, 13.0, 16.0, 14.0, 15.0, 11.0, 11.0, 7.0, 5.0, 4.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.2919921875, -1.2536773681640625, -1.215362548828125, -1.1770477294921875, -1.13873291015625, -1.1004180908203125, -1.062103271484375, -1.0237884521484375, -0.9854736328125, -0.9471588134765625, -0.908843994140625, -0.8705291748046875, -0.83221435546875, -0.7938995361328125, -0.755584716796875, -0.7172698974609375, -0.678955078125, -0.6406402587890625, -0.602325439453125, -0.5640106201171875, -0.52569580078125, -0.4873809814453125, -0.449066162109375, -0.4107513427734375, -0.3724365234375, -0.3341217041015625, -0.295806884765625, -0.2574920654296875, -0.21917724609375, -0.1808624267578125, -0.142547607421875, -0.1042327880859375, -0.06591796875, -0.0276031494140625, 0.010711669921875, 0.0490264892578125, 0.08734130859375, 0.1256561279296875, 0.163970947265625, 0.2022857666015625, 0.2406005859375, 0.2789154052734375, 0.317230224609375, 0.3555450439453125, 0.39385986328125, 0.4321746826171875, 0.470489501953125, 0.5088043212890625, 0.547119140625, 0.5854339599609375, 0.623748779296875, 0.6620635986328125, 0.70037841796875, 0.7386932373046875, 0.777008056640625, 0.8153228759765625, 0.8536376953125, 0.8919525146484375, 0.930267333984375, 0.9685821533203125, 1.00689697265625, 1.0452117919921875, 1.083526611328125, 1.1218414306640625, 1.16015625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 7.0, 14.0, 11.0, 10.0, 20.0, 26.0, 26.0, 27.0, 33.0, 41.0, 43.0, 37.0, 46.0, 45.0, 52.0, 40.0, 42.0, 44.0, 37.0, 48.0, 41.0, 39.0, 40.0, 30.0, 24.0, 27.0, 20.0, 23.0, 16.0, 18.0, 11.0, 12.0, 8.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.094738006591797, -10.74846076965332, -10.40218448638916, -10.055908203125, -9.709630966186523, -9.363353729248047, -9.017077445983887, -8.670801162719727, -8.32452392578125, -7.978247165679932, -7.631970405578613, -7.285693645477295, -6.939416885375977, -6.593140125274658, -6.24686336517334, -5.9005866050720215, -5.554309844970703, -5.208033084869385, -4.861756324768066, -4.515479564666748, -4.16920280456543, -3.8229260444641113, -3.476649284362793, -3.1303725242614746, -2.7840957641601562, -2.437819004058838, -2.0915422439575195, -1.7452654838562012, -1.3989887237548828, -1.0527119636535645, -0.7064352035522461, -0.36015844345092773, -0.013880729675292969, 0.3323960304260254, 0.6786727905273438, 1.024949550628662, 1.3712263107299805, 1.7175030708312988, 2.063779830932617, 2.4100565910339355, 2.756333351135254, 3.1026101112365723, 3.4488868713378906, 3.795163631439209, 4.141440391540527, 4.487717151641846, 4.833993911743164, 5.180270671844482, 5.526547431945801, 5.872824192047119, 6.2191009521484375, 6.565377712249756, 6.911654472351074, 7.257931232452393, 7.604207992553711, 7.950484752655029, 8.296761512756348, 8.643037796020508, 8.989315032958984, 9.335592269897461, 9.681868553161621, 10.028144836425781, 10.374422073364258, 10.720699310302734, 11.066975593566895]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 7.0, 12.0, 13.0, 21.0, 16.0, 22.0, 26.0, 23.0, 29.0, 32.0, 40.0, 37.0, 40.0, 43.0, 33.0, 46.0, 46.0, 33.0, 39.0, 48.0, 51.0, 44.0, 43.0, 22.0, 27.0, 19.0, 19.0, 24.0, 23.0, 24.0, 16.0, 11.0, 8.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.210838317871094, -14.713766098022461, -14.216693878173828, -13.719621658325195, -13.222549438476562, -12.72547721862793, -12.22840404510498, -11.731331825256348, -11.234259605407715, -10.737187385559082, -10.24011516571045, -9.743042945861816, -9.245969772338867, -8.748897552490234, -8.251825332641602, -7.754753112792969, -7.257680892944336, -6.760608673095703, -6.26353645324707, -5.766463756561279, -5.2693915367126465, -4.772319316864014, -4.275246620178223, -3.77817440032959, -3.281102180480957, -2.784029960632324, -2.2869575023651123, -1.78988516330719, -1.2928128242492676, -0.7957406044006348, -0.29866814613342285, 0.19840431213378906, 0.6954765319824219, 1.1925488710403442, 1.6896212100982666, 2.1866936683654785, 2.6837658882141113, 3.180838108062744, 3.677910566329956, 4.174983024597168, 4.672055244445801, 5.169127464294434, 5.666199684143066, 6.163272380828857, 6.66034460067749, 7.157416820526123, 7.654489517211914, 8.151561737060547, 8.64863395690918, 9.145706176757812, 9.642778396606445, 10.139850616455078, 10.636922836303711, 11.133995056152344, 11.631068229675293, 12.128140449523926, 12.625212669372559, 13.122284889221191, 13.619357109069824, 14.116429328918457, 14.613502502441406, 15.110574722290039, 15.607646942138672, 16.104719161987305, 16.601791381835938]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 11.0, 20.0, 26.0, 44.0, 76.0, 118.0, 216.0, 364.0, 617.0, 985.0, 1740.0, 2779.0, 4723.0, 8003.0, 13224.0, 21003.0, 33422.0, 51912.0, 78772.0, 115818.0, 162148.0, 220579.0, 282773.0, 344305.0, 390665.0, 416069.0, 412286.0, 381742.0, 330344.0, 267960.0, 205086.0, 150122.0, 104891.0, 70191.0, 45706.0, 29591.0, 18176.0, 11149.0, 6797.0, 4062.0, 2394.0, 1470.0, 817.0, 475.0, 262.0, 142.0, 84.0, 49.0, 34.0, 19.0, 7.0, 9.0, 2.0, 2.0, 1.0], "bins": [-9.8984375, -9.6146240234375, -9.330810546875, -9.0469970703125, -8.76318359375, -8.4793701171875, -8.195556640625, -7.9117431640625, -7.6279296875, -7.3441162109375, -7.060302734375, -6.7764892578125, -6.49267578125, -6.2088623046875, -5.925048828125, -5.6412353515625, -5.357421875, -5.0736083984375, -4.789794921875, -4.5059814453125, -4.22216796875, -3.9383544921875, -3.654541015625, -3.3707275390625, -3.0869140625, -2.8031005859375, -2.519287109375, -2.2354736328125, -1.95166015625, -1.6678466796875, -1.384033203125, -1.1002197265625, -0.81640625, -0.5325927734375, -0.248779296875, 0.0350341796875, 0.31884765625, 0.6026611328125, 0.886474609375, 1.1702880859375, 1.4541015625, 1.7379150390625, 2.021728515625, 2.3055419921875, 2.58935546875, 2.8731689453125, 3.156982421875, 3.4407958984375, 3.724609375, 4.0084228515625, 4.292236328125, 4.5760498046875, 4.85986328125, 5.1436767578125, 5.427490234375, 5.7113037109375, 5.9951171875, 6.2789306640625, 6.562744140625, 6.8465576171875, 7.13037109375, 7.4141845703125, 7.697998046875, 7.9818115234375, 8.265625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 4.0, 3.0, 10.0, 7.0, 13.0, 12.0, 14.0, 21.0, 24.0, 25.0, 31.0, 32.0, 33.0, 36.0, 37.0, 36.0, 36.0, 47.0, 45.0, 39.0, 39.0, 52.0, 37.0, 47.0, 45.0, 29.0, 36.0, 25.0, 27.0, 30.0, 12.0, 28.0, 16.0, 11.0, 11.0, 9.0, 12.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.8878173828125, -14.416259765625, -13.9447021484375, -13.47314453125, -13.0015869140625, -12.530029296875, -12.0584716796875, -11.5869140625, -11.1153564453125, -10.643798828125, -10.1722412109375, -9.70068359375, -9.2291259765625, -8.757568359375, -8.2860107421875, -7.814453125, -7.3428955078125, -6.871337890625, -6.3997802734375, -5.92822265625, -5.4566650390625, -4.985107421875, -4.5135498046875, -4.0419921875, -3.5704345703125, -3.098876953125, -2.6273193359375, -2.15576171875, -1.6842041015625, -1.212646484375, -0.7410888671875, -0.26953125, 0.2020263671875, 0.673583984375, 1.1451416015625, 1.61669921875, 2.0882568359375, 2.559814453125, 3.0313720703125, 3.5029296875, 3.9744873046875, 4.446044921875, 4.9176025390625, 5.38916015625, 5.8607177734375, 6.332275390625, 6.8038330078125, 7.275390625, 7.7469482421875, 8.218505859375, 8.6900634765625, 9.16162109375, 9.6331787109375, 10.104736328125, 10.5762939453125, 11.0478515625, 11.5194091796875, 11.990966796875, 12.4625244140625, 12.93408203125, 13.4056396484375, 13.877197265625, 14.3487548828125, 14.8203125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 14.0, 24.0, 42.0, 71.0, 154.0, 234.0, 383.0, 614.0, 1163.0, 1974.0, 3165.0, 5479.0, 9187.0, 15378.0, 24666.0, 39282.0, 60476.0, 90995.0, 132785.0, 182761.0, 242817.0, 301229.0, 356824.0, 394289.0, 410506.0, 398785.0, 363485.0, 309376.0, 251001.0, 189676.0, 138670.0, 96011.0, 64277.0, 41841.0, 26727.0, 15886.0, 9710.0, 5784.0, 3534.0, 2050.0, 1212.0, 717.0, 404.0, 266.0, 165.0, 84.0, 49.0, 34.0, 15.0, 8.0, 2.0, 0.0, 3.0, 3.0], "bins": [-10.890625, -10.5755615234375, -10.260498046875, -9.9454345703125, -9.63037109375, -9.3153076171875, -9.000244140625, -8.6851806640625, -8.3701171875, -8.0550537109375, -7.739990234375, -7.4249267578125, -7.10986328125, -6.7947998046875, -6.479736328125, -6.1646728515625, -5.849609375, -5.5345458984375, -5.219482421875, -4.9044189453125, -4.58935546875, -4.2742919921875, -3.959228515625, -3.6441650390625, -3.3291015625, -3.0140380859375, -2.698974609375, -2.3839111328125, -2.06884765625, -1.7537841796875, -1.438720703125, -1.1236572265625, -0.80859375, -0.4935302734375, -0.178466796875, 0.1365966796875, 0.45166015625, 0.7667236328125, 1.081787109375, 1.3968505859375, 1.7119140625, 2.0269775390625, 2.342041015625, 2.6571044921875, 2.97216796875, 3.2872314453125, 3.602294921875, 3.9173583984375, 4.232421875, 4.5474853515625, 4.862548828125, 5.1776123046875, 5.49267578125, 5.8077392578125, 6.122802734375, 6.4378662109375, 6.7529296875, 7.0679931640625, 7.383056640625, 7.6981201171875, 8.01318359375, 8.3282470703125, 8.643310546875, 8.9583740234375, 9.2734375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 17.0, 20.0, 26.0, 35.0, 27.0, 56.0, 60.0, 78.0, 89.0, 104.0, 122.0, 163.0, 138.0, 149.0, 158.0, 186.0, 212.0, 207.0, 196.0, 188.0, 227.0, 170.0, 189.0, 158.0, 180.0, 152.0, 134.0, 101.0, 100.0, 77.0, 58.0, 65.0, 48.0, 50.0, 27.0, 19.0, 16.0, 13.0, 16.0, 7.0, 3.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.45703125, -6.24615478515625, -6.0352783203125, -5.82440185546875, -5.613525390625, -5.40264892578125, -5.1917724609375, -4.98089599609375, -4.77001953125, -4.55914306640625, -4.3482666015625, -4.13739013671875, -3.926513671875, -3.71563720703125, -3.5047607421875, -3.29388427734375, -3.0830078125, -2.87213134765625, -2.6612548828125, -2.45037841796875, -2.239501953125, -2.02862548828125, -1.8177490234375, -1.60687255859375, -1.39599609375, -1.18511962890625, -0.9742431640625, -0.76336669921875, -0.552490234375, -0.34161376953125, -0.1307373046875, 0.08013916015625, 0.291015625, 0.50189208984375, 0.7127685546875, 0.92364501953125, 1.134521484375, 1.34539794921875, 1.5562744140625, 1.76715087890625, 1.97802734375, 2.18890380859375, 2.3997802734375, 2.61065673828125, 2.821533203125, 3.03240966796875, 3.2432861328125, 3.45416259765625, 3.6650390625, 3.87591552734375, 4.0867919921875, 4.29766845703125, 4.508544921875, 4.71942138671875, 4.9302978515625, 5.14117431640625, 5.35205078125, 5.56292724609375, 5.7738037109375, 5.98468017578125, 6.195556640625, 6.40643310546875, 6.6173095703125, 6.82818603515625, 7.0390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 12.0, 9.0, 13.0, 16.0, 23.0, 21.0, 21.0, 18.0, 28.0, 29.0, 26.0, 41.0, 46.0, 37.0, 37.0, 47.0, 47.0, 55.0, 46.0, 38.0, 44.0, 45.0, 30.0, 35.0, 23.0, 21.0, 25.0, 21.0, 23.0, 14.0, 22.0, 11.0, 11.0, 11.0, 11.0, 8.0, 3.0, 6.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.201578140258789, -13.745174407958984, -13.28877067565918, -12.832367897033691, -12.375964164733887, -11.919560432434082, -11.463157653808594, -11.006753921508789, -10.550350189208984, -10.09394645690918, -9.637542724609375, -9.181139945983887, -8.724736213684082, -8.268332481384277, -7.811929225921631, -7.355525970458984, -6.89912223815918, -6.442718505859375, -5.9863152503967285, -5.529911994934082, -5.073508262634277, -4.617104530334473, -4.160701274871826, -3.7042977809906006, -3.247894287109375, -2.7914907932281494, -2.335087299346924, -1.8786838054656982, -1.4222803115844727, -0.9658768177032471, -0.5094733238220215, -0.0530698299407959, 0.4033327102661133, 0.8597362041473389, 1.3161396980285645, 1.77254319190979, 2.2289466857910156, 2.685350179672241, 3.141753673553467, 3.5981571674346924, 4.054560661315918, 4.510964393615723, 4.967367649078369, 5.423770904541016, 5.88017463684082, 6.336578369140625, 6.7929816246032715, 7.249384880065918, 7.705788612365723, 8.162192344665527, 8.618595123291016, 9.07499885559082, 9.531402587890625, 9.98780632019043, 10.444210052490234, 10.900612831115723, 11.357016563415527, 11.813420295715332, 12.26982307434082, 12.726226806640625, 13.18263053894043, 13.639034271240234, 14.095438003540039, 14.551840782165527, 15.008244514465332]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 5.0, 9.0, 10.0, 7.0, 8.0, 7.0, 17.0, 16.0, 13.0, 13.0, 19.0, 27.0, 27.0, 28.0, 20.0, 38.0, 39.0, 37.0, 26.0, 29.0, 39.0, 53.0, 37.0, 42.0, 34.0, 30.0, 36.0, 33.0, 32.0, 30.0, 27.0, 24.0, 28.0, 19.0, 18.0, 19.0, 14.0, 13.0, 13.0, 10.0, 10.0, 10.0, 5.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-17.918136596679688, -17.35854721069336, -16.79895782470703, -16.239368438720703, -15.679780006408691, -15.120190620422363, -14.560601234436035, -14.001011848449707, -13.441423416137695, -12.881834030151367, -12.322244644165039, -11.762655258178711, -11.2030668258667, -10.643477439880371, -10.083888053894043, -9.524298667907715, -8.964709281921387, -8.405119895935059, -7.845530986785889, -7.2859416007995605, -6.726352691650391, -6.1667633056640625, -5.607173919677734, -5.047584533691406, -4.487995624542236, -3.9284064769744873, -3.3688173294067383, -2.80922794342041, -2.249638795852661, -1.690049648284912, -1.130460262298584, -0.570871114730835, -0.011281967163085938, 0.5483072400093079, 1.1078964471817017, 1.6674857139587402, 2.2270748615264893, 2.7866640090942383, 3.3462533950805664, 3.9058425426483154, 4.4654316902160645, 5.025021076202393, 5.5846099853515625, 6.144199371337891, 6.703788757324219, 7.263377666473389, 7.822967052459717, 8.382555961608887, 8.942145347595215, 9.501734733581543, 10.061324119567871, 10.620912551879883, 11.180501937866211, 11.740091323852539, 12.299680709838867, 12.859270095825195, 13.418859481811523, 13.978448867797852, 14.53803825378418, 15.097627639770508, 15.65721607208252, 16.21680450439453, 16.77639389038086, 17.335983276367188, 17.895572662353516]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 11.0, 6.0, 19.0, 23.0, 25.0, 38.0, 74.0, 94.0, 130.0, 200.0, 274.0, 375.0, 551.0, 825.0, 1155.0, 1686.0, 2508.0, 3559.0, 5371.0, 8056.0, 11597.0, 17365.0, 25685.0, 36916.0, 52408.0, 71043.0, 91895.0, 110519.0, 120074.0, 114623.0, 99624.0, 79374.0, 58808.0, 42376.0, 29204.0, 20052.0, 13394.0, 9025.0, 6273.0, 4141.0, 2882.0, 1985.0, 1334.0, 930.0, 620.0, 423.0, 295.0, 229.0, 143.0, 105.0, 82.0, 56.0, 44.0, 17.0, 13.0, 19.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.482421875, -2.401519775390625, -2.32061767578125, -2.239715576171875, -2.1588134765625, -2.077911376953125, -1.99700927734375, -1.916107177734375, -1.835205078125, -1.754302978515625, -1.67340087890625, -1.592498779296875, -1.5115966796875, -1.430694580078125, -1.34979248046875, -1.268890380859375, -1.18798828125, -1.107086181640625, -1.02618408203125, -0.945281982421875, -0.8643798828125, -0.783477783203125, -0.70257568359375, -0.621673583984375, -0.540771484375, -0.459869384765625, -0.37896728515625, -0.298065185546875, -0.2171630859375, -0.136260986328125, -0.05535888671875, 0.025543212890625, 0.1064453125, 0.187347412109375, 0.26824951171875, 0.349151611328125, 0.4300537109375, 0.510955810546875, 0.59185791015625, 0.672760009765625, 0.753662109375, 0.834564208984375, 0.91546630859375, 0.996368408203125, 1.0772705078125, 1.158172607421875, 1.23907470703125, 1.319976806640625, 1.40087890625, 1.481781005859375, 1.56268310546875, 1.643585205078125, 1.7244873046875, 1.805389404296875, 1.88629150390625, 1.967193603515625, 2.048095703125, 2.128997802734375, 2.20989990234375, 2.290802001953125, 2.3717041015625, 2.452606201171875, 2.53350830078125, 2.614410400390625, 2.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 13.0, 7.0, 5.0, 7.0, 7.0, 12.0, 9.0, 15.0, 16.0, 15.0, 29.0, 25.0, 23.0, 24.0, 33.0, 27.0, 37.0, 52.0, 26.0, 32.0, 43.0, 41.0, 40.0, 35.0, 33.0, 38.0, 35.0, 34.0, 26.0, 35.0, 21.0, 25.0, 21.0, 29.0, 20.0, 13.0, 13.0, 6.0, 21.0, 13.0, 10.0, 9.0, 2.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-18.640625, -18.056884765625, -17.47314453125, -16.889404296875, -16.3056640625, -15.721923828125, -15.13818359375, -14.554443359375, -13.970703125, -13.386962890625, -12.80322265625, -12.219482421875, -11.6357421875, -11.052001953125, -10.46826171875, -9.884521484375, -9.30078125, -8.717041015625, -8.13330078125, -7.549560546875, -6.9658203125, -6.382080078125, -5.79833984375, -5.214599609375, -4.630859375, -4.047119140625, -3.46337890625, -2.879638671875, -2.2958984375, -1.712158203125, -1.12841796875, -0.544677734375, 0.0390625, 0.622802734375, 1.20654296875, 1.790283203125, 2.3740234375, 2.957763671875, 3.54150390625, 4.125244140625, 4.708984375, 5.292724609375, 5.87646484375, 6.460205078125, 7.0439453125, 7.627685546875, 8.21142578125, 8.795166015625, 9.37890625, 9.962646484375, 10.54638671875, 11.130126953125, 11.7138671875, 12.297607421875, 12.88134765625, 13.465087890625, 14.048828125, 14.632568359375, 15.21630859375, 15.800048828125, 16.3837890625, 16.967529296875, 17.55126953125, 18.135009765625, 18.71875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 9.0, 10.0, 16.0, 15.0, 26.0, 51.0, 63.0, 97.0, 131.0, 173.0, 245.0, 385.0, 581.0, 822.0, 1236.0, 1756.0, 2828.0, 4394.0, 6994.0, 11018.0, 17696.0, 28887.0, 46496.0, 73488.0, 107790.0, 141481.0, 155279.0, 141344.0, 107461.0, 73426.0, 46756.0, 28876.0, 17591.0, 11149.0, 6972.0, 4363.0, 2873.0, 1933.0, 1274.0, 826.0, 564.0, 340.0, 260.0, 175.0, 118.0, 87.0, 59.0, 47.0, 34.0, 16.0, 20.0, 14.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-3.33203125, -3.2294921875, -3.126953125, -3.0244140625, -2.921875, -2.8193359375, -2.716796875, -2.6142578125, -2.51171875, -2.4091796875, -2.306640625, -2.2041015625, -2.1015625, -1.9990234375, -1.896484375, -1.7939453125, -1.69140625, -1.5888671875, -1.486328125, -1.3837890625, -1.28125, -1.1787109375, -1.076171875, -0.9736328125, -0.87109375, -0.7685546875, -0.666015625, -0.5634765625, -0.4609375, -0.3583984375, -0.255859375, -0.1533203125, -0.05078125, 0.0517578125, 0.154296875, 0.2568359375, 0.359375, 0.4619140625, 0.564453125, 0.6669921875, 0.76953125, 0.8720703125, 0.974609375, 1.0771484375, 1.1796875, 1.2822265625, 1.384765625, 1.4873046875, 1.58984375, 1.6923828125, 1.794921875, 1.8974609375, 2.0, 2.1025390625, 2.205078125, 2.3076171875, 2.41015625, 2.5126953125, 2.615234375, 2.7177734375, 2.8203125, 2.9228515625, 3.025390625, 3.1279296875, 3.23046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 2.0, 6.0, 10.0, 5.0, 9.0, 12.0, 16.0, 16.0, 11.0, 19.0, 21.0, 27.0, 24.0, 33.0, 27.0, 33.0, 39.0, 27.0, 40.0, 55.0, 40.0, 58.0, 33.0, 30.0, 40.0, 40.0, 39.0, 33.0, 42.0, 24.0, 26.0, 27.0, 17.0, 16.0, 10.0, 25.0, 17.0, 10.0, 9.0, 6.0, 7.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-11.546875, -11.18994140625, -10.8330078125, -10.47607421875, -10.119140625, -9.76220703125, -9.4052734375, -9.04833984375, -8.69140625, -8.33447265625, -7.9775390625, -7.62060546875, -7.263671875, -6.90673828125, -6.5498046875, -6.19287109375, -5.8359375, -5.47900390625, -5.1220703125, -4.76513671875, -4.408203125, -4.05126953125, -3.6943359375, -3.33740234375, -2.98046875, -2.62353515625, -2.2666015625, -1.90966796875, -1.552734375, -1.19580078125, -0.8388671875, -0.48193359375, -0.125, 0.23193359375, 0.5888671875, 0.94580078125, 1.302734375, 1.65966796875, 2.0166015625, 2.37353515625, 2.73046875, 3.08740234375, 3.4443359375, 3.80126953125, 4.158203125, 4.51513671875, 4.8720703125, 5.22900390625, 5.5859375, 5.94287109375, 6.2998046875, 6.65673828125, 7.013671875, 7.37060546875, 7.7275390625, 8.08447265625, 8.44140625, 8.79833984375, 9.1552734375, 9.51220703125, 9.869140625, 10.22607421875, 10.5830078125, 10.93994140625, 11.296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 28.0, 34.0, 58.0, 94.0, 144.0, 242.0, 355.0, 597.0, 982.0, 1546.0, 2642.0, 4388.0, 7301.0, 11989.0, 20299.0, 34240.0, 56272.0, 89080.0, 130721.0, 163624.0, 163422.0, 130327.0, 89241.0, 56128.0, 34358.0, 20112.0, 12161.0, 7036.0, 4372.0, 2540.0, 1547.0, 1004.0, 608.0, 354.0, 238.0, 168.0, 93.0, 62.0, 47.0, 23.0, 17.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8173828125, -0.791839599609375, -0.76629638671875, -0.740753173828125, -0.7152099609375, -0.689666748046875, -0.66412353515625, -0.638580322265625, -0.613037109375, -0.587493896484375, -0.56195068359375, -0.536407470703125, -0.5108642578125, -0.485321044921875, -0.45977783203125, -0.434234619140625, -0.40869140625, -0.383148193359375, -0.35760498046875, -0.332061767578125, -0.3065185546875, -0.280975341796875, -0.25543212890625, -0.229888916015625, -0.204345703125, -0.178802490234375, -0.15325927734375, -0.127716064453125, -0.1021728515625, -0.076629638671875, -0.05108642578125, -0.025543212890625, 0.0, 0.025543212890625, 0.05108642578125, 0.076629638671875, 0.1021728515625, 0.127716064453125, 0.15325927734375, 0.178802490234375, 0.204345703125, 0.229888916015625, 0.25543212890625, 0.280975341796875, 0.3065185546875, 0.332061767578125, 0.35760498046875, 0.383148193359375, 0.40869140625, 0.434234619140625, 0.45977783203125, 0.485321044921875, 0.5108642578125, 0.536407470703125, 0.56195068359375, 0.587493896484375, 0.613037109375, 0.638580322265625, 0.66412353515625, 0.689666748046875, 0.7152099609375, 0.740753173828125, 0.76629638671875, 0.791839599609375, 0.8173828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 11.0, 7.0, 8.0, 8.0, 19.0, 18.0, 17.0, 18.0, 27.0, 33.0, 19.0, 28.0, 37.0, 35.0, 39.0, 38.0, 38.0, 37.0, 36.0, 32.0, 35.0, 40.0, 37.0, 34.0, 43.0, 29.0, 42.0, 22.0, 32.0, 23.0, 23.0, 15.0, 19.0, 14.0, 12.0, 10.0, 9.0, 6.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.1081180572509766e-05, -4.945043474435806e-05, -4.781968891620636e-05, -4.618894308805466e-05, -4.4558197259902954e-05, -4.292745143175125e-05, -4.129670560359955e-05, -3.9665959775447845e-05, -3.803521394729614e-05, -3.640446811914444e-05, -3.477372229099274e-05, -3.3142976462841034e-05, -3.151223063468933e-05, -2.9881484806537628e-05, -2.8250738978385925e-05, -2.6619993150234222e-05, -2.498924732208252e-05, -2.3358501493930817e-05, -2.1727755665779114e-05, -2.009700983762741e-05, -1.8466264009475708e-05, -1.6835518181324005e-05, -1.5204772353172302e-05, -1.35740265250206e-05, -1.1943280696868896e-05, -1.0312534868717194e-05, -8.68178904056549e-06, -7.051043212413788e-06, -5.420297384262085e-06, -3.789551556110382e-06, -2.158805727958679e-06, -5.280598998069763e-07, 1.1026859283447266e-06, 2.7334317564964294e-06, 4.364177584648132e-06, 5.994923412799835e-06, 7.625669240951538e-06, 9.256415069103241e-06, 1.0887160897254944e-05, 1.2517906725406647e-05, 1.414865255355835e-05, 1.5779398381710052e-05, 1.7410144209861755e-05, 1.9040890038013458e-05, 2.067163586616516e-05, 2.2302381694316864e-05, 2.3933127522468567e-05, 2.556387335062027e-05, 2.7194619178771973e-05, 2.8825365006923676e-05, 3.045611083507538e-05, 3.208685666322708e-05, 3.3717602491378784e-05, 3.534834831953049e-05, 3.697909414768219e-05, 3.860983997583389e-05, 4.0240585803985596e-05, 4.18713316321373e-05, 4.3502077460289e-05, 4.5132823288440704e-05, 4.676356911659241e-05, 4.839431494474411e-05, 5.002506077289581e-05, 5.1655806601047516e-05, 5.328655242919922e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 13.0, 8.0, 16.0, 23.0, 29.0, 46.0, 68.0, 115.0, 140.0, 259.0, 338.0, 546.0, 769.0, 1206.0, 1800.0, 2580.0, 4189.0, 6240.0, 9733.0, 14909.0, 23218.0, 35567.0, 52907.0, 76116.0, 103282.0, 126569.0, 136505.0, 125951.0, 101227.0, 74230.0, 51093.0, 34255.0, 22898.0, 14492.0, 9422.0, 6038.0, 3961.0, 2583.0, 1699.0, 1133.0, 815.0, 507.0, 376.0, 249.0, 145.0, 111.0, 61.0, 41.0, 31.0, 20.0, 18.0, 4.0, 6.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.93017578125, -0.9006118774414062, -0.8710479736328125, -0.8414840698242188, -0.811920166015625, -0.7823562622070312, -0.7527923583984375, -0.7232284545898438, -0.69366455078125, -0.6641006469726562, -0.6345367431640625, -0.6049728393554688, -0.575408935546875, -0.5458450317382812, -0.5162811279296875, -0.48671722412109375, -0.4571533203125, -0.42758941650390625, -0.3980255126953125, -0.36846160888671875, -0.338897705078125, -0.30933380126953125, -0.2797698974609375, -0.25020599365234375, -0.22064208984375, -0.19107818603515625, -0.1615142822265625, -0.13195037841796875, -0.102386474609375, -0.07282257080078125, -0.0432586669921875, -0.01369476318359375, 0.015869140625, 0.04543304443359375, 0.0749969482421875, 0.10456085205078125, 0.134124755859375, 0.16368865966796875, 0.1932525634765625, 0.22281646728515625, 0.25238037109375, 0.28194427490234375, 0.3115081787109375, 0.34107208251953125, 0.370635986328125, 0.40019989013671875, 0.4297637939453125, 0.45932769775390625, 0.4888916015625, 0.5184555053710938, 0.5480194091796875, 0.5775833129882812, 0.607147216796875, 0.6367111206054688, 0.6662750244140625, 0.6958389282226562, 0.72540283203125, 0.7549667358398438, 0.7845306396484375, 0.8140945434570312, 0.843658447265625, 0.8732223510742188, 0.9027862548828125, 0.9323501586914062, 0.9619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 9.0, 9.0, 19.0, 16.0, 23.0, 28.0, 30.0, 25.0, 30.0, 39.0, 59.0, 47.0, 47.0, 64.0, 62.0, 47.0, 50.0, 62.0, 34.0, 39.0, 43.0, 26.0, 34.0, 29.0, 27.0, 19.0, 12.0, 8.0, 9.0, 11.0, 11.0, 7.0, 6.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462890625, -0.4457244873046875, -0.428558349609375, -0.4113922119140625, -0.39422607421875, -0.3770599365234375, -0.359893798828125, -0.3427276611328125, -0.3255615234375, -0.3083953857421875, -0.291229248046875, -0.2740631103515625, -0.25689697265625, -0.2397308349609375, -0.222564697265625, -0.2053985595703125, -0.188232421875, -0.1710662841796875, -0.153900146484375, -0.1367340087890625, -0.11956787109375, -0.1024017333984375, -0.085235595703125, -0.0680694580078125, -0.0509033203125, -0.0337371826171875, -0.016571044921875, 0.0005950927734375, 0.01776123046875, 0.0349273681640625, 0.052093505859375, 0.0692596435546875, 0.08642578125, 0.1035919189453125, 0.120758056640625, 0.1379241943359375, 0.15509033203125, 0.1722564697265625, 0.189422607421875, 0.2065887451171875, 0.2237548828125, 0.2409210205078125, 0.258087158203125, 0.2752532958984375, 0.29241943359375, 0.3095855712890625, 0.326751708984375, 0.3439178466796875, 0.361083984375, 0.3782501220703125, 0.395416259765625, 0.4125823974609375, 0.42974853515625, 0.4469146728515625, 0.464080810546875, 0.4812469482421875, 0.4984130859375, 0.5155792236328125, 0.532745361328125, 0.5499114990234375, 0.56707763671875, 0.5842437744140625, 0.601409912109375, 0.6185760498046875, 0.6357421875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 12.0, 22.0, 15.0, 25.0, 21.0, 22.0, 25.0, 38.0, 27.0, 39.0, 43.0, 30.0, 53.0, 41.0, 50.0, 49.0, 47.0, 37.0, 46.0, 43.0, 31.0, 34.0, 21.0, 24.0, 25.0, 22.0, 19.0, 17.0, 17.0, 12.0, 13.0, 10.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.363988876342773, -13.901348114013672, -13.43870735168457, -12.976066589355469, -12.513425827026367, -12.050785064697266, -11.588144302368164, -11.125503540039062, -10.662862777709961, -10.20022201538086, -9.737581253051758, -9.274940490722656, -8.812299728393555, -8.349658966064453, -7.887018203735352, -7.42437744140625, -6.961736679077148, -6.499095916748047, -6.036455154418945, -5.573814392089844, -5.111173629760742, -4.648532867431641, -4.185892105102539, -3.7232513427734375, -3.260610580444336, -2.7979698181152344, -2.335329055786133, -1.8726882934570312, -1.4100475311279297, -0.9474067687988281, -0.48476600646972656, -0.022125244140625, 0.44051551818847656, 0.9031562805175781, 1.3657970428466797, 1.8284378051757812, 2.291078567504883, 2.7537193298339844, 3.216360092163086, 3.6790008544921875, 4.141641616821289, 4.604282379150391, 5.066923141479492, 5.529563903808594, 5.992204666137695, 6.454845428466797, 6.917486190795898, 7.380126953125, 7.842767715454102, 8.305408477783203, 8.768049240112305, 9.230690002441406, 9.693330764770508, 10.15597152709961, 10.618612289428711, 11.081253051757812, 11.543893814086914, 12.006534576416016, 12.469175338745117, 12.931816101074219, 13.39445686340332, 13.857097625732422, 14.319738388061523, 14.782379150390625, 15.245019912719727]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 9.0, 6.0, 8.0, 5.0, 17.0, 20.0, 12.0, 11.0, 20.0, 23.0, 31.0, 26.0, 25.0, 37.0, 32.0, 37.0, 31.0, 25.0, 40.0, 55.0, 42.0, 35.0, 36.0, 30.0, 35.0, 36.0, 33.0, 32.0, 22.0, 29.0, 26.0, 17.0, 21.0, 18.0, 15.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-18.04243278503418, -17.478641510009766, -16.914852142333984, -16.35106086730957, -15.787269592285156, -15.223478317260742, -14.659687995910645, -14.095897674560547, -13.532106399536133, -12.968315124511719, -12.404524803161621, -11.840734481811523, -11.27694320678711, -10.713151931762695, -10.149361610412598, -9.5855712890625, -9.021780014038086, -8.457988739013672, -7.894198417663574, -7.330407619476318, -6.7666168212890625, -6.202826023101807, -5.639035224914551, -5.075244426727295, -4.511453628540039, -3.947662830352783, -3.3838720321655273, -2.8200812339782715, -2.2562904357910156, -1.6924996376037598, -1.128708839416504, -0.564918041229248, -0.0011272430419921875, 0.5626635551452637, 1.1264543533325195, 1.6902451515197754, 2.2540359497070312, 2.817826747894287, 3.381617546081543, 3.945408344268799, 4.509199142456055, 5.0729899406433105, 5.636780738830566, 6.200571537017822, 6.764362335205078, 7.328153133392334, 7.89194393157959, 8.455734252929688, 9.019525527954102, 9.583316802978516, 10.147107124328613, 10.710897445678711, 11.274688720703125, 11.838479995727539, 12.402270317077637, 12.966060638427734, 13.529851913452148, 14.093643188476562, 14.65743350982666, 15.221223831176758, 15.785015106201172, 16.348806381225586, 16.91259765625, 17.47638702392578, 18.040178298950195]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 7.0, 3.0, 3.0, 13.0, 14.0, 21.0, 18.0, 40.0, 68.0, 70.0, 117.0, 198.0, 291.0, 464.0, 711.0, 1159.0, 1954.0, 3201.0, 5381.0, 9126.0, 14730.0, 24399.0, 38403.0, 58530.0, 82354.0, 106643.0, 124839.0, 130808.0, 121816.0, 102108.0, 76105.0, 54111.0, 35187.0, 21845.0, 13333.0, 7988.0, 4796.0, 2930.0, 1726.0, 1147.0, 634.0, 428.0, 280.0, 211.0, 128.0, 79.0, 51.0, 30.0, 21.0, 18.0, 16.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0], "bins": [-11.0, -10.68017578125, -10.3603515625, -10.04052734375, -9.720703125, -9.40087890625, -9.0810546875, -8.76123046875, -8.44140625, -8.12158203125, -7.8017578125, -7.48193359375, -7.162109375, -6.84228515625, -6.5224609375, -6.20263671875, -5.8828125, -5.56298828125, -5.2431640625, -4.92333984375, -4.603515625, -4.28369140625, -3.9638671875, -3.64404296875, -3.32421875, -3.00439453125, -2.6845703125, -2.36474609375, -2.044921875, -1.72509765625, -1.4052734375, -1.08544921875, -0.765625, -0.44580078125, -0.1259765625, 0.19384765625, 0.513671875, 0.83349609375, 1.1533203125, 1.47314453125, 1.79296875, 2.11279296875, 2.4326171875, 2.75244140625, 3.072265625, 3.39208984375, 3.7119140625, 4.03173828125, 4.3515625, 4.67138671875, 4.9912109375, 5.31103515625, 5.630859375, 5.95068359375, 6.2705078125, 6.59033203125, 6.91015625, 7.22998046875, 7.5498046875, 7.86962890625, 8.189453125, 8.50927734375, 8.8291015625, 9.14892578125, 9.46875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 5.0, 1.0, 5.0, 7.0, 14.0, 18.0, 12.0, 13.0, 15.0, 17.0, 17.0, 21.0, 31.0, 31.0, 35.0, 31.0, 27.0, 32.0, 39.0, 47.0, 37.0, 37.0, 50.0, 36.0, 47.0, 32.0, 38.0, 39.0, 32.0, 33.0, 34.0, 20.0, 27.0, 16.0, 12.0, 12.0, 27.0, 9.0, 5.0, 10.0, 3.0, 5.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.98583984375, -17.3935546875, -16.80126953125, -16.208984375, -15.61669921875, -15.0244140625, -14.43212890625, -13.83984375, -13.24755859375, -12.6552734375, -12.06298828125, -11.470703125, -10.87841796875, -10.2861328125, -9.69384765625, -9.1015625, -8.50927734375, -7.9169921875, -7.32470703125, -6.732421875, -6.14013671875, -5.5478515625, -4.95556640625, -4.36328125, -3.77099609375, -3.1787109375, -2.58642578125, -1.994140625, -1.40185546875, -0.8095703125, -0.21728515625, 0.375, 0.96728515625, 1.5595703125, 2.15185546875, 2.744140625, 3.33642578125, 3.9287109375, 4.52099609375, 5.11328125, 5.70556640625, 6.2978515625, 6.89013671875, 7.482421875, 8.07470703125, 8.6669921875, 9.25927734375, 9.8515625, 10.44384765625, 11.0361328125, 11.62841796875, 12.220703125, 12.81298828125, 13.4052734375, 13.99755859375, 14.58984375, 15.18212890625, 15.7744140625, 16.36669921875, 16.958984375, 17.55126953125, 18.1435546875, 18.73583984375, 19.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 12.0, 15.0, 20.0, 36.0, 55.0, 80.0, 129.0, 187.0, 298.0, 459.0, 647.0, 944.0, 1494.0, 2340.0, 3559.0, 5571.0, 8775.0, 13915.0, 22348.0, 34790.0, 52675.0, 76356.0, 101969.0, 124770.0, 133555.0, 125642.0, 104954.0, 78876.0, 54668.0, 35957.0, 22997.0, 14588.0, 9154.0, 5826.0, 3803.0, 2453.0, 1630.0, 1025.0, 660.0, 441.0, 281.0, 211.0, 139.0, 93.0, 59.0, 38.0, 28.0, 19.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.1484375, -11.750732421875, -11.35302734375, -10.955322265625, -10.5576171875, -10.159912109375, -9.76220703125, -9.364501953125, -8.966796875, -8.569091796875, -8.17138671875, -7.773681640625, -7.3759765625, -6.978271484375, -6.58056640625, -6.182861328125, -5.78515625, -5.387451171875, -4.98974609375, -4.592041015625, -4.1943359375, -3.796630859375, -3.39892578125, -3.001220703125, -2.603515625, -2.205810546875, -1.80810546875, -1.410400390625, -1.0126953125, -0.614990234375, -0.21728515625, 0.180419921875, 0.578125, 0.975830078125, 1.37353515625, 1.771240234375, 2.1689453125, 2.566650390625, 2.96435546875, 3.362060546875, 3.759765625, 4.157470703125, 4.55517578125, 4.952880859375, 5.3505859375, 5.748291015625, 6.14599609375, 6.543701171875, 6.94140625, 7.339111328125, 7.73681640625, 8.134521484375, 8.5322265625, 8.929931640625, 9.32763671875, 9.725341796875, 10.123046875, 10.520751953125, 10.91845703125, 11.316162109375, 11.7138671875, 12.111572265625, 12.50927734375, 12.906982421875, 13.3046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 6.0, 6.0, 2.0, 10.0, 13.0, 13.0, 14.0, 18.0, 20.0, 15.0, 28.0, 17.0, 24.0, 24.0, 21.0, 34.0, 25.0, 27.0, 43.0, 43.0, 43.0, 41.0, 29.0, 41.0, 36.0, 30.0, 37.0, 33.0, 29.0, 34.0, 23.0, 27.0, 26.0, 21.0, 30.0, 13.0, 19.0, 11.0, 13.0, 6.0, 6.0, 10.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.8203125, -10.4608154296875, -10.101318359375, -9.7418212890625, -9.38232421875, -9.0228271484375, -8.663330078125, -8.3038330078125, -7.9443359375, -7.5848388671875, -7.225341796875, -6.8658447265625, -6.50634765625, -6.1468505859375, -5.787353515625, -5.4278564453125, -5.068359375, -4.7088623046875, -4.349365234375, -3.9898681640625, -3.63037109375, -3.2708740234375, -2.911376953125, -2.5518798828125, -2.1923828125, -1.8328857421875, -1.473388671875, -1.1138916015625, -0.75439453125, -0.3948974609375, -0.035400390625, 0.3240966796875, 0.68359375, 1.0430908203125, 1.402587890625, 1.7620849609375, 2.12158203125, 2.4810791015625, 2.840576171875, 3.2000732421875, 3.5595703125, 3.9190673828125, 4.278564453125, 4.6380615234375, 4.99755859375, 5.3570556640625, 5.716552734375, 6.0760498046875, 6.435546875, 6.7950439453125, 7.154541015625, 7.5140380859375, 7.87353515625, 8.2330322265625, 8.592529296875, 8.9520263671875, 9.3115234375, 9.6710205078125, 10.030517578125, 10.3900146484375, 10.74951171875, 11.1090087890625, 11.468505859375, 11.8280029296875, 12.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 5.0, 18.0, 23.0, 34.0, 50.0, 97.0, 109.0, 166.0, 303.0, 449.0, 640.0, 986.0, 1475.0, 2328.0, 3751.0, 6264.0, 10432.0, 18120.0, 31662.0, 53576.0, 85074.0, 121645.0, 149243.0, 155642.0, 137121.0, 102315.0, 67951.0, 40954.0, 24002.0, 13141.0, 7836.0, 4732.0, 3062.0, 1921.0, 1164.0, 806.0, 514.0, 330.0, 223.0, 153.0, 89.0, 46.0, 34.0, 23.0, 20.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-6.375, -6.194091796875, -6.01318359375, -5.832275390625, -5.6513671875, -5.470458984375, -5.28955078125, -5.108642578125, -4.927734375, -4.746826171875, -4.56591796875, -4.385009765625, -4.2041015625, -4.023193359375, -3.84228515625, -3.661376953125, -3.48046875, -3.299560546875, -3.11865234375, -2.937744140625, -2.7568359375, -2.575927734375, -2.39501953125, -2.214111328125, -2.033203125, -1.852294921875, -1.67138671875, -1.490478515625, -1.3095703125, -1.128662109375, -0.94775390625, -0.766845703125, -0.5859375, -0.405029296875, -0.22412109375, -0.043212890625, 0.1376953125, 0.318603515625, 0.49951171875, 0.680419921875, 0.861328125, 1.042236328125, 1.22314453125, 1.404052734375, 1.5849609375, 1.765869140625, 1.94677734375, 2.127685546875, 2.30859375, 2.489501953125, 2.67041015625, 2.851318359375, 3.0322265625, 3.213134765625, 3.39404296875, 3.574951171875, 3.755859375, 3.936767578125, 4.11767578125, 4.298583984375, 4.4794921875, 4.660400390625, 4.84130859375, 5.022216796875, 5.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 6.0, 8.0, 15.0, 17.0, 22.0, 25.0, 20.0, 42.0, 48.0, 47.0, 54.0, 67.0, 66.0, 58.0, 67.0, 74.0, 59.0, 56.0, 49.0, 48.0, 29.0, 25.0, 17.0, 12.0, 18.0, 6.0, 10.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006871223449707031, -0.0006660297513008118, -0.0006449371576309204, -0.000623844563961029, -0.0006027519702911377, -0.0005816593766212463, -0.000560566782951355, -0.0005394741892814636, -0.0005183815956115723, -0.0004972890019416809, -0.00047619640827178955, -0.0004551038146018982, -0.00043401122093200684, -0.0004129186272621155, -0.0003918260335922241, -0.00037073343992233276, -0.0003496408462524414, -0.00032854825258255005, -0.0003074556589126587, -0.00028636306524276733, -0.000265270471572876, -0.0002441778779029846, -0.00022308528423309326, -0.0002019926905632019, -0.00018090009689331055, -0.0001598075032234192, -0.00013871490955352783, -0.00011762231588363647, -9.652972221374512e-05, -7.543712854385376e-05, -5.43445348739624e-05, -3.3251941204071045e-05, -1.2159347534179688e-05, 8.93324613571167e-06, 3.0025839805603027e-05, 5.1118433475494385e-05, 7.221102714538574e-05, 9.33036208152771e-05, 0.00011439621448516846, 0.00013548880815505981, 0.00015658140182495117, 0.00017767399549484253, 0.0001987665891647339, 0.00021985918283462524, 0.0002409517765045166, 0.00026204437017440796, 0.0002831369638442993, 0.0003042295575141907, 0.00032532215118408203, 0.0003464147448539734, 0.00036750733852386475, 0.0003885999321937561, 0.00040969252586364746, 0.0004307851195335388, 0.0004518777132034302, 0.00047297030687332153, 0.0004940629005432129, 0.0005151554942131042, 0.0005362480878829956, 0.000557340681552887, 0.0005784332752227783, 0.0005995258688926697, 0.000620618462562561, 0.0006417110562324524, 0.0006628036499023438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 6.0, 2.0, 3.0, 1.0, 8.0, 10.0, 21.0, 20.0, 43.0, 66.0, 78.0, 151.0, 248.0, 332.0, 528.0, 900.0, 1290.0, 1987.0, 3074.0, 4705.0, 7628.0, 12626.0, 21392.0, 36026.0, 59068.0, 90271.0, 123762.0, 147566.0, 150143.0, 128615.0, 95837.0, 63484.0, 39209.0, 23029.0, 13640.0, 8305.0, 5189.0, 3234.0, 2151.0, 1343.0, 898.0, 561.0, 343.0, 282.0, 170.0, 115.0, 74.0, 37.0, 31.0, 22.0, 15.0, 17.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.107177734375, -4.92529296875, -4.743408203125, -4.5615234375, -4.379638671875, -4.19775390625, -4.015869140625, -3.833984375, -3.652099609375, -3.47021484375, -3.288330078125, -3.1064453125, -2.924560546875, -2.74267578125, -2.560791015625, -2.37890625, -2.197021484375, -2.01513671875, -1.833251953125, -1.6513671875, -1.469482421875, -1.28759765625, -1.105712890625, -0.923828125, -0.741943359375, -0.56005859375, -0.378173828125, -0.1962890625, -0.014404296875, 0.16748046875, 0.349365234375, 0.53125, 0.713134765625, 0.89501953125, 1.076904296875, 1.2587890625, 1.440673828125, 1.62255859375, 1.804443359375, 1.986328125, 2.168212890625, 2.35009765625, 2.531982421875, 2.7138671875, 2.895751953125, 3.07763671875, 3.259521484375, 3.44140625, 3.623291015625, 3.80517578125, 3.987060546875, 4.1689453125, 4.350830078125, 4.53271484375, 4.714599609375, 4.896484375, 5.078369140625, 5.26025390625, 5.442138671875, 5.6240234375, 5.805908203125, 5.98779296875, 6.169677734375, 6.3515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 14.0, 12.0, 35.0, 28.0, 33.0, 46.0, 54.0, 55.0, 62.0, 69.0, 70.0, 60.0, 82.0, 59.0, 53.0, 53.0, 43.0, 32.0, 27.0, 26.0, 15.0, 13.0, 11.0, 8.0, 3.0, 2.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.348541259765625, -2.25762939453125, -2.166717529296875, -2.0758056640625, -1.984893798828125, -1.89398193359375, -1.803070068359375, -1.712158203125, -1.621246337890625, -1.53033447265625, -1.439422607421875, -1.3485107421875, -1.257598876953125, -1.16668701171875, -1.075775146484375, -0.98486328125, -0.893951416015625, -0.80303955078125, -0.712127685546875, -0.6212158203125, -0.530303955078125, -0.43939208984375, -0.348480224609375, -0.257568359375, -0.166656494140625, -0.07574462890625, 0.015167236328125, 0.1060791015625, 0.196990966796875, 0.28790283203125, 0.378814697265625, 0.4697265625, 0.560638427734375, 0.65155029296875, 0.742462158203125, 0.8333740234375, 0.924285888671875, 1.01519775390625, 1.106109619140625, 1.197021484375, 1.287933349609375, 1.37884521484375, 1.469757080078125, 1.5606689453125, 1.651580810546875, 1.74249267578125, 1.833404541015625, 1.92431640625, 2.015228271484375, 2.10614013671875, 2.197052001953125, 2.2879638671875, 2.378875732421875, 2.46978759765625, 2.560699462890625, 2.651611328125, 2.742523193359375, 2.83343505859375, 2.924346923828125, 3.0152587890625, 3.106170654296875, 3.19708251953125, 3.287994384765625, 3.37890625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 7.0, 12.0, 16.0, 16.0, 20.0, 18.0, 25.0, 25.0, 24.0, 36.0, 35.0, 37.0, 41.0, 47.0, 48.0, 41.0, 40.0, 43.0, 39.0, 58.0, 39.0, 34.0, 36.0, 31.0, 28.0, 27.0, 22.0, 27.0, 19.0, 19.0, 13.0, 15.0, 12.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.464649200439453, -14.96546459197998, -14.466279029846191, -13.967094421386719, -13.467909812927246, -12.968725204467773, -12.469539642333984, -11.970355033874512, -11.471170425415039, -10.971985816955566, -10.472800254821777, -9.973615646362305, -9.474431037902832, -8.97524642944336, -8.47606086730957, -7.976876258850098, -7.477690696716309, -6.978505611419678, -6.479321002960205, -5.980135917663574, -5.480951309204102, -4.981766223907471, -4.48258113861084, -3.983396291732788, -3.4842114448547363, -2.9850265979766846, -2.485841751098633, -1.986656665802002, -1.4874718189239502, -0.9882869720458984, -0.4891018867492676, 0.01008296012878418, 0.5092678070068359, 1.0084526538848877, 1.507637619972229, 2.0068225860595703, 2.506007432937622, 3.005192279815674, 3.5043773651123047, 4.003561973571777, 4.502747058868408, 5.001932144165039, 5.501116752624512, 6.000301837921143, 6.499486923217773, 6.998671531677246, 7.497856616973877, 7.997041702270508, 8.49622631072998, 8.995410919189453, 9.494596481323242, 9.993781089782715, 10.492965698242188, 10.992151260375977, 11.49133586883545, 11.990520477294922, 12.489706039428711, 12.988890647888184, 13.488076210021973, 13.987260818481445, 14.486445426940918, 14.98563003540039, 15.48481559753418, 15.984000205993652, 16.483184814453125]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 7.0, 6.0, 10.0, 10.0, 13.0, 14.0, 14.0, 17.0, 20.0, 10.0, 25.0, 20.0, 27.0, 38.0, 38.0, 32.0, 29.0, 39.0, 34.0, 44.0, 34.0, 42.0, 46.0, 42.0, 34.0, 42.0, 39.0, 28.0, 33.0, 26.0, 27.0, 25.0, 18.0, 20.0, 16.0, 12.0, 19.0, 7.0, 10.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.54252052307129, -21.81709861755371, -21.091678619384766, -20.366256713867188, -19.64083480834961, -18.915414810180664, -18.189992904663086, -17.46457290649414, -16.739151000976562, -16.013729095458984, -15.288309097290039, -14.562887191772461, -13.8374662399292, -13.112045288085938, -12.38662338256836, -11.661202430725098, -10.935781478881836, -10.210360527038574, -9.484939575195312, -8.759517669677734, -8.034096717834473, -7.308675765991211, -6.583254337310791, -5.857832908630371, -5.132411956787109, -4.406991004943848, -3.6815695762634277, -2.956148386001587, -2.230727195739746, -1.5053060054779053, -0.7798848152160645, -0.05446338653564453, 0.6709556579589844, 1.3963768482208252, 2.121798038482666, 2.847219228744507, 3.5726404190063477, 4.298061370849609, 5.023482799530029, 5.748904228210449, 6.474325180053711, 7.199746131896973, 7.925167560577393, 8.650588989257812, 9.376009941101074, 10.101430892944336, 10.826852798461914, 11.552273750305176, 12.277694702148438, 13.0031156539917, 13.728536605834961, 14.453958511352539, 15.1793794631958, 15.904800415039062, 16.63022232055664, 17.35564422607422, 18.081064224243164, 18.806486129760742, 19.531906127929688, 20.257328033447266, 20.982749938964844, 21.70816993713379, 22.433591842651367, 23.159011840820312, 23.88443374633789]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 10.0, 12.0, 15.0, 12.0, 22.0, 41.0, 37.0, 59.0, 79.0, 86.0, 137.0, 159.0, 242.0, 284.0, 400.0, 557.0, 759.0, 1032.0, 1376.0, 1800.0, 2551.0, 3451.0, 4541.0, 6185.0, 996794.0, 8391.0, 5531.0, 4141.0, 3105.0, 2338.0, 1679.0, 1189.0, 905.0, 628.0, 533.0, 390.0, 281.0, 217.0, 147.0, 134.0, 90.0, 68.0, 50.0, 40.0, 31.0, 26.0, 10.0, 10.0, 8.0, 12.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-162.41436767578125, -157.6148681640625, -152.8153533935547, -148.01585388183594, -143.2163543701172, -138.41685485839844, -133.61734008789062, -128.81784057617188, -124.01834106445312, -119.21883392333984, -114.4193344116211, -109.61982727050781, -104.82032775878906, -100.02082061767578, -95.2213134765625, -90.42181396484375, -85.62230682373047, -80.82279968261719, -76.02330017089844, -71.22379302978516, -66.4242935180664, -61.624786376953125, -56.82528305053711, -52.025779724121094, -47.22627639770508, -42.42677307128906, -37.62726974487305, -32.82776641845703, -28.028261184692383, -23.228757858276367, -18.42925262451172, -13.629749298095703, -8.830245971679688, -4.030742168426514, 0.7687616348266602, 5.568265914916992, 10.367769241333008, 15.167272567749023, 19.966777801513672, 24.766281127929688, 29.565784454345703, 34.36528778076172, 39.164791107177734, 43.96429443359375, 48.76380157470703, 53.56330108642578, 58.36280822753906, 63.16231155395508, 67.9618148803711, 72.76132202148438, 77.56082153320312, 82.3603286743164, 87.15982818603516, 91.95933532714844, 96.75883483886719, 101.55834197998047, 106.35784912109375, 111.15735626220703, 115.95685577392578, 120.75636291503906, 125.55586242675781, 130.35536193847656, 135.15487670898438, 139.95437622070312, 144.75387573242188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 10.0, 15.0, 15.0, 30.0, 20.0, 29.0, 47.0, 46.0, 54.0, 72.0, 87.0, 155.0, 217.0, 427.0, 910.0, 2096.0, 5734.0, 16542.0, 40503.0, 50511680.0, 827121.0, 39682.0, 16075.0, 5598.0, 2104.0, 981.0, 455.0, 237.0, 157.0, 89.0, 68.0, 49.0, 50.0, 38.0, 35.0, 16.0, 18.0, 11.0, 12.0, 9.0, 11.0, 6.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0], "bins": [-352.0, -342.21875, -332.4375, -322.65625, -312.875, -303.09375, -293.3125, -283.53125, -273.75, -263.96875, -254.1875, -244.40625, -234.625, -224.84375, -215.0625, -205.28125, -195.5, -185.71875, -175.9375, -166.15625, -156.375, -146.59375, -136.8125, -127.03125, -117.25, -107.46875, -97.6875, -87.90625, -78.125, -68.34375, -58.5625, -48.78125, -39.0, -29.21875, -19.4375, -9.65625, 0.125, 9.90625, 19.6875, 29.46875, 39.25, 49.03125, 58.8125, 68.59375, 78.375, 88.15625, 97.9375, 107.71875, 117.5, 127.28125, 137.0625, 146.84375, 156.625, 166.40625, 176.1875, 185.96875, 195.75, 205.53125, 215.3125, 225.09375, 234.875, 244.65625, 254.4375, 264.21875, 274.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 12.0, 13.0, 30.0, 30.0, 45.0, 64.0, 113.0, 166.0, 223.0, 324.0, 499.0, 768.0, 1184.0, 1836.0, 2879.0, 4591.0, 7417.0, 12544.0, 22032.0, 39386.0, 71864.0, 132506.0, 247226.0, 472997.0, 1063450.0, 2079350.0, 1082625.0, 484987.0, 253975.0, 137137.0, 73996.0, 40453.0, 23046.0, 12958.0, 7886.0, 4712.0, 2939.0, 1832.0, 1151.0, 733.0, 470.0, 325.0, 241.0, 141.0, 78.0, 63.0, 49.0, 32.0, 18.0, 12.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.2578125, -11.868896484375, -11.47998046875, -11.091064453125, -10.7021484375, -10.313232421875, -9.92431640625, -9.535400390625, -9.146484375, -8.757568359375, -8.36865234375, -7.979736328125, -7.5908203125, -7.201904296875, -6.81298828125, -6.424072265625, -6.03515625, -5.646240234375, -5.25732421875, -4.868408203125, -4.4794921875, -4.090576171875, -3.70166015625, -3.312744140625, -2.923828125, -2.534912109375, -2.14599609375, -1.757080078125, -1.3681640625, -0.979248046875, -0.59033203125, -0.201416015625, 0.1875, 0.576416015625, 0.96533203125, 1.354248046875, 1.7431640625, 2.132080078125, 2.52099609375, 2.909912109375, 3.298828125, 3.687744140625, 4.07666015625, 4.465576171875, 4.8544921875, 5.243408203125, 5.63232421875, 6.021240234375, 6.41015625, 6.799072265625, 7.18798828125, 7.576904296875, 7.9658203125, 8.354736328125, 8.74365234375, 9.132568359375, 9.521484375, 9.910400390625, 10.29931640625, 10.688232421875, 11.0771484375, 11.466064453125, 11.85498046875, 12.243896484375, 12.6328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 10.0, 21.0, 11.0, 24.0, 21.0, 33.0, 21.0, 39.0, 21.0, 29.0, 45.0, 34.0, 60.0, 95.0, 208.0, 320.0, 308.0, 148.0, 107.0, 50.0, 46.0, 47.0, 39.0, 23.0, 28.0, 23.0, 23.0, 31.0, 37.0, 15.0, 13.0, 17.0, 18.0, 5.0, 10.0, 8.0, 6.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.828125, -26.973388671875, -26.11865234375, -25.263916015625, -24.4091796875, -23.554443359375, -22.69970703125, -21.844970703125, -20.990234375, -20.135498046875, -19.28076171875, -18.426025390625, -17.5712890625, -16.716552734375, -15.86181640625, -15.007080078125, -14.15234375, -13.297607421875, -12.44287109375, -11.588134765625, -10.7333984375, -9.878662109375, -9.02392578125, -8.169189453125, -7.314453125, -6.459716796875, -5.60498046875, -4.750244140625, -3.8955078125, -3.040771484375, -2.18603515625, -1.331298828125, -0.4765625, 0.378173828125, 1.23291015625, 2.087646484375, 2.9423828125, 3.797119140625, 4.65185546875, 5.506591796875, 6.361328125, 7.216064453125, 8.07080078125, 8.925537109375, 9.7802734375, 10.635009765625, 11.48974609375, 12.344482421875, 13.19921875, 14.053955078125, 14.90869140625, 15.763427734375, 16.6181640625, 17.472900390625, 18.32763671875, 19.182373046875, 20.037109375, 20.891845703125, 21.74658203125, 22.601318359375, 23.4560546875, 24.310791015625, 25.16552734375, 26.020263671875, 26.875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 17.0, 20.0, 33.0, 61.0, 85.0, 136.0, 181.0, 306.0, 554.0, 974.0, 1766.0, 3212.0, 5464.0, 9749.0, 16684.0, 28941.0, 49328.0, 83386.0, 139216.0, 226078.0, 369187.0, 795465.0, 2436847.0, 1067710.0, 424232.0, 250787.0, 154952.0, 93929.0, 55386.0, 32200.0, 18759.0, 11096.0, 6391.0, 3564.0, 1978.0, 1123.0, 661.0, 336.0, 204.0, 147.0, 80.0, 51.0, 32.0, 25.0, 17.0, 21.0, 11.0, 10.0, 5.0, 9.0, 3.0, 3.0, 4.0], "bins": [-8.6015625, -8.34564208984375, -8.0897216796875, -7.83380126953125, -7.577880859375, -7.32196044921875, -7.0660400390625, -6.81011962890625, -6.55419921875, -6.29827880859375, -6.0423583984375, -5.78643798828125, -5.530517578125, -5.27459716796875, -5.0186767578125, -4.76275634765625, -4.5068359375, -4.25091552734375, -3.9949951171875, -3.73907470703125, -3.483154296875, -3.22723388671875, -2.9713134765625, -2.71539306640625, -2.45947265625, -2.20355224609375, -1.9476318359375, -1.69171142578125, -1.435791015625, -1.17987060546875, -0.9239501953125, -0.66802978515625, -0.412109375, -0.15618896484375, 0.0997314453125, 0.35565185546875, 0.611572265625, 0.86749267578125, 1.1234130859375, 1.37933349609375, 1.63525390625, 1.89117431640625, 2.1470947265625, 2.40301513671875, 2.658935546875, 2.91485595703125, 3.1707763671875, 3.42669677734375, 3.6826171875, 3.93853759765625, 4.1944580078125, 4.45037841796875, 4.706298828125, 4.96221923828125, 5.2181396484375, 5.47406005859375, 5.72998046875, 5.98590087890625, 6.2418212890625, 6.49774169921875, 6.753662109375, 7.00958251953125, 7.2655029296875, 7.52142333984375, 7.77734375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 11.0, 7.0, 11.0, 7.0, 14.0, 14.0, 16.0, 21.0, 23.0, 21.0, 21.0, 28.0, 23.0, 29.0, 22.0, 24.0, 26.0, 37.0, 67.0, 111.0, 255.0, 425.0, 245.0, 95.0, 47.0, 38.0, 40.0, 40.0, 30.0, 30.0, 33.0, 23.0, 24.0, 13.0, 18.0, 22.0, 10.0, 15.0, 10.0, 14.0, 13.0, 8.0, 6.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-31.984375, -30.980224609375, -29.97607421875, -28.971923828125, -27.9677734375, -26.963623046875, -25.95947265625, -24.955322265625, -23.951171875, -22.947021484375, -21.94287109375, -20.938720703125, -19.9345703125, -18.930419921875, -17.92626953125, -16.922119140625, -15.91796875, -14.913818359375, -13.90966796875, -12.905517578125, -11.9013671875, -10.897216796875, -9.89306640625, -8.888916015625, -7.884765625, -6.880615234375, -5.87646484375, -4.872314453125, -3.8681640625, -2.864013671875, -1.85986328125, -0.855712890625, 0.1484375, 1.152587890625, 2.15673828125, 3.160888671875, 4.1650390625, 5.169189453125, 6.17333984375, 7.177490234375, 8.181640625, 9.185791015625, 10.18994140625, 11.194091796875, 12.1982421875, 13.202392578125, 14.20654296875, 15.210693359375, 16.21484375, 17.218994140625, 18.22314453125, 19.227294921875, 20.2314453125, 21.235595703125, 22.23974609375, 23.243896484375, 24.248046875, 25.252197265625, 26.25634765625, 27.260498046875, 28.2646484375, 29.268798828125, 30.27294921875, 31.277099609375, 32.28125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 11.0, 8.0, 8.0, 7.0, 14.0, 30.0, 13.0, 36.0, 48.0, 55.0, 90.0, 118.0, 188.0, 240.0, 473.0, 898.0, 1537.0, 2670.0, 5060.0, 9952.0, 20983.0, 47993.0, 126867.0, 5703478.0, 242249.0, 71381.0, 29293.0, 13249.0, 6501.0, 3455.0, 1770.0, 1051.0, 587.0, 356.0, 256.0, 128.0, 87.0, 79.0, 65.0, 45.0, 28.0, 13.0, 10.0, 7.0, 7.0, 6.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0], "bins": [-42.59375, -41.29150390625, -39.9892578125, -38.68701171875, -37.384765625, -36.08251953125, -34.7802734375, -33.47802734375, -32.17578125, -30.87353515625, -29.5712890625, -28.26904296875, -26.966796875, -25.66455078125, -24.3623046875, -23.06005859375, -21.7578125, -20.45556640625, -19.1533203125, -17.85107421875, -16.548828125, -15.24658203125, -13.9443359375, -12.64208984375, -11.33984375, -10.03759765625, -8.7353515625, -7.43310546875, -6.130859375, -4.82861328125, -3.5263671875, -2.22412109375, -0.921875, 0.38037109375, 1.6826171875, 2.98486328125, 4.287109375, 5.58935546875, 6.8916015625, 8.19384765625, 9.49609375, 10.79833984375, 12.1005859375, 13.40283203125, 14.705078125, 16.00732421875, 17.3095703125, 18.61181640625, 19.9140625, 21.21630859375, 22.5185546875, 23.82080078125, 25.123046875, 26.42529296875, 27.7275390625, 29.02978515625, 30.33203125, 31.63427734375, 32.9365234375, 34.23876953125, 35.541015625, 36.84326171875, 38.1455078125, 39.44775390625, 40.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 11.0, 16.0, 22.0, 20.0, 12.0, 20.0, 25.0, 30.0, 21.0, 30.0, 43.0, 40.0, 31.0, 55.0, 90.0, 445.0, 536.0, 97.0, 56.0, 36.0, 46.0, 28.0, 27.0, 43.0, 22.0, 27.0, 28.0, 22.0, 18.0, 19.0, 19.0, 19.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-67.1875, -65.17041015625, -63.1533203125, -61.13623046875, -59.119140625, -57.10205078125, -55.0849609375, -53.06787109375, -51.05078125, -49.03369140625, -47.0166015625, -44.99951171875, -42.982421875, -40.96533203125, -38.9482421875, -36.93115234375, -34.9140625, -32.89697265625, -30.8798828125, -28.86279296875, -26.845703125, -24.82861328125, -22.8115234375, -20.79443359375, -18.77734375, -16.76025390625, -14.7431640625, -12.72607421875, -10.708984375, -8.69189453125, -6.6748046875, -4.65771484375, -2.640625, -0.62353515625, 1.3935546875, 3.41064453125, 5.427734375, 7.44482421875, 9.4619140625, 11.47900390625, 13.49609375, 15.51318359375, 17.5302734375, 19.54736328125, 21.564453125, 23.58154296875, 25.5986328125, 27.61572265625, 29.6328125, 31.64990234375, 33.6669921875, 35.68408203125, 37.701171875, 39.71826171875, 41.7353515625, 43.75244140625, 45.76953125, 47.78662109375, 49.8037109375, 51.82080078125, 53.837890625, 55.85498046875, 57.8720703125, 59.88916015625, 61.90625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 16.0, 33.0, 40.0, 55.0, 123.0, 247.0, 240.0, 95.0, 36.0, 29.0, 20.0, 17.0, 12.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-853.69775390625, -827.048828125, -800.39990234375, -773.7509765625, -747.10205078125, -720.453125, -693.8042602539062, -667.1553344726562, -640.5064086914062, -613.8574829101562, -587.2085571289062, -560.5596313476562, -533.9107666015625, -507.2618103027344, -480.6129150390625, -453.9639892578125, -427.3150634765625, -400.6661376953125, -374.0172119140625, -347.3683166503906, -320.7193908691406, -294.0704650878906, -267.42156982421875, -240.77264404296875, -214.12371826171875, -187.47479248046875, -160.8258819580078, -134.17697143554688, -107.52804565429688, -80.87911987304688, -54.23020935058594, -27.581298828125, -0.93243408203125, 25.71648406982422, 52.36540222167969, 79.01432037353516, 105.66323852539062, 132.31216430664062, 158.96107482910156, 185.6099853515625, 212.2589111328125, 238.9078369140625, 265.5567626953125, 292.2056579589844, 318.8545837402344, 345.5035095214844, 372.15240478515625, 398.80133056640625, 425.45025634765625, 452.09918212890625, 478.74810791015625, 505.3970031738281, 532.0458984375, 558.69482421875, 585.34375, 611.99267578125, 638.6416015625, 665.29052734375, 691.939453125, 718.58837890625, 745.2373046875, 771.88623046875, 798.5350952148438, 825.1840209960938, 851.8329467773438]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 10.0, 13.0, 16.0, 17.0, 20.0, 21.0, 32.0, 44.0, 68.0, 85.0, 146.0, 116.0, 86.0, 55.0, 40.0, 34.0, 22.0, 16.0, 22.0, 11.0, 10.0, 5.0, 10.0, 9.0, 8.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-1200.2208251953125, -1167.5484619140625, -1134.876220703125, -1102.203857421875, -1069.5316162109375, -1036.8592529296875, -1004.1869506835938, -971.5146484375, -938.84228515625, -906.1699829101562, -873.4976806640625, -840.8253173828125, -808.1530151367188, -775.480712890625, -742.8084106445312, -710.1361083984375, -677.4638061523438, -644.79150390625, -612.1192016601562, -579.4468994140625, -546.7745361328125, -514.1022338867188, -481.429931640625, -448.75762939453125, -416.0852966308594, -383.4129943847656, -350.74066162109375, -318.068359375, -285.39605712890625, -252.72372436523438, -220.05142211914062, -187.3791046142578, -154.70672607421875, -122.03440856933594, -89.36209869384766, -56.689788818359375, -24.017471313476562, 8.65484619140625, 41.3271484375, 73.99946594238281, 106.67178344726562, 139.34410095214844, 172.01641845703125, 204.688720703125, 237.3610382080078, 270.0333557128906, 302.7056579589844, 335.37799072265625, 368.05029296875, 400.72259521484375, 433.3949279785156, 466.0672302246094, 498.73956298828125, 531.411865234375, 564.0841674804688, 596.7564697265625, 629.4288330078125, 662.1011352539062, 694.7734375, 727.44580078125, 760.1181030273438, 792.7904052734375, 825.4627075195312, 858.135009765625, 890.8073120117188]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 0.0, 6.0, 5.0, 9.0, 7.0, 20.0, 24.0, 40.0, 62.0, 103.0, 147.0, 226.0, 312.0, 434.0, 679.0, 982.0, 1514.0, 2106.0, 3281.0, 5382.0, 8803.0, 15641.0, 30721.0, 73874.0, 329080.0, 3432708.0, 161775.0, 56034.0, 27933.0, 15704.0, 9489.0, 5959.0, 3789.0, 2385.0, 1644.0, 1017.0, 751.0, 522.0, 314.0, 218.0, 169.0, 120.0, 95.0, 62.0, 49.0, 23.0, 12.0, 24.0, 8.0, 8.0, 6.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.43548583984375, -4.2733154296875, -4.11114501953125, -3.948974609375, -3.78680419921875, -3.6246337890625, -3.46246337890625, -3.30029296875, -3.13812255859375, -2.9759521484375, -2.81378173828125, -2.651611328125, -2.48944091796875, -2.3272705078125, -2.16510009765625, -2.0029296875, -1.84075927734375, -1.6785888671875, -1.51641845703125, -1.354248046875, -1.19207763671875, -1.0299072265625, -0.86773681640625, -0.70556640625, -0.54339599609375, -0.3812255859375, -0.21905517578125, -0.056884765625, 0.10528564453125, 0.2674560546875, 0.42962646484375, 0.591796875, 0.75396728515625, 0.9161376953125, 1.07830810546875, 1.240478515625, 1.40264892578125, 1.5648193359375, 1.72698974609375, 1.88916015625, 2.05133056640625, 2.2135009765625, 2.37567138671875, 2.537841796875, 2.70001220703125, 2.8621826171875, 3.02435302734375, 3.1865234375, 3.34869384765625, 3.5108642578125, 3.67303466796875, 3.835205078125, 3.99737548828125, 4.1595458984375, 4.32171630859375, 4.48388671875, 4.64605712890625, 4.8082275390625, 4.97039794921875, 5.132568359375, 5.29473876953125, 5.4569091796875, 5.61907958984375, 5.78125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 8.0, 4.0, 5.0, 10.0, 16.0, 10.0, 30.0, 39.0, 55.0, 380.0, 247.0, 54.0, 37.0, 9.0, 11.0, 15.0, 4.0, 10.0, 3.0, 0.0, 1.0, 7.0, 2.0, 9.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7509765625, -1.6945037841796875, -1.638031005859375, -1.5815582275390625, -1.52508544921875, -1.4686126708984375, -1.412139892578125, -1.3556671142578125, -1.2991943359375, -1.2427215576171875, -1.186248779296875, -1.1297760009765625, -1.07330322265625, -1.0168304443359375, -0.960357666015625, -0.9038848876953125, -0.847412109375, -0.7909393310546875, -0.734466552734375, -0.6779937744140625, -0.62152099609375, -0.5650482177734375, -0.508575439453125, -0.4521026611328125, -0.3956298828125, -0.3391571044921875, -0.282684326171875, -0.2262115478515625, -0.16973876953125, -0.1132659912109375, -0.056793212890625, -0.0003204345703125, 0.05615234375, 0.1126251220703125, 0.169097900390625, 0.2255706787109375, 0.28204345703125, 0.3385162353515625, 0.394989013671875, 0.4514617919921875, 0.5079345703125, 0.5644073486328125, 0.620880126953125, 0.6773529052734375, 0.73382568359375, 0.7902984619140625, 0.846771240234375, 0.9032440185546875, 0.959716796875, 1.0161895751953125, 1.072662353515625, 1.1291351318359375, 1.18560791015625, 1.2420806884765625, 1.298553466796875, 1.3550262451171875, 1.4114990234375, 1.4679718017578125, 1.524444580078125, 1.5809173583984375, 1.63739013671875, 1.6938629150390625, 1.750335693359375, 1.8068084716796875, 1.86328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 8.0, 8.0, 11.0, 18.0, 36.0, 39.0, 68.0, 94.0, 122.0, 183.0, 295.0, 443.0, 827.0, 1530.0, 2818.0, 5923.0, 13943.0, 39165.0, 140149.0, 752827.0, 2562071.0, 514992.0, 106442.0, 31108.0, 11241.0, 4767.0, 2224.0, 1156.0, 674.0, 387.0, 235.0, 155.0, 98.0, 62.0, 51.0, 31.0, 22.0, 15.0, 4.0, 11.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.247802734375, -4.11669921875, -3.985595703125, -3.8544921875, -3.723388671875, -3.59228515625, -3.461181640625, -3.330078125, -3.198974609375, -3.06787109375, -2.936767578125, -2.8056640625, -2.674560546875, -2.54345703125, -2.412353515625, -2.28125, -2.150146484375, -2.01904296875, -1.887939453125, -1.7568359375, -1.625732421875, -1.49462890625, -1.363525390625, -1.232421875, -1.101318359375, -0.97021484375, -0.839111328125, -0.7080078125, -0.576904296875, -0.44580078125, -0.314697265625, -0.18359375, -0.052490234375, 0.07861328125, 0.209716796875, 0.3408203125, 0.471923828125, 0.60302734375, 0.734130859375, 0.865234375, 0.996337890625, 1.12744140625, 1.258544921875, 1.3896484375, 1.520751953125, 1.65185546875, 1.782958984375, 1.9140625, 2.045166015625, 2.17626953125, 2.307373046875, 2.4384765625, 2.569580078125, 2.70068359375, 2.831787109375, 2.962890625, 3.093994140625, 3.22509765625, 3.356201171875, 3.4873046875, 3.618408203125, 3.74951171875, 3.880615234375, 4.01171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 17.0, 6.0, 25.0, 29.0, 31.0, 71.0, 96.0, 102.0, 146.0, 222.0, 297.0, 407.0, 639.0, 548.0, 425.0, 250.0, 218.0, 143.0, 94.0, 76.0, 55.0, 38.0, 35.0, 22.0, 21.0, 6.0, 8.0, 7.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.708984375, -2.631317138671875, -2.55364990234375, -2.475982666015625, -2.3983154296875, -2.320648193359375, -2.24298095703125, -2.165313720703125, -2.087646484375, -2.009979248046875, -1.93231201171875, -1.854644775390625, -1.7769775390625, -1.699310302734375, -1.62164306640625, -1.543975830078125, -1.46630859375, -1.388641357421875, -1.31097412109375, -1.233306884765625, -1.1556396484375, -1.077972412109375, -1.00030517578125, -0.922637939453125, -0.844970703125, -0.767303466796875, -0.68963623046875, -0.611968994140625, -0.5343017578125, -0.456634521484375, -0.37896728515625, -0.301300048828125, -0.2236328125, -0.145965576171875, -0.06829833984375, 0.009368896484375, 0.0870361328125, 0.164703369140625, 0.24237060546875, 0.320037841796875, 0.397705078125, 0.475372314453125, 0.55303955078125, 0.630706787109375, 0.7083740234375, 0.786041259765625, 0.86370849609375, 0.941375732421875, 1.01904296875, 1.096710205078125, 1.17437744140625, 1.252044677734375, 1.3297119140625, 1.407379150390625, 1.48504638671875, 1.562713623046875, 1.640380859375, 1.718048095703125, 1.79571533203125, 1.873382568359375, 1.9510498046875, 2.028717041015625, 2.10638427734375, 2.184051513671875, 2.26171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 11.0, 15.0, 21.0, 39.0, 52.0, 133.0, 169.0, 177.0, 167.0, 93.0, 50.0, 21.0, 22.0, 9.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.085464477539062, -10.592352867126465, -10.09924030303955, -9.606128692626953, -9.113016128540039, -8.619904518127441, -8.126792907714844, -7.63368034362793, -7.140568733215332, -6.647456645965576, -6.15434455871582, -5.661232948303223, -5.168120861053467, -4.675008773803711, -4.181896686553955, -3.6887848377227783, -3.1956725120544434, -2.7025604248046875, -2.2094485759735107, -1.7163364887237549, -1.2232245206832886, -0.7301125526428223, -0.2370004653930664, 0.25611138343811035, 0.7492234706878662, 1.2423354387283325, 1.7354474067687988, 2.2285594940185547, 2.7216715812683105, 3.2147834300994873, 3.707895517349243, 4.20100736618042, 4.694119453430176, 5.187231540679932, 5.6803436279296875, 6.173455238342285, 6.666567325592041, 7.159679412841797, 7.652791500091553, 8.145903587341309, 8.639015197753906, 9.132126808166504, 9.625239372253418, 10.118350982666016, 10.61146354675293, 11.104575157165527, 11.597686767578125, 12.090799331665039, 12.583911895751953, 13.07702350616455, 13.570136070251465, 14.063247680664062, 14.556360244750977, 15.049471855163574, 15.542583465576172, 16.035696029663086, 16.528806686401367, 17.02191925048828, 17.515029907226562, 18.008142471313477, 18.50125503540039, 18.994365692138672, 19.487478256225586, 19.9805908203125, 20.473703384399414]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 5.0, 10.0, 9.0, 6.0, 15.0, 22.0, 22.0, 24.0, 26.0, 40.0, 26.0, 28.0, 44.0, 33.0, 36.0, 45.0, 52.0, 40.0, 56.0, 59.0, 46.0, 46.0, 31.0, 46.0, 30.0, 27.0, 30.0, 25.0, 19.0, 21.0, 18.0, 5.0, 11.0, 9.0, 9.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.630636215209961, -12.234087944030762, -11.837539672851562, -11.440991401672363, -11.044443130493164, -10.647893905639648, -10.25134563446045, -9.85479736328125, -9.45824909210205, -9.061700820922852, -8.665152549743652, -8.268604278564453, -7.872055530548096, -7.4755072593688965, -7.078958511352539, -6.68241024017334, -6.285861968994141, -5.889313697814941, -5.492765426635742, -5.096216678619385, -4.6996684074401855, -4.303120136260986, -3.906571626663208, -3.5100231170654297, -3.1134748458862305, -2.7169265747070312, -2.320378065109253, -1.9238296747207642, -1.5272812843322754, -1.1307328939437866, -0.7341845035552979, -0.33763599395751953, 0.05891227722167969, 0.45546066761016846, 0.8520090579986572, 1.248557448387146, 1.6451058387756348, 2.041654109954834, 2.4382026195526123, 2.8347511291503906, 3.23129940032959, 3.627847671508789, 4.024395942687988, 4.420944690704346, 4.817492961883545, 5.214041233062744, 5.610589981079102, 6.007138252258301, 6.4036865234375, 6.800234794616699, 7.196783065795898, 7.593331813812256, 7.989880084991455, 8.386428833007812, 8.782977104187012, 9.179525375366211, 9.57607364654541, 9.97262191772461, 10.369170188903809, 10.765718460083008, 11.162267684936523, 11.558815956115723, 11.955364227294922, 12.351912498474121, 12.74846076965332]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 5.0, 17.0, 18.0, 30.0, 58.0, 61.0, 79.0, 107.0, 163.0, 198.0, 284.0, 393.0, 542.0, 742.0, 1025.0, 1407.0, 2077.0, 3119.0, 4796.0, 7945.0, 14429.0, 32000.0, 144716.0, 697088.0, 80775.0, 24091.0, 11686.0, 6806.0, 4295.0, 2807.0, 1882.0, 1353.0, 974.0, 703.0, 502.0, 377.0, 261.0, 188.0, 164.0, 110.0, 99.0, 47.0, 45.0, 24.0, 18.0, 19.0, 4.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.25, -4.11865234375, -3.9873046875, -3.85595703125, -3.724609375, -3.59326171875, -3.4619140625, -3.33056640625, -3.19921875, -3.06787109375, -2.9365234375, -2.80517578125, -2.673828125, -2.54248046875, -2.4111328125, -2.27978515625, -2.1484375, -2.01708984375, -1.8857421875, -1.75439453125, -1.623046875, -1.49169921875, -1.3603515625, -1.22900390625, -1.09765625, -0.96630859375, -0.8349609375, -0.70361328125, -0.572265625, -0.44091796875, -0.3095703125, -0.17822265625, -0.046875, 0.08447265625, 0.2158203125, 0.34716796875, 0.478515625, 0.60986328125, 0.7412109375, 0.87255859375, 1.00390625, 1.13525390625, 1.2666015625, 1.39794921875, 1.529296875, 1.66064453125, 1.7919921875, 1.92333984375, 2.0546875, 2.18603515625, 2.3173828125, 2.44873046875, 2.580078125, 2.71142578125, 2.8427734375, 2.97412109375, 3.10546875, 3.23681640625, 3.3681640625, 3.49951171875, 3.630859375, 3.76220703125, 3.8935546875, 4.02490234375, 4.15625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 6.0, 11.0, 15.0, 15.0, 17.0, 22.0, 50.0, 90.0, 195.0, 225.0, 132.0, 72.0, 36.0, 10.0, 15.0, 9.0, 9.0, 3.0, 7.0, 4.0, 2.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5478515625, -1.49322509765625, -1.4385986328125, -1.38397216796875, -1.329345703125, -1.27471923828125, -1.2200927734375, -1.16546630859375, -1.11083984375, -1.05621337890625, -1.0015869140625, -0.94696044921875, -0.892333984375, -0.83770751953125, -0.7830810546875, -0.72845458984375, -0.673828125, -0.61920166015625, -0.5645751953125, -0.50994873046875, -0.455322265625, -0.40069580078125, -0.3460693359375, -0.29144287109375, -0.23681640625, -0.18218994140625, -0.1275634765625, -0.07293701171875, -0.018310546875, 0.03631591796875, 0.0909423828125, 0.14556884765625, 0.2001953125, 0.25482177734375, 0.3094482421875, 0.36407470703125, 0.418701171875, 0.47332763671875, 0.5279541015625, 0.58258056640625, 0.63720703125, 0.69183349609375, 0.7464599609375, 0.80108642578125, 0.855712890625, 0.91033935546875, 0.9649658203125, 1.01959228515625, 1.07421875, 1.12884521484375, 1.1834716796875, 1.23809814453125, 1.292724609375, 1.34735107421875, 1.4019775390625, 1.45660400390625, 1.51123046875, 1.56585693359375, 1.6204833984375, 1.67510986328125, 1.729736328125, 1.78436279296875, 1.8389892578125, 1.89361572265625, 1.9482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 8.0, 6.0, 13.0, 13.0, 18.0, 18.0, 36.0, 36.0, 56.0, 62.0, 107.0, 160.0, 256.0, 452.0, 765.0, 1311.0, 2487.0, 4792.0, 10423.0, 24659.0, 67689.0, 235327.0, 485519.0, 136750.0, 44390.0, 17412.0, 7612.0, 3602.0, 1912.0, 1065.0, 557.0, 361.0, 229.0, 153.0, 75.0, 61.0, 36.0, 29.0, 23.0, 16.0, 16.0, 9.0, 13.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.26953125, -5.11590576171875, -4.9622802734375, -4.80865478515625, -4.655029296875, -4.50140380859375, -4.3477783203125, -4.19415283203125, -4.04052734375, -3.88690185546875, -3.7332763671875, -3.57965087890625, -3.426025390625, -3.27239990234375, -3.1187744140625, -2.96514892578125, -2.8115234375, -2.65789794921875, -2.5042724609375, -2.35064697265625, -2.197021484375, -2.04339599609375, -1.8897705078125, -1.73614501953125, -1.58251953125, -1.42889404296875, -1.2752685546875, -1.12164306640625, -0.968017578125, -0.81439208984375, -0.6607666015625, -0.50714111328125, -0.353515625, -0.19989013671875, -0.0462646484375, 0.10736083984375, 0.260986328125, 0.41461181640625, 0.5682373046875, 0.72186279296875, 0.87548828125, 1.02911376953125, 1.1827392578125, 1.33636474609375, 1.489990234375, 1.64361572265625, 1.7972412109375, 1.95086669921875, 2.1044921875, 2.25811767578125, 2.4117431640625, 2.56536865234375, 2.718994140625, 2.87261962890625, 3.0262451171875, 3.17987060546875, 3.33349609375, 3.48712158203125, 3.6407470703125, 3.79437255859375, 3.947998046875, 4.10162353515625, 4.2552490234375, 4.40887451171875, 4.5625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 4.0, 1.0, 6.0, 4.0, 7.0, 10.0, 14.0, 18.0, 16.0, 20.0, 15.0, 30.0, 35.0, 41.0, 35.0, 45.0, 32.0, 51.0, 64.0, 47.0, 28.0, 48.0, 44.0, 35.0, 32.0, 35.0, 40.0, 36.0, 31.0, 36.0, 17.0, 27.0, 18.0, 14.0, 9.0, 14.0, 2.0, 8.0, 15.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.15087890625, -6.9150390625, -6.67919921875, -6.443359375, -6.20751953125, -5.9716796875, -5.73583984375, -5.5, -5.26416015625, -5.0283203125, -4.79248046875, -4.556640625, -4.32080078125, -4.0849609375, -3.84912109375, -3.61328125, -3.37744140625, -3.1416015625, -2.90576171875, -2.669921875, -2.43408203125, -2.1982421875, -1.96240234375, -1.7265625, -1.49072265625, -1.2548828125, -1.01904296875, -0.783203125, -0.54736328125, -0.3115234375, -0.07568359375, 0.16015625, 0.39599609375, 0.6318359375, 0.86767578125, 1.103515625, 1.33935546875, 1.5751953125, 1.81103515625, 2.046875, 2.28271484375, 2.5185546875, 2.75439453125, 2.990234375, 3.22607421875, 3.4619140625, 3.69775390625, 3.93359375, 4.16943359375, 4.4052734375, 4.64111328125, 4.876953125, 5.11279296875, 5.3486328125, 5.58447265625, 5.8203125, 6.05615234375, 6.2919921875, 6.52783203125, 6.763671875, 6.99951171875, 7.2353515625, 7.47119140625, 7.70703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 15.0, 30.0, 49.0, 59.0, 103.0, 219.0, 396.0, 849.0, 2364.0, 8999.0, 66734.0, 872577.0, 81367.0, 10191.0, 2701.0, 977.0, 433.0, 212.0, 91.0, 65.0, 46.0, 26.0, 9.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.58111572265625, -5.3536376953125, -5.12615966796875, -4.898681640625, -4.67120361328125, -4.4437255859375, -4.21624755859375, -3.98876953125, -3.76129150390625, -3.5338134765625, -3.30633544921875, -3.078857421875, -2.85137939453125, -2.6239013671875, -2.39642333984375, -2.1689453125, -1.94146728515625, -1.7139892578125, -1.48651123046875, -1.259033203125, -1.03155517578125, -0.8040771484375, -0.57659912109375, -0.34912109375, -0.12164306640625, 0.1058349609375, 0.33331298828125, 0.560791015625, 0.78826904296875, 1.0157470703125, 1.24322509765625, 1.470703125, 1.69818115234375, 1.9256591796875, 2.15313720703125, 2.380615234375, 2.60809326171875, 2.8355712890625, 3.06304931640625, 3.29052734375, 3.51800537109375, 3.7454833984375, 3.97296142578125, 4.200439453125, 4.42791748046875, 4.6553955078125, 4.88287353515625, 5.1103515625, 5.33782958984375, 5.5653076171875, 5.79278564453125, 6.020263671875, 6.24774169921875, 6.4752197265625, 6.70269775390625, 6.93017578125, 7.15765380859375, 7.3851318359375, 7.61260986328125, 7.840087890625, 8.06756591796875, 8.2950439453125, 8.52252197265625, 8.75]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 8.0, 15.0, 15.0, 34.0, 33.0, 54.0, 69.0, 84.0, 109.0, 92.0, 120.0, 74.0, 62.0, 58.0, 39.0, 42.0, 25.0, 20.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010991096496582031, -0.00010643899440765381, -0.0001029670238494873, -9.94950532913208e-05, -9.60230827331543e-05, -9.255111217498779e-05, -8.907914161682129e-05, -8.560717105865479e-05, -8.213520050048828e-05, -7.866322994232178e-05, -7.519125938415527e-05, -7.171928882598877e-05, -6.824731826782227e-05, -6.477534770965576e-05, -6.130337715148926e-05, -5.7831406593322754e-05, -5.435943603515625e-05, -5.0887465476989746e-05, -4.741549491882324e-05, -4.394352436065674e-05, -4.0471553802490234e-05, -3.699958324432373e-05, -3.3527612686157227e-05, -3.0055642127990723e-05, -2.658367156982422e-05, -2.3111701011657715e-05, -1.963973045349121e-05, -1.6167759895324707e-05, -1.2695789337158203e-05, -9.2238187789917e-06, -5.751848220825195e-06, -2.2798776626586914e-06, 1.1920928955078125e-06, 4.664063453674316e-06, 8.13603401184082e-06, 1.1608004570007324e-05, 1.5079975128173828e-05, 1.8551945686340332e-05, 2.2023916244506836e-05, 2.549588680267334e-05, 2.8967857360839844e-05, 3.243982791900635e-05, 3.591179847717285e-05, 3.9383769035339355e-05, 4.285573959350586e-05, 4.632771015167236e-05, 4.979968070983887e-05, 5.327165126800537e-05, 5.6743621826171875e-05, 6.021559238433838e-05, 6.368756294250488e-05, 6.715953350067139e-05, 7.063150405883789e-05, 7.41034746170044e-05, 7.75754451751709e-05, 8.10474157333374e-05, 8.45193862915039e-05, 8.799135684967041e-05, 9.146332740783691e-05, 9.493529796600342e-05, 9.840726852416992e-05, 0.00010187923908233643, 0.00010535120964050293, 0.00010882318019866943, 0.00011229515075683594]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 6.0, 13.0, 15.0, 21.0, 24.0, 63.0, 65.0, 108.0, 166.0, 270.0, 526.0, 1006.0, 2071.0, 4646.0, 13297.0, 48338.0, 277540.0, 564367.0, 99706.0, 22981.0, 7472.0, 2935.0, 1271.0, 596.0, 433.0, 207.0, 136.0, 79.0, 62.0, 28.0, 31.0, 23.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.0234375, -3.9058837890625, -3.788330078125, -3.6707763671875, -3.55322265625, -3.4356689453125, -3.318115234375, -3.2005615234375, -3.0830078125, -2.9654541015625, -2.847900390625, -2.7303466796875, -2.61279296875, -2.4952392578125, -2.377685546875, -2.2601318359375, -2.142578125, -2.0250244140625, -1.907470703125, -1.7899169921875, -1.67236328125, -1.5548095703125, -1.437255859375, -1.3197021484375, -1.2021484375, -1.0845947265625, -0.967041015625, -0.8494873046875, -0.73193359375, -0.6143798828125, -0.496826171875, -0.3792724609375, -0.26171875, -0.1441650390625, -0.026611328125, 0.0909423828125, 0.20849609375, 0.3260498046875, 0.443603515625, 0.5611572265625, 0.6787109375, 0.7962646484375, 0.913818359375, 1.0313720703125, 1.14892578125, 1.2664794921875, 1.384033203125, 1.5015869140625, 1.619140625, 1.7366943359375, 1.854248046875, 1.9718017578125, 2.08935546875, 2.2069091796875, 2.324462890625, 2.4420166015625, 2.5595703125, 2.6771240234375, 2.794677734375, 2.9122314453125, 3.02978515625, 3.1473388671875, 3.264892578125, 3.3824462890625, 3.5]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 8.0, 19.0, 21.0, 18.0, 32.0, 47.0, 37.0, 67.0, 59.0, 75.0, 69.0, 73.0, 71.0, 63.0, 58.0, 57.0, 35.0, 35.0, 29.0, 27.0, 19.0, 13.0, 10.0, 3.0, 8.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.502777099609375, -3.38250732421875, -3.262237548828125, -3.1419677734375, -3.021697998046875, -2.90142822265625, -2.781158447265625, -2.660888671875, -2.540618896484375, -2.42034912109375, -2.300079345703125, -2.1798095703125, -2.059539794921875, -1.93927001953125, -1.819000244140625, -1.69873046875, -1.578460693359375, -1.45819091796875, -1.337921142578125, -1.2176513671875, -1.097381591796875, -0.97711181640625, -0.856842041015625, -0.736572265625, -0.616302490234375, -0.49603271484375, -0.375762939453125, -0.2554931640625, -0.135223388671875, -0.01495361328125, 0.105316162109375, 0.2255859375, 0.345855712890625, 0.46612548828125, 0.586395263671875, 0.7066650390625, 0.826934814453125, 0.94720458984375, 1.067474365234375, 1.187744140625, 1.308013916015625, 1.42828369140625, 1.548553466796875, 1.6688232421875, 1.789093017578125, 1.90936279296875, 2.029632568359375, 2.14990234375, 2.270172119140625, 2.39044189453125, 2.510711669921875, 2.6309814453125, 2.751251220703125, 2.87152099609375, 2.991790771484375, 3.112060546875, 3.232330322265625, 3.35260009765625, 3.472869873046875, 3.5931396484375, 3.713409423828125, 3.83367919921875, 3.953948974609375, 4.07421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 18.0, 27.0, 94.0, 334.0, 380.0, 98.0, 27.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.16302490234375, -124.28840637207031, -120.41378021240234, -116.5391616821289, -112.66453552246094, -108.7899169921875, -104.91529846191406, -101.0406723022461, -97.16605377197266, -93.29143524169922, -89.41680908203125, -85.54219055175781, -81.66756439208984, -77.7929458618164, -73.91831970214844, -70.043701171875, -66.16908264160156, -62.29446029663086, -58.419837951660156, -54.54521942138672, -50.670597076416016, -46.79597473144531, -42.92135238647461, -39.046730041503906, -35.17210388183594, -31.297481536865234, -27.422861099243164, -23.54823875427246, -19.67361831665039, -15.798995971679688, -11.924373626708984, -8.049753189086914, -4.175132751464844, -0.30051112174987793, 3.574110507965088, 7.448732376098633, 11.32335376739502, 15.197975158691406, 19.07259750366211, 22.94721794128418, 26.821840286254883, 30.696462631225586, 34.571083068847656, 38.44570541381836, 42.32032775878906, 46.1949462890625, 50.06957244873047, 53.944190979003906, 57.81881332397461, 61.69343566894531, 65.56805419921875, 69.44268035888672, 73.31729888916016, 77.19192504882812, 81.06654357910156, 84.941162109375, 88.81578826904297, 92.6904067993164, 96.56503295898438, 100.43965148925781, 104.31427764892578, 108.18889617919922, 112.06352233886719, 115.93814086914062, 119.81275939941406]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 6.0, 9.0, 13.0, 23.0, 46.0, 56.0, 110.0, 155.0, 167.0, 125.0, 101.0, 59.0, 26.0, 22.0, 9.0, 9.0, 6.0, 4.0, 6.0, 9.0, 0.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.05458068847656, -141.53274536132812, -137.01089477539062, -132.4890594482422, -127.96720886230469, -123.44536590576172, -118.92352294921875, -114.40168762207031, -109.87983703613281, -105.35799407958984, -100.83615112304688, -96.3143081665039, -91.79246520996094, -87.27062225341797, -82.748779296875, -78.22694396972656, -73.7051010131836, -69.18325805664062, -64.66141510009766, -60.13957214355469, -55.61772918701172, -51.09588623046875, -46.57404708862305, -42.05220413208008, -37.53036117553711, -33.00851821899414, -28.486675262451172, -23.964834213256836, -19.442991256713867, -14.921148300170898, -10.399307250976562, -5.877464294433594, -1.355621337890625, 3.1662211418151855, 7.688063621520996, 12.209905624389648, 16.731748580932617, 21.253591537475586, 25.775432586669922, 30.29727554321289, 34.81911849975586, 39.34096145629883, 43.8628044128418, 48.3846435546875, 52.90648651123047, 57.42832946777344, 61.950172424316406, 66.47201538085938, 70.99385833740234, 75.51570129394531, 80.03754425048828, 84.55938720703125, 89.08123016357422, 93.60307312011719, 98.12490844726562, 102.64675903320312, 107.16859436035156, 111.69043731689453, 116.2122802734375, 120.73412322998047, 125.25596618652344, 129.77780151367188, 134.29965209960938, 138.8214874267578, 143.3433380126953]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 14.0, 29.0, 38.0, 62.0, 90.0, 106.0, 188.0, 263.0, 448.0, 734.0, 1335.0, 2762.0, 6556.0, 23490.0, 261166.0, 3818949.0, 57486.0, 11989.0, 4403.0, 1852.0, 1039.0, 512.0, 261.0, 165.0, 113.0, 57.0, 47.0, 29.0, 22.0, 13.0, 8.0, 4.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-26.0625, -25.30126953125, -24.5400390625, -23.77880859375, -23.017578125, -22.25634765625, -21.4951171875, -20.73388671875, -19.97265625, -19.21142578125, -18.4501953125, -17.68896484375, -16.927734375, -16.16650390625, -15.4052734375, -14.64404296875, -13.8828125, -13.12158203125, -12.3603515625, -11.59912109375, -10.837890625, -10.07666015625, -9.3154296875, -8.55419921875, -7.79296875, -7.03173828125, -6.2705078125, -5.50927734375, -4.748046875, -3.98681640625, -3.2255859375, -2.46435546875, -1.703125, -0.94189453125, -0.1806640625, 0.58056640625, 1.341796875, 2.10302734375, 2.8642578125, 3.62548828125, 4.38671875, 5.14794921875, 5.9091796875, 6.67041015625, 7.431640625, 8.19287109375, 8.9541015625, 9.71533203125, 10.4765625, 11.23779296875, 11.9990234375, 12.76025390625, 13.521484375, 14.28271484375, 15.0439453125, 15.80517578125, 16.56640625, 17.32763671875, 18.0888671875, 18.85009765625, 19.611328125, 20.37255859375, 21.1337890625, 21.89501953125, 22.65625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 9.0, 18.0, 22.0, 40.0, 60.0, 116.0, 171.0, 185.0, 140.0, 73.0, 42.0, 20.0, 18.0, 12.0, 8.0, 10.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.99627685546875, -1.9300537109375, -1.86383056640625, -1.797607421875, -1.73138427734375, -1.6651611328125, -1.59893798828125, -1.53271484375, -1.46649169921875, -1.4002685546875, -1.33404541015625, -1.267822265625, -1.20159912109375, -1.1353759765625, -1.06915283203125, -1.0029296875, -0.93670654296875, -0.8704833984375, -0.80426025390625, -0.738037109375, -0.67181396484375, -0.6055908203125, -0.53936767578125, -0.47314453125, -0.40692138671875, -0.3406982421875, -0.27447509765625, -0.208251953125, -0.14202880859375, -0.0758056640625, -0.00958251953125, 0.056640625, 0.12286376953125, 0.1890869140625, 0.25531005859375, 0.321533203125, 0.38775634765625, 0.4539794921875, 0.52020263671875, 0.58642578125, 0.65264892578125, 0.7188720703125, 0.78509521484375, 0.851318359375, 0.91754150390625, 0.9837646484375, 1.04998779296875, 1.1162109375, 1.18243408203125, 1.2486572265625, 1.31488037109375, 1.381103515625, 1.44732666015625, 1.5135498046875, 1.57977294921875, 1.64599609375, 1.71221923828125, 1.7784423828125, 1.84466552734375, 1.910888671875, 1.97711181640625, 2.0433349609375, 2.10955810546875, 2.17578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 16.0, 21.0, 23.0, 31.0, 58.0, 91.0, 158.0, 258.0, 524.0, 1145.0, 2833.0, 7691.0, 29125.0, 307061.0, 3698875.0, 119188.0, 18096.0, 5244.0, 2043.0, 843.0, 404.0, 195.0, 140.0, 81.0, 45.0, 27.0, 21.0, 12.0, 9.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.46142578125, -11.9697265625, -11.47802734375, -10.986328125, -10.49462890625, -10.0029296875, -9.51123046875, -9.01953125, -8.52783203125, -8.0361328125, -7.54443359375, -7.052734375, -6.56103515625, -6.0693359375, -5.57763671875, -5.0859375, -4.59423828125, -4.1025390625, -3.61083984375, -3.119140625, -2.62744140625, -2.1357421875, -1.64404296875, -1.15234375, -0.66064453125, -0.1689453125, 0.32275390625, 0.814453125, 1.30615234375, 1.7978515625, 2.28955078125, 2.78125, 3.27294921875, 3.7646484375, 4.25634765625, 4.748046875, 5.23974609375, 5.7314453125, 6.22314453125, 6.71484375, 7.20654296875, 7.6982421875, 8.18994140625, 8.681640625, 9.17333984375, 9.6650390625, 10.15673828125, 10.6484375, 11.14013671875, 11.6318359375, 12.12353515625, 12.615234375, 13.10693359375, 13.5986328125, 14.09033203125, 14.58203125, 15.07373046875, 15.5654296875, 16.05712890625, 16.548828125, 17.04052734375, 17.5322265625, 18.02392578125, 18.515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 5.0, 2.0, 4.0, 5.0, 11.0, 8.0, 16.0, 22.0, 40.0, 86.0, 143.0, 345.0, 1758.0, 1000.0, 315.0, 131.0, 66.0, 33.0, 28.0, 18.0, 6.0, 13.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.0692138671875, -2.954833984375, -2.8404541015625, -2.72607421875, -2.6116943359375, -2.497314453125, -2.3829345703125, -2.2685546875, -2.1541748046875, -2.039794921875, -1.9254150390625, -1.81103515625, -1.6966552734375, -1.582275390625, -1.4678955078125, -1.353515625, -1.2391357421875, -1.124755859375, -1.0103759765625, -0.89599609375, -0.7816162109375, -0.667236328125, -0.5528564453125, -0.4384765625, -0.3240966796875, -0.209716796875, -0.0953369140625, 0.01904296875, 0.1334228515625, 0.247802734375, 0.3621826171875, 0.4765625, 0.5909423828125, 0.705322265625, 0.8197021484375, 0.93408203125, 1.0484619140625, 1.162841796875, 1.2772216796875, 1.3916015625, 1.5059814453125, 1.620361328125, 1.7347412109375, 1.84912109375, 1.9635009765625, 2.077880859375, 2.1922607421875, 2.306640625, 2.4210205078125, 2.535400390625, 2.6497802734375, 2.76416015625, 2.8785400390625, 2.992919921875, 3.1072998046875, 3.2216796875, 3.3360595703125, 3.450439453125, 3.5648193359375, 3.67919921875, 3.7935791015625, 3.907958984375, 4.0223388671875, 4.13671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 25.0, 59.0, 247.0, 464.0, 146.0, 36.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.16297912597656, -35.19352722167969, -34.22407531738281, -33.25461959838867, -32.2851676940918, -31.315715789794922, -30.346263885498047, -29.376811981201172, -28.407358169555664, -27.43790626525879, -26.46845245361328, -25.499000549316406, -24.52954864501953, -23.560094833374023, -22.59064292907715, -21.62118911743164, -20.651737213134766, -19.68228530883789, -18.712831497192383, -17.743379592895508, -16.77392578125, -15.804473876953125, -14.83502197265625, -13.865569114685059, -12.896116256713867, -11.926663398742676, -10.957210540771484, -9.98775863647461, -9.018305778503418, -8.048852920532227, -7.079400539398193, -6.10994815826416, -5.140497207641602, -4.17104434967041, -3.201591968536377, -2.2321393489837646, -1.2626867294311523, -0.29323387145996094, 0.6762185096740723, 1.6456708908081055, 2.615123748779297, 3.584576368331909, 4.5540289878845215, 5.523481369018555, 6.492934226989746, 7.4623870849609375, 8.431838989257812, 9.401291847229004, 10.370744705200195, 11.340197563171387, 12.309650421142578, 13.279102325439453, 14.248555183410645, 15.218008041381836, 16.18745994567871, 17.15691375732422, 18.126365661621094, 19.09581756591797, 20.065271377563477, 21.03472328186035, 22.00417709350586, 22.973628997802734, 23.94308090209961, 24.912532806396484, 25.881986618041992]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 16.0, 15.0, 29.0, 54.0, 61.0, 92.0, 100.0, 126.0, 123.0, 92.0, 74.0, 74.0, 41.0, 26.0, 19.0, 9.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.327640533447266, -19.696151733398438, -19.06466293334961, -18.43317413330078, -17.801685333251953, -17.170194625854492, -16.538705825805664, -15.907217025756836, -15.275728225708008, -14.64423942565918, -14.012750625610352, -13.381260871887207, -12.749772071838379, -12.11828327178955, -11.486793518066406, -10.855304718017578, -10.22381591796875, -9.592327117919922, -8.960838317871094, -8.32934856414795, -7.697859764099121, -7.066370964050293, -6.434881687164307, -5.80339241027832, -5.171903610229492, -4.540414810180664, -3.9089255332946777, -3.2774364948272705, -2.6459474563598633, -2.014458417892456, -1.3829693794250488, -0.7514801025390625, -0.11999130249023438, 0.5114977359771729, 1.14298677444458, 1.7744758129119873, 2.4059648513793945, 3.0374538898468018, 3.668942928314209, 4.300432205200195, 4.931921005249023, 5.563409805297852, 6.194899082183838, 6.826388359069824, 7.457877159118652, 8.08936595916748, 8.720855712890625, 9.352344512939453, 9.983833312988281, 10.61532211303711, 11.246810913085938, 11.878300666809082, 12.50978946685791, 13.141278266906738, 13.772768020629883, 14.404256820678711, 15.035745620727539, 15.667234420776367, 16.298723220825195, 16.930212020874023, 17.561702728271484, 18.193191528320312, 18.82468032836914, 19.45616912841797, 20.087657928466797]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 5.0, 15.0, 14.0, 18.0, 28.0, 51.0, 66.0, 120.0, 216.0, 372.0, 821.0, 2123.0, 6129.0, 24274.0, 242593.0, 710403.0, 46418.0, 9664.0, 3036.0, 1123.0, 488.0, 239.0, 119.0, 87.0, 49.0, 22.0, 17.0, 17.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.2454833984375, -16.740966796875, -16.2364501953125, -15.73193359375, -15.2274169921875, -14.722900390625, -14.2183837890625, -13.7138671875, -13.2093505859375, -12.704833984375, -12.2003173828125, -11.69580078125, -11.1912841796875, -10.686767578125, -10.1822509765625, -9.677734375, -9.1732177734375, -8.668701171875, -8.1641845703125, -7.65966796875, -7.1551513671875, -6.650634765625, -6.1461181640625, -5.6416015625, -5.1370849609375, -4.632568359375, -4.1280517578125, -3.62353515625, -3.1190185546875, -2.614501953125, -2.1099853515625, -1.60546875, -1.1009521484375, -0.596435546875, -0.0919189453125, 0.41259765625, 0.9171142578125, 1.421630859375, 1.9261474609375, 2.4306640625, 2.9351806640625, 3.439697265625, 3.9442138671875, 4.44873046875, 4.9532470703125, 5.457763671875, 5.9622802734375, 6.466796875, 6.9713134765625, 7.475830078125, 7.9803466796875, 8.48486328125, 8.9893798828125, 9.493896484375, 9.9984130859375, 10.5029296875, 11.0074462890625, 11.511962890625, 12.0164794921875, 12.52099609375, 13.0255126953125, 13.530029296875, 14.0345458984375, 14.5390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 10.0, 14.0, 9.0, 25.0, 45.0, 70.0, 122.0, 174.0, 171.0, 128.0, 88.0, 42.0, 24.0, 18.0, 15.0, 6.0, 10.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.137298583984375, -1.07147216796875, -1.005645751953125, -0.9398193359375, -0.873992919921875, -0.80816650390625, -0.742340087890625, -0.676513671875, -0.610687255859375, -0.54486083984375, -0.479034423828125, -0.4132080078125, -0.347381591796875, -0.28155517578125, -0.215728759765625, -0.14990234375, -0.084075927734375, -0.01824951171875, 0.047576904296875, 0.1134033203125, 0.179229736328125, 0.24505615234375, 0.310882568359375, 0.376708984375, 0.442535400390625, 0.50836181640625, 0.574188232421875, 0.6400146484375, 0.705841064453125, 0.77166748046875, 0.837493896484375, 0.9033203125, 0.969146728515625, 1.03497314453125, 1.100799560546875, 1.1666259765625, 1.232452392578125, 1.29827880859375, 1.364105224609375, 1.429931640625, 1.495758056640625, 1.56158447265625, 1.627410888671875, 1.6932373046875, 1.759063720703125, 1.82489013671875, 1.890716552734375, 1.95654296875, 2.022369384765625, 2.08819580078125, 2.154022216796875, 2.2198486328125, 2.285675048828125, 2.35150146484375, 2.417327880859375, 2.483154296875, 2.548980712890625, 2.61480712890625, 2.680633544921875, 2.7464599609375, 2.812286376953125, 2.87811279296875, 2.943939208984375, 3.009765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 13.0, 6.0, 15.0, 14.0, 19.0, 47.0, 52.0, 93.0, 144.0, 247.0, 399.0, 692.0, 1383.0, 2805.0, 6325.0, 14622.0, 38619.0, 116481.0, 420381.0, 313229.0, 83600.0, 28315.0, 11055.0, 4847.0, 2388.0, 1236.0, 596.0, 345.0, 225.0, 135.0, 67.0, 46.0, 35.0, 26.0, 14.0, 8.0, 12.0, 9.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.48046875, -5.30853271484375, -5.1365966796875, -4.96466064453125, -4.792724609375, -4.62078857421875, -4.4488525390625, -4.27691650390625, -4.10498046875, -3.93304443359375, -3.7611083984375, -3.58917236328125, -3.417236328125, -3.24530029296875, -3.0733642578125, -2.90142822265625, -2.7294921875, -2.55755615234375, -2.3856201171875, -2.21368408203125, -2.041748046875, -1.86981201171875, -1.6978759765625, -1.52593994140625, -1.35400390625, -1.18206787109375, -1.0101318359375, -0.83819580078125, -0.666259765625, -0.49432373046875, -0.3223876953125, -0.15045166015625, 0.021484375, 0.19342041015625, 0.3653564453125, 0.53729248046875, 0.709228515625, 0.88116455078125, 1.0531005859375, 1.22503662109375, 1.39697265625, 1.56890869140625, 1.7408447265625, 1.91278076171875, 2.084716796875, 2.25665283203125, 2.4285888671875, 2.60052490234375, 2.7724609375, 2.94439697265625, 3.1163330078125, 3.28826904296875, 3.460205078125, 3.63214111328125, 3.8040771484375, 3.97601318359375, 4.14794921875, 4.31988525390625, 4.4918212890625, 4.66375732421875, 4.835693359375, 5.00762939453125, 5.1795654296875, 5.35150146484375, 5.5234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 11.0, 14.0, 17.0, 17.0, 21.0, 27.0, 36.0, 35.0, 32.0, 40.0, 45.0, 39.0, 46.0, 43.0, 56.0, 53.0, 53.0, 53.0, 46.0, 50.0, 44.0, 34.0, 30.0, 32.0, 18.0, 20.0, 15.0, 13.0, 8.0, 12.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.9144287109375, -4.746826171875, -4.5792236328125, -4.41162109375, -4.2440185546875, -4.076416015625, -3.9088134765625, -3.7412109375, -3.5736083984375, -3.406005859375, -3.2384033203125, -3.07080078125, -2.9031982421875, -2.735595703125, -2.5679931640625, -2.400390625, -2.2327880859375, -2.065185546875, -1.8975830078125, -1.72998046875, -1.5623779296875, -1.394775390625, -1.2271728515625, -1.0595703125, -0.8919677734375, -0.724365234375, -0.5567626953125, -0.38916015625, -0.2215576171875, -0.053955078125, 0.1136474609375, 0.28125, 0.4488525390625, 0.616455078125, 0.7840576171875, 0.95166015625, 1.1192626953125, 1.286865234375, 1.4544677734375, 1.6220703125, 1.7896728515625, 1.957275390625, 2.1248779296875, 2.29248046875, 2.4600830078125, 2.627685546875, 2.7952880859375, 2.962890625, 3.1304931640625, 3.298095703125, 3.4656982421875, 3.63330078125, 3.8009033203125, 3.968505859375, 4.1361083984375, 4.3037109375, 4.4713134765625, 4.638916015625, 4.8065185546875, 4.97412109375, 5.1417236328125, 5.309326171875, 5.4769287109375, 5.64453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 4.0, 7.0, 12.0, 18.0, 21.0, 34.0, 37.0, 48.0, 65.0, 86.0, 145.0, 268.0, 442.0, 814.0, 1580.0, 3704.0, 11134.0, 46692.0, 404575.0, 502726.0, 55366.0, 12663.0, 4218.0, 1822.0, 828.0, 449.0, 319.0, 159.0, 84.0, 73.0, 46.0, 38.0, 20.0, 14.0, 7.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.2451171875, -7.951171875, -7.6572265625, -7.36328125, -7.0693359375, -6.775390625, -6.4814453125, -6.1875, -5.8935546875, -5.599609375, -5.3056640625, -5.01171875, -4.7177734375, -4.423828125, -4.1298828125, -3.8359375, -3.5419921875, -3.248046875, -2.9541015625, -2.66015625, -2.3662109375, -2.072265625, -1.7783203125, -1.484375, -1.1904296875, -0.896484375, -0.6025390625, -0.30859375, -0.0146484375, 0.279296875, 0.5732421875, 0.8671875, 1.1611328125, 1.455078125, 1.7490234375, 2.04296875, 2.3369140625, 2.630859375, 2.9248046875, 3.21875, 3.5126953125, 3.806640625, 4.1005859375, 4.39453125, 4.6884765625, 4.982421875, 5.2763671875, 5.5703125, 5.8642578125, 6.158203125, 6.4521484375, 6.74609375, 7.0400390625, 7.333984375, 7.6279296875, 7.921875, 8.2158203125, 8.509765625, 8.8037109375, 9.09765625, 9.3916015625, 9.685546875, 9.9794921875, 10.2734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 14.0, 10.0, 15.0, 18.0, 19.0, 38.0, 66.0, 119.0, 213.0, 198.0, 102.0, 72.0, 41.0, 23.0, 9.0, 10.0, 11.0, 10.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040340423583984375, -0.00038943439722061157, -0.0003754645586013794, -0.0003614947199821472, -0.00034752488136291504, -0.00033355504274368286, -0.0003195852041244507, -0.0003056153655052185, -0.00029164552688598633, -0.00027767568826675415, -0.00026370584964752197, -0.0002497360110282898, -0.00023576617240905762, -0.00022179633378982544, -0.00020782649517059326, -0.00019385665655136108, -0.0001798868179321289, -0.00016591697931289673, -0.00015194714069366455, -0.00013797730207443237, -0.0001240074634552002, -0.00011003762483596802, -9.606778621673584e-05, -8.209794759750366e-05, -6.812810897827148e-05, -5.415827035903931e-05, -4.018843173980713e-05, -2.621859312057495e-05, -1.2248754501342773e-05, 1.7210841178894043e-06, 1.5690922737121582e-05, 2.966076135635376e-05, 4.363059997558594e-05, 5.7600438594818115e-05, 7.157027721405029e-05, 8.554011583328247e-05, 9.950995445251465e-05, 0.00011347979307174683, 0.000127449631690979, 0.00014141947031021118, 0.00015538930892944336, 0.00016935914754867554, 0.00018332898616790771, 0.0001972988247871399, 0.00021126866340637207, 0.00022523850202560425, 0.00023920834064483643, 0.0002531781792640686, 0.0002671480178833008, 0.00028111785650253296, 0.00029508769512176514, 0.0003090575337409973, 0.0003230273723602295, 0.00033699721097946167, 0.00035096704959869385, 0.000364936888217926, 0.0003789067268371582, 0.0003928765654563904, 0.00040684640407562256, 0.00042081624269485474, 0.0004347860813140869, 0.0004487559199333191, 0.00046272575855255127, 0.00047669559717178345, 0.0004906654357910156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 25.0, 21.0, 38.0, 66.0, 126.0, 248.0, 515.0, 1356.0, 4018.0, 15271.0, 81840.0, 643826.0, 256781.0, 32991.0, 7363.0, 2310.0, 926.0, 352.0, 186.0, 110.0, 56.0, 36.0, 23.0, 18.0, 15.0, 6.0, 6.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.38592529296875, -11.0921630859375, -10.79840087890625, -10.504638671875, -10.21087646484375, -9.9171142578125, -9.62335205078125, -9.32958984375, -9.03582763671875, -8.7420654296875, -8.44830322265625, -8.154541015625, -7.86077880859375, -7.5670166015625, -7.27325439453125, -6.9794921875, -6.68572998046875, -6.3919677734375, -6.09820556640625, -5.804443359375, -5.51068115234375, -5.2169189453125, -4.92315673828125, -4.62939453125, -4.33563232421875, -4.0418701171875, -3.74810791015625, -3.454345703125, -3.16058349609375, -2.8668212890625, -2.57305908203125, -2.279296875, -1.98553466796875, -1.6917724609375, -1.39801025390625, -1.104248046875, -0.81048583984375, -0.5167236328125, -0.22296142578125, 0.07080078125, 0.36456298828125, 0.6583251953125, 0.95208740234375, 1.245849609375, 1.53961181640625, 1.8333740234375, 2.12713623046875, 2.4208984375, 2.71466064453125, 3.0084228515625, 3.30218505859375, 3.595947265625, 3.88970947265625, 4.1834716796875, 4.47723388671875, 4.77099609375, 5.06475830078125, 5.3585205078125, 5.65228271484375, 5.946044921875, 6.23980712890625, 6.5335693359375, 6.82733154296875, 7.12109375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 13.0, 16.0, 13.0, 20.0, 23.0, 34.0, 36.0, 52.0, 51.0, 77.0, 98.0, 93.0, 82.0, 82.0, 72.0, 41.0, 44.0, 29.0, 30.0, 23.0, 11.0, 6.0, 13.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.82122802734375, -3.6658935546875, -3.51055908203125, -3.355224609375, -3.19989013671875, -3.0445556640625, -2.88922119140625, -2.73388671875, -2.57855224609375, -2.4232177734375, -2.26788330078125, -2.112548828125, -1.95721435546875, -1.8018798828125, -1.64654541015625, -1.4912109375, -1.33587646484375, -1.1805419921875, -1.02520751953125, -0.869873046875, -0.71453857421875, -0.5592041015625, -0.40386962890625, -0.24853515625, -0.09320068359375, 0.0621337890625, 0.21746826171875, 0.372802734375, 0.52813720703125, 0.6834716796875, 0.83880615234375, 0.994140625, 1.14947509765625, 1.3048095703125, 1.46014404296875, 1.615478515625, 1.77081298828125, 1.9261474609375, 2.08148193359375, 2.23681640625, 2.39215087890625, 2.5474853515625, 2.70281982421875, 2.858154296875, 3.01348876953125, 3.1688232421875, 3.32415771484375, 3.4794921875, 3.63482666015625, 3.7901611328125, 3.94549560546875, 4.100830078125, 4.25616455078125, 4.4114990234375, 4.56683349609375, 4.72216796875, 4.87750244140625, 5.0328369140625, 5.18817138671875, 5.343505859375, 5.49884033203125, 5.6541748046875, 5.80950927734375, 5.96484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 12.0, 24.0, 69.0, 121.0, 201.0, 217.0, 171.0, 75.0, 34.0, 24.0, 13.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-81.08412170410156, -79.4083023071289, -77.73248291015625, -76.05667114257812, -74.38085174560547, -72.70503234863281, -71.02922058105469, -69.35340118408203, -67.67758178710938, -66.00176239013672, -64.32594299316406, -62.65013122558594, -60.97431182861328, -59.298492431640625, -57.622676849365234, -55.946861267089844, -54.27104187011719, -52.59522247314453, -50.91940689086914, -49.24359130859375, -47.567771911621094, -45.89195251464844, -44.21613693237305, -42.540321350097656, -40.864501953125, -39.188682556152344, -37.51286697387695, -35.83705139160156, -34.161231994628906, -32.48541259765625, -30.80959701538086, -29.133779525756836, -27.45796012878418, -25.782142639160156, -24.106325149536133, -22.43050765991211, -20.754690170288086, -19.078872680664062, -17.40305519104004, -15.727237701416016, -14.051420211791992, -12.375602722167969, -10.699785232543945, -9.023967742919922, -7.348150253295898, -5.672332763671875, -3.9965152740478516, -2.320697784423828, -0.6448802947998047, 1.0309371948242188, 2.706754684448242, 4.382572174072266, 6.058389663696289, 7.7342071533203125, 9.410024642944336, 11.08584213256836, 12.761659622192383, 14.437477111816406, 16.11329460144043, 17.789112091064453, 19.464929580688477, 21.1407470703125, 22.816564559936523, 24.492382049560547, 26.16819953918457]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 11.0, 5.0, 3.0, 10.0, 14.0, 8.0, 16.0, 30.0, 36.0, 36.0, 65.0, 74.0, 71.0, 80.0, 79.0, 81.0, 55.0, 57.0, 63.0, 55.0, 31.0, 34.0, 23.0, 15.0, 12.0, 14.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-65.4575424194336, -63.834007263183594, -62.21047592163086, -60.58694076538086, -58.963409423828125, -57.339874267578125, -55.716339111328125, -54.09280776977539, -52.469276428222656, -50.845741271972656, -49.22220993041992, -47.59867477416992, -45.97514343261719, -44.35160827636719, -42.72807312011719, -41.10454177856445, -39.48100662231445, -37.85747146606445, -36.23394012451172, -34.61040496826172, -32.986873626708984, -31.363338470458984, -29.739805221557617, -28.11627197265625, -26.492738723754883, -24.869205474853516, -23.24567222595215, -21.62213897705078, -19.99860382080078, -18.375072479248047, -16.751537322998047, -15.12800407409668, -13.504470825195312, -11.880937576293945, -10.257404327392578, -8.633870124816895, -7.010336875915527, -5.38680362701416, -3.7632694244384766, -2.1397361755371094, -0.5162029266357422, 1.107330560684204, 2.7308640480041504, 4.354397773742676, 5.977931022644043, 7.60146427154541, 9.224998474121094, 10.848531723022461, 12.472064971923828, 14.095598220825195, 15.719131469726562, 17.342666625976562, 18.966197967529297, 20.589733123779297, 22.213266372680664, 23.83679962158203, 25.4603328704834, 27.083866119384766, 28.707399368286133, 30.3309326171875, 31.9544677734375, 33.577999114990234, 35.201534271240234, 36.82506561279297, 38.44860076904297]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 15.0, 21.0, 21.0, 41.0, 52.0, 65.0, 125.0, 178.0, 292.0, 472.0, 799.0, 1496.0, 2842.0, 6988.0, 22333.0, 185802.0, 3832691.0, 108430.0, 18569.0, 6293.0, 2738.0, 1482.0, 814.0, 556.0, 357.0, 263.0, 165.0, 102.0, 76.0, 67.0, 37.0, 26.0, 13.0, 8.0, 14.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.109375, -25.3720703125, -24.634765625, -23.8974609375, -23.16015625, -22.4228515625, -21.685546875, -20.9482421875, -20.2109375, -19.4736328125, -18.736328125, -17.9990234375, -17.26171875, -16.5244140625, -15.787109375, -15.0498046875, -14.3125, -13.5751953125, -12.837890625, -12.1005859375, -11.36328125, -10.6259765625, -9.888671875, -9.1513671875, -8.4140625, -7.6767578125, -6.939453125, -6.2021484375, -5.46484375, -4.7275390625, -3.990234375, -3.2529296875, -2.515625, -1.7783203125, -1.041015625, -0.3037109375, 0.43359375, 1.1708984375, 1.908203125, 2.6455078125, 3.3828125, 4.1201171875, 4.857421875, 5.5947265625, 6.33203125, 7.0693359375, 7.806640625, 8.5439453125, 9.28125, 10.0185546875, 10.755859375, 11.4931640625, 12.23046875, 12.9677734375, 13.705078125, 14.4423828125, 15.1796875, 15.9169921875, 16.654296875, 17.3916015625, 18.12890625, 18.8662109375, 19.603515625, 20.3408203125, 21.078125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 22.0, 23.0, 28.0, 31.0, 56.0, 70.0, 90.0, 95.0, 122.0, 95.0, 78.0, 66.0, 43.0, 32.0, 26.0, 17.0, 9.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4794921875, -1.4376373291015625, -1.395782470703125, -1.3539276123046875, -1.31207275390625, -1.2702178955078125, -1.228363037109375, -1.1865081787109375, -1.1446533203125, -1.1027984619140625, -1.060943603515625, -1.0190887451171875, -0.97723388671875, -0.9353790283203125, -0.893524169921875, -0.8516693115234375, -0.809814453125, -0.7679595947265625, -0.726104736328125, -0.6842498779296875, -0.64239501953125, -0.6005401611328125, -0.558685302734375, -0.5168304443359375, -0.4749755859375, -0.4331207275390625, -0.391265869140625, -0.3494110107421875, -0.30755615234375, -0.2657012939453125, -0.223846435546875, -0.1819915771484375, -0.14013671875, -0.0982818603515625, -0.056427001953125, -0.0145721435546875, 0.02728271484375, 0.0691375732421875, 0.110992431640625, 0.1528472900390625, 0.1947021484375, 0.2365570068359375, 0.278411865234375, 0.3202667236328125, 0.36212158203125, 0.4039764404296875, 0.445831298828125, 0.4876861572265625, 0.529541015625, 0.5713958740234375, 0.613250732421875, 0.6551055908203125, 0.69696044921875, 0.7388153076171875, 0.780670166015625, 0.8225250244140625, 0.8643798828125, 0.9062347412109375, 0.948089599609375, 0.9899444580078125, 1.03179931640625, 1.0736541748046875, 1.115509033203125, 1.1573638916015625, 1.19921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 13.0, 12.0, 16.0, 20.0, 36.0, 68.0, 79.0, 197.0, 776.0, 7875.0, 3850158.0, 330110.0, 4002.0, 480.0, 158.0, 82.0, 42.0, 29.0, 27.0, 16.0, 13.0, 10.0, 11.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.78125, -50.2060546875, -48.630859375, -47.0556640625, -45.48046875, -43.9052734375, -42.330078125, -40.7548828125, -39.1796875, -37.6044921875, -36.029296875, -34.4541015625, -32.87890625, -31.3037109375, -29.728515625, -28.1533203125, -26.578125, -25.0029296875, -23.427734375, -21.8525390625, -20.27734375, -18.7021484375, -17.126953125, -15.5517578125, -13.9765625, -12.4013671875, -10.826171875, -9.2509765625, -7.67578125, -6.1005859375, -4.525390625, -2.9501953125, -1.375, 0.2001953125, 1.775390625, 3.3505859375, 4.92578125, 6.5009765625, 8.076171875, 9.6513671875, 11.2265625, 12.8017578125, 14.376953125, 15.9521484375, 17.52734375, 19.1025390625, 20.677734375, 22.2529296875, 23.828125, 25.4033203125, 26.978515625, 28.5537109375, 30.12890625, 31.7041015625, 33.279296875, 34.8544921875, 36.4296875, 38.0048828125, 39.580078125, 41.1552734375, 42.73046875, 44.3056640625, 45.880859375, 47.4560546875, 49.03125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 12.0, 6.0, 11.0, 17.0, 21.0, 18.0, 37.0, 43.0, 87.0, 111.0, 182.0, 338.0, 710.0, 1254.0, 476.0, 268.0, 149.0, 103.0, 51.0, 43.0, 31.0, 22.0, 13.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.15234375, -2.08343505859375, -2.0145263671875, -1.94561767578125, -1.876708984375, -1.80780029296875, -1.7388916015625, -1.66998291015625, -1.60107421875, -1.53216552734375, -1.4632568359375, -1.39434814453125, -1.325439453125, -1.25653076171875, -1.1876220703125, -1.11871337890625, -1.0498046875, -0.98089599609375, -0.9119873046875, -0.84307861328125, -0.774169921875, -0.70526123046875, -0.6363525390625, -0.56744384765625, -0.49853515625, -0.42962646484375, -0.3607177734375, -0.29180908203125, -0.222900390625, -0.15399169921875, -0.0850830078125, -0.01617431640625, 0.052734375, 0.12164306640625, 0.1905517578125, 0.25946044921875, 0.328369140625, 0.39727783203125, 0.4661865234375, 0.53509521484375, 0.60400390625, 0.67291259765625, 0.7418212890625, 0.81072998046875, 0.879638671875, 0.94854736328125, 1.0174560546875, 1.08636474609375, 1.1552734375, 1.22418212890625, 1.2930908203125, 1.36199951171875, 1.430908203125, 1.49981689453125, 1.5687255859375, 1.63763427734375, 1.70654296875, 1.77545166015625, 1.8443603515625, 1.91326904296875, 1.982177734375, 2.05108642578125, 2.1199951171875, 2.18890380859375, 2.2578125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 14.0, 30.0, 97.0, 242.0, 324.0, 181.0, 56.0, 31.0, 12.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.327363967895508, -7.588978290557861, -6.850592613220215, -6.112206935882568, -5.373821258544922, -4.635435581207275, -3.897049903869629, -3.1586642265319824, -2.420278549194336, -1.6818928718566895, -0.943507194519043, -0.20512151718139648, 0.53326416015625, 1.2716498374938965, 2.010035514831543, 2.7484211921691895, 3.486806869506836, 4.225192546844482, 4.963578224182129, 5.701963901519775, 6.440349578857422, 7.178735256195068, 7.917120933532715, 8.655506134033203, 9.393892288208008, 10.132278442382812, 10.8706636428833, 11.609048843383789, 12.347434997558594, 13.085821151733398, 13.824206352233887, 14.562591552734375, 15.300979614257812, 16.039365768432617, 16.777751922607422, 17.516136169433594, 18.2545223236084, 18.992908477783203, 19.731292724609375, 20.46967887878418, 21.208065032958984, 21.94645118713379, 22.684837341308594, 23.423221588134766, 24.16160774230957, 24.899993896484375, 25.638378143310547, 26.37676429748535, 27.115150451660156, 27.85353660583496, 28.591922760009766, 29.330307006835938, 30.068693161010742, 30.807079315185547, 31.54546356201172, 32.283851623535156, 33.02223587036133, 33.7606201171875, 34.49900817871094, 35.23739242553711, 35.97577667236328, 36.71416473388672, 37.45254898071289, 38.19093704223633, 38.9293212890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 6.0, 11.0, 13.0, 11.0, 23.0, 23.0, 48.0, 41.0, 45.0, 69.0, 75.0, 68.0, 88.0, 81.0, 80.0, 62.0, 51.0, 47.0, 41.0, 36.0, 20.0, 20.0, 15.0, 8.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.226205825805664, -10.805607795715332, -10.385010719299316, -9.964412689208984, -9.543814659118652, -9.12321662902832, -8.702619552612305, -8.282021522521973, -7.861423969268799, -7.440826416015625, -7.020228385925293, -6.599630832672119, -6.179033279418945, -5.758435249328613, -5.3378376960754395, -4.917240142822266, -4.496642112731934, -4.07604455947876, -3.6554465293884277, -3.234848976135254, -2.814251184463501, -2.393653392791748, -1.9730558395385742, -1.5524580478668213, -1.1318602561950684, -0.7112625241279602, -0.29066479206085205, 0.12993288040161133, 0.5505306720733643, 0.9711284637451172, 1.391726016998291, 1.812323808670044, 2.2329225540161133, 2.653520345687866, 3.074118137359619, 3.494715690612793, 3.915313482284546, 4.335911273956299, 4.756508827209473, 5.177106857299805, 5.5977044105529785, 6.018301963806152, 6.438899993896484, 6.859497547149658, 7.280095100402832, 7.700693130493164, 8.12129020690918, 8.541888236999512, 8.962486267089844, 9.383084297180176, 9.803681373596191, 10.224279403686523, 10.644877433776855, 11.065475463867188, 11.486072540283203, 11.906670570373535, 12.327268600463867, 12.7478666305542, 13.168463706970215, 13.589061737060547, 14.009659767150879, 14.430257797241211, 14.850854873657227, 15.271452903747559, 15.692049980163574]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 4.0, 5.0, 8.0, 12.0, 30.0, 29.0, 39.0, 57.0, 96.0, 132.0, 217.0, 343.0, 547.0, 943.0, 1624.0, 3019.0, 6082.0, 14278.0, 41546.0, 157451.0, 515313.0, 219574.0, 54078.0, 17909.0, 7356.0, 3451.0, 1789.0, 1029.0, 523.0, 359.0, 191.0, 162.0, 105.0, 88.0, 38.0, 38.0, 24.0, 15.0, 12.0, 10.0, 10.0, 1.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.8203125, -7.5648193359375, -7.309326171875, -7.0538330078125, -6.79833984375, -6.5428466796875, -6.287353515625, -6.0318603515625, -5.7763671875, -5.5208740234375, -5.265380859375, -5.0098876953125, -4.75439453125, -4.4989013671875, -4.243408203125, -3.9879150390625, -3.732421875, -3.4769287109375, -3.221435546875, -2.9659423828125, -2.71044921875, -2.4549560546875, -2.199462890625, -1.9439697265625, -1.6884765625, -1.4329833984375, -1.177490234375, -0.9219970703125, -0.66650390625, -0.4110107421875, -0.155517578125, 0.0999755859375, 0.35546875, 0.6109619140625, 0.866455078125, 1.1219482421875, 1.37744140625, 1.6329345703125, 1.888427734375, 2.1439208984375, 2.3994140625, 2.6549072265625, 2.910400390625, 3.1658935546875, 3.42138671875, 3.6768798828125, 3.932373046875, 4.1878662109375, 4.443359375, 4.6988525390625, 4.954345703125, 5.2098388671875, 5.46533203125, 5.7208251953125, 5.976318359375, 6.2318115234375, 6.4873046875, 6.7427978515625, 6.998291015625, 7.2537841796875, 7.50927734375, 7.7647705078125, 8.020263671875, 8.2757568359375, 8.53125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 9.0, 9.0, 10.0, 17.0, 21.0, 32.0, 37.0, 41.0, 75.0, 73.0, 75.0, 102.0, 81.0, 97.0, 72.0, 61.0, 48.0, 37.0, 27.0, 14.0, 12.0, 14.0, 8.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2275390625, -1.1880035400390625, -1.148468017578125, -1.1089324951171875, -1.06939697265625, -1.0298614501953125, -0.990325927734375, -0.9507904052734375, -0.9112548828125, -0.8717193603515625, -0.832183837890625, -0.7926483154296875, -0.75311279296875, -0.7135772705078125, -0.674041748046875, -0.6345062255859375, -0.594970703125, -0.5554351806640625, -0.515899658203125, -0.4763641357421875, -0.43682861328125, -0.3972930908203125, -0.357757568359375, -0.3182220458984375, -0.2786865234375, -0.2391510009765625, -0.199615478515625, -0.1600799560546875, -0.12054443359375, -0.0810089111328125, -0.041473388671875, -0.0019378662109375, 0.03759765625, 0.0771331787109375, 0.116668701171875, 0.1562042236328125, 0.19573974609375, 0.2352752685546875, 0.274810791015625, 0.3143463134765625, 0.3538818359375, 0.3934173583984375, 0.432952880859375, 0.4724884033203125, 0.51202392578125, 0.5515594482421875, 0.591094970703125, 0.6306304931640625, 0.670166015625, 0.7097015380859375, 0.749237060546875, 0.7887725830078125, 0.82830810546875, 0.8678436279296875, 0.907379150390625, 0.9469146728515625, 0.9864501953125, 1.0259857177734375, 1.065521240234375, 1.1050567626953125, 1.14459228515625, 1.1841278076171875, 1.223663330078125, 1.2631988525390625, 1.302734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 13.0, 12.0, 17.0, 22.0, 31.0, 36.0, 59.0, 86.0, 121.0, 183.0, 270.0, 468.0, 740.0, 1393.0, 2527.0, 5066.0, 11203.0, 26353.0, 71651.0, 226860.0, 424426.0, 179935.0, 57245.0, 21429.0, 9146.0, 4177.0, 2097.0, 1129.0, 672.0, 418.0, 232.0, 168.0, 111.0, 68.0, 56.0, 45.0, 17.0, 17.0, 17.0, 7.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.78082275390625, -6.5577392578125, -6.33465576171875, -6.111572265625, -5.88848876953125, -5.6654052734375, -5.44232177734375, -5.21923828125, -4.99615478515625, -4.7730712890625, -4.54998779296875, -4.326904296875, -4.10382080078125, -3.8807373046875, -3.65765380859375, -3.4345703125, -3.21148681640625, -2.9884033203125, -2.76531982421875, -2.542236328125, -2.31915283203125, -2.0960693359375, -1.87298583984375, -1.64990234375, -1.42681884765625, -1.2037353515625, -0.98065185546875, -0.757568359375, -0.53448486328125, -0.3114013671875, -0.08831787109375, 0.134765625, 0.35784912109375, 0.5809326171875, 0.80401611328125, 1.027099609375, 1.25018310546875, 1.4732666015625, 1.69635009765625, 1.91943359375, 2.14251708984375, 2.3656005859375, 2.58868408203125, 2.811767578125, 3.03485107421875, 3.2579345703125, 3.48101806640625, 3.7041015625, 3.92718505859375, 4.1502685546875, 4.37335205078125, 4.596435546875, 4.81951904296875, 5.0426025390625, 5.26568603515625, 5.48876953125, 5.71185302734375, 5.9349365234375, 6.15802001953125, 6.381103515625, 6.60418701171875, 6.8272705078125, 7.05035400390625, 7.2734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 6.0, 8.0, 9.0, 17.0, 17.0, 25.0, 17.0, 19.0, 15.0, 18.0, 38.0, 30.0, 36.0, 40.0, 47.0, 40.0, 49.0, 46.0, 46.0, 40.0, 50.0, 43.0, 42.0, 43.0, 39.0, 27.0, 36.0, 24.0, 17.0, 18.0, 20.0, 10.0, 6.0, 9.0, 10.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.90960693359375, -4.7449951171875, -4.58038330078125, -4.415771484375, -4.25115966796875, -4.0865478515625, -3.92193603515625, -3.75732421875, -3.59271240234375, -3.4281005859375, -3.26348876953125, -3.098876953125, -2.93426513671875, -2.7696533203125, -2.60504150390625, -2.4404296875, -2.27581787109375, -2.1112060546875, -1.94659423828125, -1.781982421875, -1.61737060546875, -1.4527587890625, -1.28814697265625, -1.12353515625, -0.95892333984375, -0.7943115234375, -0.62969970703125, -0.465087890625, -0.30047607421875, -0.1358642578125, 0.02874755859375, 0.193359375, 0.35797119140625, 0.5225830078125, 0.68719482421875, 0.851806640625, 1.01641845703125, 1.1810302734375, 1.34564208984375, 1.51025390625, 1.67486572265625, 1.8394775390625, 2.00408935546875, 2.168701171875, 2.33331298828125, 2.4979248046875, 2.66253662109375, 2.8271484375, 2.99176025390625, 3.1563720703125, 3.32098388671875, 3.485595703125, 3.65020751953125, 3.8148193359375, 3.97943115234375, 4.14404296875, 4.30865478515625, 4.4732666015625, 4.63787841796875, 4.802490234375, 4.96710205078125, 5.1317138671875, 5.29632568359375, 5.4609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 14.0, 25.0, 25.0, 63.0, 90.0, 174.0, 322.0, 721.0, 1764.0, 5027.0, 17190.0, 81108.0, 470354.0, 386170.0, 64050.0, 14269.0, 4361.0, 1533.0, 639.0, 269.0, 160.0, 85.0, 43.0, 27.0, 13.0, 10.0, 11.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.28125, -8.06292724609375, -7.8446044921875, -7.62628173828125, -7.407958984375, -7.18963623046875, -6.9713134765625, -6.75299072265625, -6.53466796875, -6.31634521484375, -6.0980224609375, -5.87969970703125, -5.661376953125, -5.44305419921875, -5.2247314453125, -5.00640869140625, -4.7880859375, -4.56976318359375, -4.3514404296875, -4.13311767578125, -3.914794921875, -3.69647216796875, -3.4781494140625, -3.25982666015625, -3.04150390625, -2.82318115234375, -2.6048583984375, -2.38653564453125, -2.168212890625, -1.94989013671875, -1.7315673828125, -1.51324462890625, -1.294921875, -1.07659912109375, -0.8582763671875, -0.63995361328125, -0.421630859375, -0.20330810546875, 0.0150146484375, 0.23333740234375, 0.45166015625, 0.66998291015625, 0.8883056640625, 1.10662841796875, 1.324951171875, 1.54327392578125, 1.7615966796875, 1.97991943359375, 2.1982421875, 2.41656494140625, 2.6348876953125, 2.85321044921875, 3.071533203125, 3.28985595703125, 3.5081787109375, 3.72650146484375, 3.94482421875, 4.16314697265625, 4.3814697265625, 4.59979248046875, 4.818115234375, 5.03643798828125, 5.2547607421875, 5.47308349609375, 5.69140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 12.0, 11.0, 11.0, 16.0, 37.0, 42.0, 67.0, 88.0, 113.0, 160.0, 115.0, 107.0, 58.0, 56.0, 23.0, 33.0, 8.0, 13.0, 11.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009918212890625, -0.0009691119194030762, -0.0009464025497436523, -0.0009236931800842285, -0.0009009838104248047, -0.0008782744407653809, -0.000855565071105957, -0.0008328557014465332, -0.0008101463317871094, -0.0007874369621276855, -0.0007647275924682617, -0.0007420182228088379, -0.0007193088531494141, -0.0006965994834899902, -0.0006738901138305664, -0.0006511807441711426, -0.0006284713745117188, -0.0006057620048522949, -0.0005830526351928711, -0.0005603432655334473, -0.0005376338958740234, -0.0005149245262145996, -0.0004922151565551758, -0.00046950578689575195, -0.0004467964172363281, -0.0004240870475769043, -0.00040137767791748047, -0.00037866830825805664, -0.0003559589385986328, -0.000333249568939209, -0.00031054019927978516, -0.00028783082962036133, -0.0002651214599609375, -0.00024241209030151367, -0.00021970272064208984, -0.00019699335098266602, -0.0001742839813232422, -0.00015157461166381836, -0.00012886524200439453, -0.0001061558723449707, -8.344650268554688e-05, -6.073713302612305e-05, -3.802776336669922e-05, -1.531839370727539e-05, 7.3909759521484375e-06, 3.0100345611572266e-05, 5.2809715270996094e-05, 7.551908493041992e-05, 9.822845458984375e-05, 0.00012093782424926758, 0.0001436471939086914, 0.00016635656356811523, 0.00018906593322753906, 0.0002117753028869629, 0.00023448467254638672, 0.00025719404220581055, 0.0002799034118652344, 0.0003026127815246582, 0.00032532215118408203, 0.00034803152084350586, 0.0003707408905029297, 0.0003934502601623535, 0.00041615962982177734, 0.00043886899948120117, 0.000461578369140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 17.0, 19.0, 49.0, 61.0, 67.0, 132.0, 205.0, 319.0, 609.0, 1138.0, 2397.0, 5463.0, 13943.0, 41281.0, 143006.0, 463753.0, 267905.0, 71188.0, 22189.0, 8051.0, 3376.0, 1516.0, 770.0, 405.0, 234.0, 144.0, 103.0, 56.0, 39.0, 32.0, 19.0, 12.0, 6.0, 3.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.3875732421875, -4.239990234375, -4.0924072265625, -3.94482421875, -3.7972412109375, -3.649658203125, -3.5020751953125, -3.3544921875, -3.2069091796875, -3.059326171875, -2.9117431640625, -2.76416015625, -2.6165771484375, -2.468994140625, -2.3214111328125, -2.173828125, -2.0262451171875, -1.878662109375, -1.7310791015625, -1.58349609375, -1.4359130859375, -1.288330078125, -1.1407470703125, -0.9931640625, -0.8455810546875, -0.697998046875, -0.5504150390625, -0.40283203125, -0.2552490234375, -0.107666015625, 0.0399169921875, 0.1875, 0.3350830078125, 0.482666015625, 0.6302490234375, 0.77783203125, 0.9254150390625, 1.072998046875, 1.2205810546875, 1.3681640625, 1.5157470703125, 1.663330078125, 1.8109130859375, 1.95849609375, 2.1060791015625, 2.253662109375, 2.4012451171875, 2.548828125, 2.6964111328125, 2.843994140625, 2.9915771484375, 3.13916015625, 3.2867431640625, 3.434326171875, 3.5819091796875, 3.7294921875, 3.8770751953125, 4.024658203125, 4.1722412109375, 4.31982421875, 4.4674072265625, 4.614990234375, 4.7625732421875, 4.91015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 7.0, 10.0, 17.0, 14.0, 13.0, 21.0, 25.0, 26.0, 31.0, 31.0, 41.0, 55.0, 52.0, 55.0, 64.0, 72.0, 58.0, 50.0, 51.0, 38.0, 31.0, 41.0, 33.0, 23.0, 17.0, 16.0, 19.0, 15.0, 13.0, 8.0, 7.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.681640625, -2.6031494140625, -2.524658203125, -2.4461669921875, -2.36767578125, -2.2891845703125, -2.210693359375, -2.1322021484375, -2.0537109375, -1.9752197265625, -1.896728515625, -1.8182373046875, -1.73974609375, -1.6612548828125, -1.582763671875, -1.5042724609375, -1.42578125, -1.3472900390625, -1.268798828125, -1.1903076171875, -1.11181640625, -1.0333251953125, -0.954833984375, -0.8763427734375, -0.7978515625, -0.7193603515625, -0.640869140625, -0.5623779296875, -0.48388671875, -0.4053955078125, -0.326904296875, -0.2484130859375, -0.169921875, -0.0914306640625, -0.012939453125, 0.0655517578125, 0.14404296875, 0.2225341796875, 0.301025390625, 0.3795166015625, 0.4580078125, 0.5364990234375, 0.614990234375, 0.6934814453125, 0.77197265625, 0.8504638671875, 0.928955078125, 1.0074462890625, 1.0859375, 1.1644287109375, 1.242919921875, 1.3214111328125, 1.39990234375, 1.4783935546875, 1.556884765625, 1.6353759765625, 1.7138671875, 1.7923583984375, 1.870849609375, 1.9493408203125, 2.02783203125, 2.1063232421875, 2.184814453125, 2.2633056640625, 2.341796875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 12.0, 15.0, 47.0, 61.0, 139.0, 250.0, 232.0, 101.0, 74.0, 33.0, 6.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.492095947265625, -48.19110870361328, -45.89012145996094, -43.589134216308594, -41.28814697265625, -38.987159729003906, -36.68617248535156, -34.38518524169922, -32.084197998046875, -29.78321075439453, -27.482223510742188, -25.181236267089844, -22.8802490234375, -20.579261779785156, -18.278274536132812, -15.977287292480469, -13.676300048828125, -11.375312805175781, -9.074325561523438, -6.773338317871094, -4.47235107421875, -2.1713638305664062, 0.1296234130859375, 2.4306106567382812, 4.731597900390625, 7.032585144042969, 9.333572387695312, 11.634559631347656, 13.935546875, 16.236534118652344, 18.537521362304688, 20.83850860595703, 23.139495849609375, 25.44048309326172, 27.741470336914062, 30.042457580566406, 32.34344482421875, 34.644432067871094, 36.94541931152344, 39.24640655517578, 41.547393798828125, 43.84838104248047, 46.14936828613281, 48.450355529785156, 50.7513427734375, 53.052330017089844, 55.35331726074219, 57.65430450439453, 59.955291748046875, 62.25627899169922, 64.55726623535156, 66.8582534790039, 69.15924072265625, 71.4602279663086, 73.76121520996094, 76.06220245361328, 78.36318969726562, 80.66417694091797, 82.96516418457031, 85.26615142822266, 87.567138671875, 89.86812591552734, 92.16911315917969, 94.47010040283203, 96.77108764648438]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 15.0, 22.0, 19.0, 21.0, 31.0, 43.0, 40.0, 39.0, 52.0, 46.0, 75.0, 69.0, 59.0, 41.0, 65.0, 60.0, 39.0, 55.0, 37.0, 27.0, 25.0, 18.0, 15.0, 14.0, 14.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.827789306640625, -33.273231506347656, -31.718669891357422, -30.16411018371582, -28.60955047607422, -27.054990768432617, -25.500431060791016, -23.945873260498047, -22.391311645507812, -20.83675193786621, -19.28219223022461, -17.727632522583008, -16.173072814941406, -14.618513107299805, -13.06395435333252, -11.509394645690918, -9.954835891723633, -8.400276184082031, -6.84571647644043, -5.291157245635986, -3.7365975379943848, -2.182037830352783, -0.6274785995483398, 0.9270811080932617, 2.4816408157348633, 4.036200523376465, 5.590760231018066, 7.14531946182251, 8.699878692626953, 10.254438400268555, 11.808998107910156, 13.363557815551758, 14.91811752319336, 16.47267723083496, 18.027236938476562, 19.581796646118164, 21.136356353759766, 22.690916061401367, 24.24547576904297, 25.800033569335938, 27.354595184326172, 28.909154891967773, 30.463714599609375, 32.018272399902344, 33.57283401489258, 35.12739181518555, 36.68195343017578, 38.23651123046875, 39.79106903076172, 41.34562683105469, 42.90018844604492, 44.45474624633789, 46.009307861328125, 47.563865661621094, 49.11842727661133, 50.6729850769043, 52.22754669189453, 53.7821044921875, 55.336666107177734, 56.8912239074707, 58.44578552246094, 60.000343322753906, 61.55490493774414, 63.10946273803711, 64.66402435302734]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 8.0, 6.0, 5.0, 12.0, 21.0, 26.0, 47.0, 83.0, 135.0, 276.0, 533.0, 1194.0, 3073.0, 11035.0, 85584.0, 3882230.0, 181978.0, 18640.0, 5202.0, 2004.0, 914.0, 509.0, 252.0, 168.0, 108.0, 81.0, 51.0, 23.0, 27.0, 18.0, 12.0, 6.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.421875, -24.501708984375, -23.58154296875, -22.661376953125, -21.7412109375, -20.821044921875, -19.90087890625, -18.980712890625, -18.060546875, -17.140380859375, -16.22021484375, -15.300048828125, -14.3798828125, -13.459716796875, -12.53955078125, -11.619384765625, -10.69921875, -9.779052734375, -8.85888671875, -7.938720703125, -7.0185546875, -6.098388671875, -5.17822265625, -4.258056640625, -3.337890625, -2.417724609375, -1.49755859375, -0.577392578125, 0.3427734375, 1.262939453125, 2.18310546875, 3.103271484375, 4.0234375, 4.943603515625, 5.86376953125, 6.783935546875, 7.7041015625, 8.624267578125, 9.54443359375, 10.464599609375, 11.384765625, 12.304931640625, 13.22509765625, 14.145263671875, 15.0654296875, 15.985595703125, 16.90576171875, 17.825927734375, 18.74609375, 19.666259765625, 20.58642578125, 21.506591796875, 22.4267578125, 23.346923828125, 24.26708984375, 25.187255859375, 26.107421875, 27.027587890625, 27.94775390625, 28.867919921875, 29.7880859375, 30.708251953125, 31.62841796875, 32.548583984375, 33.46875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 11.0, 19.0, 23.0, 18.0, 28.0, 44.0, 53.0, 79.0, 80.0, 92.0, 82.0, 83.0, 77.0, 53.0, 61.0, 48.0, 41.0, 19.0, 17.0, 13.0, 15.0, 8.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.3499603271484375, -1.297576904296875, -1.2451934814453125, -1.19281005859375, -1.1404266357421875, -1.088043212890625, -1.0356597900390625, -0.9832763671875, -0.9308929443359375, -0.878509521484375, -0.8261260986328125, -0.77374267578125, -0.7213592529296875, -0.668975830078125, -0.6165924072265625, -0.564208984375, -0.5118255615234375, -0.459442138671875, -0.4070587158203125, -0.35467529296875, -0.3022918701171875, -0.249908447265625, -0.1975250244140625, -0.1451416015625, -0.0927581787109375, -0.040374755859375, 0.0120086669921875, 0.06439208984375, 0.1167755126953125, 0.169158935546875, 0.2215423583984375, 0.27392578125, 0.3263092041015625, 0.378692626953125, 0.4310760498046875, 0.48345947265625, 0.5358428955078125, 0.588226318359375, 0.6406097412109375, 0.6929931640625, 0.7453765869140625, 0.797760009765625, 0.8501434326171875, 0.90252685546875, 0.9549102783203125, 1.007293701171875, 1.0596771240234375, 1.112060546875, 1.1644439697265625, 1.216827392578125, 1.2692108154296875, 1.32159423828125, 1.3739776611328125, 1.426361083984375, 1.4787445068359375, 1.5311279296875, 1.5835113525390625, 1.635894775390625, 1.6882781982421875, 1.74066162109375, 1.7930450439453125, 1.845428466796875, 1.8978118896484375, 1.9501953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 5.0, 1.0, 8.0, 8.0, 18.0, 31.0, 38.0, 39.0, 104.0, 129.0, 246.0, 380.0, 656.0, 1353.0, 2850.0, 6742.0, 18473.0, 68245.0, 495158.0, 3289120.0, 244965.0, 43920.0, 12730.0, 4723.0, 2039.0, 1020.0, 518.0, 287.0, 167.0, 106.0, 65.0, 45.0, 32.0, 16.0, 12.0, 14.0, 9.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3125, -11.943359375, -11.57421875, -11.205078125, -10.8359375, -10.466796875, -10.09765625, -9.728515625, -9.359375, -8.990234375, -8.62109375, -8.251953125, -7.8828125, -7.513671875, -7.14453125, -6.775390625, -6.40625, -6.037109375, -5.66796875, -5.298828125, -4.9296875, -4.560546875, -4.19140625, -3.822265625, -3.453125, -3.083984375, -2.71484375, -2.345703125, -1.9765625, -1.607421875, -1.23828125, -0.869140625, -0.5, -0.130859375, 0.23828125, 0.607421875, 0.9765625, 1.345703125, 1.71484375, 2.083984375, 2.453125, 2.822265625, 3.19140625, 3.560546875, 3.9296875, 4.298828125, 4.66796875, 5.037109375, 5.40625, 5.775390625, 6.14453125, 6.513671875, 6.8828125, 7.251953125, 7.62109375, 7.990234375, 8.359375, 8.728515625, 9.09765625, 9.466796875, 9.8359375, 10.205078125, 10.57421875, 10.943359375, 11.3125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 4.0, 8.0, 5.0, 16.0, 22.0, 24.0, 39.0, 68.0, 68.0, 114.0, 222.0, 509.0, 1559.0, 687.0, 314.0, 154.0, 85.0, 53.0, 46.0, 26.0, 12.0, 13.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55859375, -4.443450927734375, -4.32830810546875, -4.213165283203125, -4.0980224609375, -3.982879638671875, -3.86773681640625, -3.752593994140625, -3.637451171875, -3.522308349609375, -3.40716552734375, -3.292022705078125, -3.1768798828125, -3.061737060546875, -2.94659423828125, -2.831451416015625, -2.71630859375, -2.601165771484375, -2.48602294921875, -2.370880126953125, -2.2557373046875, -2.140594482421875, -2.02545166015625, -1.910308837890625, -1.795166015625, -1.680023193359375, -1.56488037109375, -1.449737548828125, -1.3345947265625, -1.219451904296875, -1.10430908203125, -0.989166259765625, -0.8740234375, -0.758880615234375, -0.64373779296875, -0.528594970703125, -0.4134521484375, -0.298309326171875, -0.18316650390625, -0.068023681640625, 0.047119140625, 0.162261962890625, 0.27740478515625, 0.392547607421875, 0.5076904296875, 0.622833251953125, 0.73797607421875, 0.853118896484375, 0.96826171875, 1.083404541015625, 1.19854736328125, 1.313690185546875, 1.4288330078125, 1.543975830078125, 1.65911865234375, 1.774261474609375, 1.889404296875, 2.004547119140625, 2.11968994140625, 2.234832763671875, 2.3499755859375, 2.465118408203125, 2.58026123046875, 2.695404052734375, 2.810546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 26.0, 58.0, 129.0, 226.0, 269.0, 161.0, 61.0, 30.0, 14.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.090229034423828, -17.23044204711914, -16.370656967163086, -15.510869979858398, -14.651083946228027, -13.791297912597656, -12.931510925292969, -12.071724891662598, -11.211938858032227, -10.352152824401855, -9.492365837097168, -8.632579803466797, -7.772793769836426, -6.9130072593688965, -6.053220748901367, -5.193434715270996, -4.333647727966309, -3.4738614559173584, -2.614075183868408, -1.754288673400879, -0.8945024013519287, -0.034716129302978516, 0.8250703811645508, 1.6848564147949219, 2.544642925262451, 3.4044291973114014, 4.264215469360352, 5.124001979827881, 5.98378849029541, 6.843574523925781, 7.7033610343933105, 8.563146591186523, 9.422933578491211, 10.282719612121582, 11.14250659942627, 12.00229263305664, 12.862078666687012, 13.721864700317383, 14.58165168762207, 15.441437721252441, 16.301223754882812, 17.1610107421875, 18.020795822143555, 18.880582809448242, 19.74036979675293, 20.600154876708984, 21.459941864013672, 22.31972885131836, 23.179515838623047, 24.039302825927734, 24.89908790588379, 25.758874893188477, 26.618661880493164, 27.47844696044922, 28.338233947753906, 29.198020935058594, 30.05780601501465, 30.917593002319336, 31.77737808227539, 32.63716506958008, 33.496952056884766, 34.35673904418945, 35.216522216796875, 36.07630920410156, 36.93609619140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 7.0, 12.0, 8.0, 11.0, 16.0, 20.0, 24.0, 12.0, 24.0, 33.0, 35.0, 31.0, 39.0, 34.0, 49.0, 66.0, 40.0, 69.0, 40.0, 34.0, 39.0, 51.0, 36.0, 31.0, 29.0, 35.0, 27.0, 18.0, 20.0, 13.0, 23.0, 8.0, 10.0, 9.0, 9.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.776859283447266, -11.430984497070312, -11.085108757019043, -10.739233016967773, -10.39335823059082, -10.047483444213867, -9.701607704162598, -9.355731964111328, -9.009857177734375, -8.663982391357422, -8.318106651306152, -7.972231388092041, -7.62635612487793, -7.280480861663818, -6.934605598449707, -6.588730335235596, -6.242855072021484, -5.896979808807373, -5.551104545593262, -5.20522928237915, -4.859354019165039, -4.513478755950928, -4.167603492736816, -3.821728229522705, -3.4758529663085938, -3.1299777030944824, -2.784102439880371, -2.4382271766662598, -2.0923519134521484, -1.746476650238037, -1.4006013870239258, -1.0547261238098145, -0.7088508605957031, -0.3629755973815918, -0.01710033416748047, 0.32877492904663086, 0.6746501922607422, 1.0205254554748535, 1.3664007186889648, 1.7122759819030762, 2.0581512451171875, 2.404026508331299, 2.74990177154541, 3.0957770347595215, 3.441652297973633, 3.787527561187744, 4.1334028244018555, 4.479278087615967, 4.825153350830078, 5.1710286140441895, 5.516903877258301, 5.862779140472412, 6.208654403686523, 6.554529666900635, 6.900404930114746, 7.246280193328857, 7.592155456542969, 7.93803071975708, 8.283905982971191, 8.629781723022461, 8.975656509399414, 9.321531295776367, 9.667407035827637, 10.013282775878906, 10.35915756225586]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 23.0, 50.0, 44.0, 75.0, 133.0, 271.0, 497.0, 1091.0, 2540.0, 7323.0, 29743.0, 171994.0, 617216.0, 175199.0, 29893.0, 7704.0, 2585.0, 1036.0, 475.0, 253.0, 142.0, 67.0, 45.0, 34.0, 28.0, 17.0, 11.0, 8.0, 3.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.7271728515625, -10.337158203125, -9.9471435546875, -9.55712890625, -9.1671142578125, -8.777099609375, -8.3870849609375, -7.9970703125, -7.6070556640625, -7.217041015625, -6.8270263671875, -6.43701171875, -6.0469970703125, -5.656982421875, -5.2669677734375, -4.876953125, -4.4869384765625, -4.096923828125, -3.7069091796875, -3.31689453125, -2.9268798828125, -2.536865234375, -2.1468505859375, -1.7568359375, -1.3668212890625, -0.976806640625, -0.5867919921875, -0.19677734375, 0.1932373046875, 0.583251953125, 0.9732666015625, 1.36328125, 1.7532958984375, 2.143310546875, 2.5333251953125, 2.92333984375, 3.3133544921875, 3.703369140625, 4.0933837890625, 4.4833984375, 4.8734130859375, 5.263427734375, 5.6534423828125, 6.04345703125, 6.4334716796875, 6.823486328125, 7.2135009765625, 7.603515625, 7.9935302734375, 8.383544921875, 8.7735595703125, 9.16357421875, 9.5535888671875, 9.943603515625, 10.3336181640625, 10.7236328125, 11.1136474609375, 11.503662109375, 11.8936767578125, 12.28369140625, 12.6737060546875, 13.063720703125, 13.4537353515625, 13.84375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 6.0, 12.0, 19.0, 30.0, 28.0, 49.0, 63.0, 77.0, 66.0, 112.0, 100.0, 88.0, 81.0, 90.0, 48.0, 43.0, 33.0, 14.0, 10.0, 12.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.439666748046875, -1.37542724609375, -1.311187744140625, -1.2469482421875, -1.182708740234375, -1.11846923828125, -1.054229736328125, -0.989990234375, -0.925750732421875, -0.86151123046875, -0.797271728515625, -0.7330322265625, -0.668792724609375, -0.60455322265625, -0.540313720703125, -0.47607421875, -0.411834716796875, -0.34759521484375, -0.283355712890625, -0.2191162109375, -0.154876708984375, -0.09063720703125, -0.026397705078125, 0.037841796875, 0.102081298828125, 0.16632080078125, 0.230560302734375, 0.2947998046875, 0.359039306640625, 0.42327880859375, 0.487518310546875, 0.5517578125, 0.615997314453125, 0.68023681640625, 0.744476318359375, 0.8087158203125, 0.872955322265625, 0.93719482421875, 1.001434326171875, 1.065673828125, 1.129913330078125, 1.19415283203125, 1.258392333984375, 1.3226318359375, 1.386871337890625, 1.45111083984375, 1.515350341796875, 1.57958984375, 1.643829345703125, 1.70806884765625, 1.772308349609375, 1.8365478515625, 1.900787353515625, 1.96502685546875, 2.029266357421875, 2.093505859375, 2.157745361328125, 2.22198486328125, 2.286224365234375, 2.3504638671875, 2.414703369140625, 2.47894287109375, 2.543182373046875, 2.607421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 20.0, 22.0, 28.0, 44.0, 63.0, 89.0, 108.0, 171.0, 274.0, 416.0, 608.0, 1110.0, 1913.0, 3431.0, 6710.0, 13990.0, 32021.0, 77460.0, 207907.0, 374866.0, 195586.0, 73834.0, 29861.0, 13486.0, 6581.0, 3308.0, 1770.0, 1027.0, 602.0, 393.0, 255.0, 154.0, 131.0, 73.0, 60.0, 43.0, 24.0, 17.0, 23.0, 12.0, 11.0, 8.0, 5.0, 8.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-6.7265625, -6.51934814453125, -6.3121337890625, -6.10491943359375, -5.897705078125, -5.69049072265625, -5.4832763671875, -5.27606201171875, -5.06884765625, -4.86163330078125, -4.6544189453125, -4.44720458984375, -4.239990234375, -4.03277587890625, -3.8255615234375, -3.61834716796875, -3.4111328125, -3.20391845703125, -2.9967041015625, -2.78948974609375, -2.582275390625, -2.37506103515625, -2.1678466796875, -1.96063232421875, -1.75341796875, -1.54620361328125, -1.3389892578125, -1.13177490234375, -0.924560546875, -0.71734619140625, -0.5101318359375, -0.30291748046875, -0.095703125, 0.11151123046875, 0.3187255859375, 0.52593994140625, 0.733154296875, 0.94036865234375, 1.1475830078125, 1.35479736328125, 1.56201171875, 1.76922607421875, 1.9764404296875, 2.18365478515625, 2.390869140625, 2.59808349609375, 2.8052978515625, 3.01251220703125, 3.2197265625, 3.42694091796875, 3.6341552734375, 3.84136962890625, 4.048583984375, 4.25579833984375, 4.4630126953125, 4.67022705078125, 4.87744140625, 5.08465576171875, 5.2918701171875, 5.49908447265625, 5.706298828125, 5.91351318359375, 6.1207275390625, 6.32794189453125, 6.53515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 1.0, 5.0, 12.0, 13.0, 8.0, 12.0, 19.0, 27.0, 26.0, 21.0, 31.0, 33.0, 22.0, 35.0, 24.0, 43.0, 43.0, 51.0, 56.0, 54.0, 60.0, 49.0, 36.0, 47.0, 39.0, 34.0, 35.0, 22.0, 23.0, 28.0, 14.0, 10.0, 14.0, 14.0, 10.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.1328125, -6.919189453125, -6.70556640625, -6.491943359375, -6.2783203125, -6.064697265625, -5.85107421875, -5.637451171875, -5.423828125, -5.210205078125, -4.99658203125, -4.782958984375, -4.5693359375, -4.355712890625, -4.14208984375, -3.928466796875, -3.71484375, -3.501220703125, -3.28759765625, -3.073974609375, -2.8603515625, -2.646728515625, -2.43310546875, -2.219482421875, -2.005859375, -1.792236328125, -1.57861328125, -1.364990234375, -1.1513671875, -0.937744140625, -0.72412109375, -0.510498046875, -0.296875, -0.083251953125, 0.13037109375, 0.343994140625, 0.5576171875, 0.771240234375, 0.98486328125, 1.198486328125, 1.412109375, 1.625732421875, 1.83935546875, 2.052978515625, 2.2666015625, 2.480224609375, 2.69384765625, 2.907470703125, 3.12109375, 3.334716796875, 3.54833984375, 3.761962890625, 3.9755859375, 4.189208984375, 4.40283203125, 4.616455078125, 4.830078125, 5.043701171875, 5.25732421875, 5.470947265625, 5.6845703125, 5.898193359375, 6.11181640625, 6.325439453125, 6.5390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 12.0, 15.0, 17.0, 22.0, 30.0, 49.0, 64.0, 125.0, 234.0, 434.0, 999.0, 2818.0, 10613.0, 53690.0, 335857.0, 528237.0, 91699.0, 16849.0, 4211.0, 1345.0, 561.0, 262.0, 142.0, 87.0, 55.0, 36.0, 25.0, 15.0, 6.0, 16.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.4837646484375, -5.295654296875, -5.1075439453125, -4.91943359375, -4.7313232421875, -4.543212890625, -4.3551025390625, -4.1669921875, -3.9788818359375, -3.790771484375, -3.6026611328125, -3.41455078125, -3.2264404296875, -3.038330078125, -2.8502197265625, -2.662109375, -2.4739990234375, -2.285888671875, -2.0977783203125, -1.90966796875, -1.7215576171875, -1.533447265625, -1.3453369140625, -1.1572265625, -0.9691162109375, -0.781005859375, -0.5928955078125, -0.40478515625, -0.2166748046875, -0.028564453125, 0.1595458984375, 0.34765625, 0.5357666015625, 0.723876953125, 0.9119873046875, 1.10009765625, 1.2882080078125, 1.476318359375, 1.6644287109375, 1.8525390625, 2.0406494140625, 2.228759765625, 2.4168701171875, 2.60498046875, 2.7930908203125, 2.981201171875, 3.1693115234375, 3.357421875, 3.5455322265625, 3.733642578125, 3.9217529296875, 4.10986328125, 4.2979736328125, 4.486083984375, 4.6741943359375, 4.8623046875, 5.0504150390625, 5.238525390625, 5.4266357421875, 5.61474609375, 5.8028564453125, 5.990966796875, 6.1790771484375, 6.3671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 7.0, 16.0, 14.0, 15.0, 22.0, 49.0, 39.0, 41.0, 67.0, 86.0, 108.0, 93.0, 68.0, 66.0, 55.0, 41.0, 47.0, 29.0, 23.0, 16.0, 16.0, 13.0, 13.0, 9.0, 6.0, 3.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003540515899658203, -0.00033976510167121887, -0.00032547861337661743, -0.000311192125082016, -0.00029690563678741455, -0.0002826191484928131, -0.00026833266019821167, -0.00025404617190361023, -0.0002397596836090088, -0.00022547319531440735, -0.0002111867070198059, -0.00019690021872520447, -0.00018261373043060303, -0.0001683272421360016, -0.00015404075384140015, -0.0001397542655467987, -0.00012546777725219727, -0.00011118128895759583, -9.689480066299438e-05, -8.260831236839294e-05, -6.83218240737915e-05, -5.4035335779190063e-05, -3.974884748458862e-05, -2.5462359189987183e-05, -1.1175870895385742e-05, 3.1106173992156982e-06, 1.739710569381714e-05, 3.168359398841858e-05, 4.597008228302002e-05, 6.025657057762146e-05, 7.45430588722229e-05, 8.882954716682434e-05, 0.00010311603546142578, 0.00011740252375602722, 0.00013168901205062866, 0.0001459755003452301, 0.00016026198863983154, 0.00017454847693443298, 0.00018883496522903442, 0.00020312145352363586, 0.0002174079418182373, 0.00023169443011283875, 0.0002459809184074402, 0.0002602674067020416, 0.00027455389499664307, 0.0002888403832912445, 0.00030312687158584595, 0.0003174133598804474, 0.00033169984817504883, 0.00034598633646965027, 0.0003602728247642517, 0.00037455931305885315, 0.0003888458013534546, 0.00040313228964805603, 0.00041741877794265747, 0.0004317052662372589, 0.00044599175453186035, 0.0004602782428264618, 0.00047456473112106323, 0.0004888512194156647, 0.0005031377077102661, 0.0005174241960048676, 0.000531710684299469, 0.0005459971725940704, 0.0005602836608886719]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 13.0, 9.0, 12.0, 26.0, 27.0, 37.0, 52.0, 78.0, 113.0, 157.0, 258.0, 447.0, 749.0, 1329.0, 2662.0, 5699.0, 13907.0, 37344.0, 106351.0, 347689.0, 358856.0, 108794.0, 37793.0, 14215.0, 5910.0, 2658.0, 1358.0, 734.0, 422.0, 286.0, 186.0, 109.0, 73.0, 59.0, 34.0, 30.0, 17.0, 15.0, 17.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.99609375, -3.86724853515625, -3.7384033203125, -3.60955810546875, -3.480712890625, -3.35186767578125, -3.2230224609375, -3.09417724609375, -2.96533203125, -2.83648681640625, -2.7076416015625, -2.57879638671875, -2.449951171875, -2.32110595703125, -2.1922607421875, -2.06341552734375, -1.9345703125, -1.80572509765625, -1.6768798828125, -1.54803466796875, -1.419189453125, -1.29034423828125, -1.1614990234375, -1.03265380859375, -0.90380859375, -0.77496337890625, -0.6461181640625, -0.51727294921875, -0.388427734375, -0.25958251953125, -0.1307373046875, -0.00189208984375, 0.126953125, 0.25579833984375, 0.3846435546875, 0.51348876953125, 0.642333984375, 0.77117919921875, 0.9000244140625, 1.02886962890625, 1.15771484375, 1.28656005859375, 1.4154052734375, 1.54425048828125, 1.673095703125, 1.80194091796875, 1.9307861328125, 2.05963134765625, 2.1884765625, 2.31732177734375, 2.4461669921875, 2.57501220703125, 2.703857421875, 2.83270263671875, 2.9615478515625, 3.09039306640625, 3.21923828125, 3.34808349609375, 3.4769287109375, 3.60577392578125, 3.734619140625, 3.86346435546875, 3.9923095703125, 4.12115478515625, 4.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 5.0, 7.0, 6.0, 15.0, 13.0, 14.0, 17.0, 16.0, 35.0, 31.0, 53.0, 57.0, 60.0, 50.0, 76.0, 90.0, 86.0, 74.0, 53.0, 41.0, 45.0, 19.0, 23.0, 24.0, 11.0, 15.0, 14.0, 12.0, 8.0, 7.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.201995849609375, -3.09735107421875, -2.992706298828125, -2.8880615234375, -2.783416748046875, -2.67877197265625, -2.574127197265625, -2.469482421875, -2.364837646484375, -2.26019287109375, -2.155548095703125, -2.0509033203125, -1.946258544921875, -1.84161376953125, -1.736968994140625, -1.63232421875, -1.527679443359375, -1.42303466796875, -1.318389892578125, -1.2137451171875, -1.109100341796875, -1.00445556640625, -0.899810791015625, -0.795166015625, -0.690521240234375, -0.58587646484375, -0.481231689453125, -0.3765869140625, -0.271942138671875, -0.16729736328125, -0.062652587890625, 0.0419921875, 0.146636962890625, 0.25128173828125, 0.355926513671875, 0.4605712890625, 0.565216064453125, 0.66986083984375, 0.774505615234375, 0.879150390625, 0.983795166015625, 1.08843994140625, 1.193084716796875, 1.2977294921875, 1.402374267578125, 1.50701904296875, 1.611663818359375, 1.71630859375, 1.820953369140625, 1.92559814453125, 2.030242919921875, 2.1348876953125, 2.239532470703125, 2.34417724609375, 2.448822021484375, 2.553466796875, 2.658111572265625, 2.76275634765625, 2.867401123046875, 2.9720458984375, 3.076690673828125, 3.18133544921875, 3.285980224609375, 3.390625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 8.0, 25.0, 26.0, 59.0, 148.0, 202.0, 225.0, 136.0, 77.0, 39.0, 21.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.62757110595703, -53.079689025878906, -50.531803131103516, -47.983917236328125, -45.43603515625, -42.888153076171875, -40.340267181396484, -37.792381286621094, -35.24449920654297, -32.696617126464844, -30.148731231689453, -27.600847244262695, -25.052963256835938, -22.50507926940918, -19.957195281982422, -17.409311294555664, -14.861427307128906, -12.313543319702148, -9.76565933227539, -7.217775344848633, -4.669891357421875, -2.122007369995117, 0.4258766174316406, 2.9737606048583984, 5.521644592285156, 8.069528579711914, 10.617412567138672, 13.16529655456543, 15.713180541992188, 18.261064529418945, 20.808948516845703, 23.35683250427246, 25.90472412109375, 28.452608108520508, 31.000492095947266, 33.548377990722656, 36.09626007080078, 38.644142150878906, 41.1920280456543, 43.73991394042969, 46.28779602050781, 48.83567810058594, 51.38356399536133, 53.93144989013672, 56.479331970214844, 59.02721405029297, 61.57509994506836, 64.12298583984375, 66.67086791992188, 69.21875, 71.76663208007812, 74.31452178955078, 76.8624038696289, 79.41028594970703, 81.95817565917969, 84.50605773925781, 87.05393981933594, 89.60182189941406, 92.14970397949219, 94.69759368896484, 97.24547576904297, 99.7933578491211, 102.34124755859375, 104.88912963867188, 107.43701171875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 7.0, 11.0, 13.0, 14.0, 16.0, 20.0, 17.0, 22.0, 38.0, 29.0, 31.0, 37.0, 36.0, 51.0, 43.0, 49.0, 56.0, 51.0, 41.0, 45.0, 57.0, 48.0, 29.0, 39.0, 27.0, 27.0, 28.0, 21.0, 18.0, 20.0, 11.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-52.24089813232422, -50.60310745239258, -48.96531677246094, -47.32752990722656, -45.68973922729492, -44.05194854736328, -42.414161682128906, -40.776371002197266, -39.138580322265625, -37.500789642333984, -35.862998962402344, -34.22521209716797, -32.58742141723633, -30.949630737304688, -29.31184196472168, -27.674053192138672, -26.03626251220703, -24.39847183227539, -22.760683059692383, -21.122894287109375, -19.485103607177734, -17.847312927246094, -16.209524154663086, -14.571734428405762, -12.933944702148438, -11.296154975891113, -9.658365249633789, -8.020575523376465, -6.382785797119141, -4.744996070861816, -3.107206344604492, -1.469416618347168, 0.16836929321289062, 1.8061590194702148, 3.443948745727539, 5.081738471984863, 6.7195281982421875, 8.357317924499512, 9.995107650756836, 11.63289737701416, 13.270687103271484, 14.908476829528809, 16.546266555786133, 18.18405532836914, 19.82184600830078, 21.459636688232422, 23.09742546081543, 24.735214233398438, 26.373004913330078, 28.01079559326172, 29.648584365844727, 31.286373138427734, 32.924163818359375, 34.561954498291016, 36.199745178222656, 37.83753204345703, 39.47532272338867, 41.11311340332031, 42.75090026855469, 44.38869094848633, 46.02648162841797, 47.66427230834961, 49.30206298828125, 50.939849853515625, 52.577640533447266]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 4.0, 10.0, 17.0, 22.0, 32.0, 36.0, 42.0, 77.0, 148.0, 211.0, 408.0, 977.0, 2394.0, 8247.0, 45767.0, 3705099.0, 398477.0, 23590.0, 5306.0, 1725.0, 771.0, 362.0, 191.0, 125.0, 73.0, 43.0, 30.0, 27.0, 12.0, 12.0, 13.0, 6.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.046875, -23.336181640625, -22.62548828125, -21.914794921875, -21.2041015625, -20.493408203125, -19.78271484375, -19.072021484375, -18.361328125, -17.650634765625, -16.93994140625, -16.229248046875, -15.5185546875, -14.807861328125, -14.09716796875, -13.386474609375, -12.67578125, -11.965087890625, -11.25439453125, -10.543701171875, -9.8330078125, -9.122314453125, -8.41162109375, -7.700927734375, -6.990234375, -6.279541015625, -5.56884765625, -4.858154296875, -4.1474609375, -3.436767578125, -2.72607421875, -2.015380859375, -1.3046875, -0.593994140625, 0.11669921875, 0.827392578125, 1.5380859375, 2.248779296875, 2.95947265625, 3.670166015625, 4.380859375, 5.091552734375, 5.80224609375, 6.512939453125, 7.2236328125, 7.934326171875, 8.64501953125, 9.355712890625, 10.06640625, 10.777099609375, 11.48779296875, 12.198486328125, 12.9091796875, 13.619873046875, 14.33056640625, 15.041259765625, 15.751953125, 16.462646484375, 17.17333984375, 17.884033203125, 18.5947265625, 19.305419921875, 20.01611328125, 20.726806640625, 21.4375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 7.0, 3.0, 5.0, 16.0, 9.0, 21.0, 29.0, 24.0, 23.0, 20.0, 42.0, 43.0, 29.0, 43.0, 42.0, 44.0, 76.0, 53.0, 68.0, 46.0, 45.0, 45.0, 42.0, 45.0, 23.0, 36.0, 31.0, 18.0, 11.0, 9.0, 11.0, 8.0, 8.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6484375, -1.5988922119140625, -1.549346923828125, -1.4998016357421875, -1.45025634765625, -1.4007110595703125, -1.351165771484375, -1.3016204833984375, -1.2520751953125, -1.2025299072265625, -1.152984619140625, -1.1034393310546875, -1.05389404296875, -1.0043487548828125, -0.954803466796875, -0.9052581787109375, -0.855712890625, -0.8061676025390625, -0.756622314453125, -0.7070770263671875, -0.65753173828125, -0.6079864501953125, -0.558441162109375, -0.5088958740234375, -0.4593505859375, -0.4098052978515625, -0.360260009765625, -0.3107147216796875, -0.26116943359375, -0.2116241455078125, -0.162078857421875, -0.1125335693359375, -0.06298828125, -0.0134429931640625, 0.036102294921875, 0.0856475830078125, 0.13519287109375, 0.1847381591796875, 0.234283447265625, 0.2838287353515625, 0.3333740234375, 0.3829193115234375, 0.432464599609375, 0.4820098876953125, 0.53155517578125, 0.5811004638671875, 0.630645751953125, 0.6801910400390625, 0.729736328125, 0.7792816162109375, 0.828826904296875, 0.8783721923828125, 0.92791748046875, 0.9774627685546875, 1.027008056640625, 1.0765533447265625, 1.1260986328125, 1.1756439208984375, 1.225189208984375, 1.2747344970703125, 1.32427978515625, 1.3738250732421875, 1.423370361328125, 1.4729156494140625, 1.5224609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 11.0, 19.0, 62.0, 100.0, 149.0, 327.0, 539.0, 991.0, 2011.0, 4614.0, 12769.0, 47098.0, 459913.0, 3481485.0, 145385.0, 25267.0, 7691.0, 3061.0, 1353.0, 659.0, 326.0, 191.0, 96.0, 55.0, 30.0, 19.0, 10.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.451904296875, -10.10693359375, -9.761962890625, -9.4169921875, -9.072021484375, -8.72705078125, -8.382080078125, -8.037109375, -7.692138671875, -7.34716796875, -7.002197265625, -6.6572265625, -6.312255859375, -5.96728515625, -5.622314453125, -5.27734375, -4.932373046875, -4.58740234375, -4.242431640625, -3.8974609375, -3.552490234375, -3.20751953125, -2.862548828125, -2.517578125, -2.172607421875, -1.82763671875, -1.482666015625, -1.1376953125, -0.792724609375, -0.44775390625, -0.102783203125, 0.2421875, 0.587158203125, 0.93212890625, 1.277099609375, 1.6220703125, 1.967041015625, 2.31201171875, 2.656982421875, 3.001953125, 3.346923828125, 3.69189453125, 4.036865234375, 4.3818359375, 4.726806640625, 5.07177734375, 5.416748046875, 5.76171875, 6.106689453125, 6.45166015625, 6.796630859375, 7.1416015625, 7.486572265625, 7.83154296875, 8.176513671875, 8.521484375, 8.866455078125, 9.21142578125, 9.556396484375, 9.9013671875, 10.246337890625, 10.59130859375, 10.936279296875, 11.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 13.0, 15.0, 14.0, 21.0, 28.0, 41.0, 61.0, 88.0, 196.0, 410.0, 1500.0, 935.0, 314.0, 144.0, 87.0, 52.0, 30.0, 30.0, 20.0, 9.0, 12.0, 6.0, 4.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15625, -3.06011962890625, -2.9639892578125, -2.86785888671875, -2.771728515625, -2.67559814453125, -2.5794677734375, -2.48333740234375, -2.38720703125, -2.29107666015625, -2.1949462890625, -2.09881591796875, -2.002685546875, -1.90655517578125, -1.8104248046875, -1.71429443359375, -1.6181640625, -1.52203369140625, -1.4259033203125, -1.32977294921875, -1.233642578125, -1.13751220703125, -1.0413818359375, -0.94525146484375, -0.84912109375, -0.75299072265625, -0.6568603515625, -0.56072998046875, -0.464599609375, -0.36846923828125, -0.2723388671875, -0.17620849609375, -0.080078125, 0.01605224609375, 0.1121826171875, 0.20831298828125, 0.304443359375, 0.40057373046875, 0.4967041015625, 0.59283447265625, 0.68896484375, 0.78509521484375, 0.8812255859375, 0.97735595703125, 1.073486328125, 1.16961669921875, 1.2657470703125, 1.36187744140625, 1.4580078125, 1.55413818359375, 1.6502685546875, 1.74639892578125, 1.842529296875, 1.93865966796875, 2.0347900390625, 2.13092041015625, 2.22705078125, 2.32318115234375, 2.4193115234375, 2.51544189453125, 2.611572265625, 2.70770263671875, 2.8038330078125, 2.89996337890625, 2.99609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 12.0, 16.0, 28.0, 56.0, 124.0, 170.0, 228.0, 174.0, 110.0, 37.0, 25.0, 12.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.380817413330078, -20.72154426574707, -20.062271118164062, -19.402996063232422, -18.743722915649414, -18.084449768066406, -17.425174713134766, -16.765901565551758, -16.10662841796875, -15.447355270385742, -14.788081169128418, -14.128807067871094, -13.469533920288086, -12.810260772705078, -12.150986671447754, -11.49171257019043, -10.832439422607422, -10.173166275024414, -9.51389217376709, -8.854618072509766, -8.195344924926758, -7.536071300506592, -6.876797676086426, -6.21752405166626, -5.558250427246094, -4.898976802825928, -4.239703178405762, -3.5804295539855957, -2.9211559295654297, -2.2618823051452637, -1.6026086807250977, -0.9433350563049316, -0.2840614318847656, 0.3752121925354004, 1.0344858169555664, 1.6937594413757324, 2.3530330657958984, 3.0123066902160645, 3.6715803146362305, 4.3308539390563965, 4.9901275634765625, 5.6494011878967285, 6.3086748123168945, 6.9679484367370605, 7.627222061157227, 8.286495208740234, 8.945769309997559, 9.605043411254883, 10.26431655883789, 10.923589706420898, 11.582863807678223, 12.242137908935547, 12.901411056518555, 13.560684204101562, 14.219958305358887, 14.879232406616211, 15.538505554199219, 16.197778701782227, 16.857051849365234, 17.516326904296875, 18.175600051879883, 18.83487319946289, 19.49414825439453, 20.15342140197754, 20.812694549560547]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 12.0, 19.0, 22.0, 22.0, 28.0, 44.0, 39.0, 54.0, 63.0, 42.0, 59.0, 68.0, 55.0, 54.0, 57.0, 51.0, 43.0, 40.0, 30.0, 34.0, 21.0, 26.0, 20.0, 19.0, 17.0, 10.0, 8.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.195487022399902, -8.793401718139648, -8.391315460205078, -7.989230155944824, -7.587144374847412, -7.18505859375, -6.782973289489746, -6.380887508392334, -5.978801727294922, -5.57671594619751, -5.174630165100098, -4.772544860839844, -4.370459079742432, -3.9683732986450195, -3.5662877559661865, -3.1642022132873535, -2.7621164321899414, -2.3600306510925293, -1.9579451084136963, -1.5558594465255737, -1.1537737846374512, -0.7516880035400391, -0.34960246086120605, 0.05248308181762695, 0.45456886291503906, 0.8566545248031616, 1.2587401866912842, 1.6608258485794067, 2.0629115104675293, 2.4649972915649414, 2.8670828342437744, 3.2691683769226074, 3.671253204345703, 4.073338985443115, 4.475424766540527, 4.877510070800781, 5.279595851898193, 5.6816816329956055, 6.083766937255859, 6.4858527183532715, 6.887938499450684, 7.290024280548096, 7.692110061645508, 8.094195365905762, 8.496280670166016, 8.898366928100586, 9.30045223236084, 9.702537536621094, 10.104623794555664, 10.506709098815918, 10.908795356750488, 11.310880661010742, 11.712966918945312, 12.115052223205566, 12.51713752746582, 12.91922378540039, 13.321309089660645, 13.723394393920898, 14.125480651855469, 14.527565956115723, 14.929651260375977, 15.331737518310547, 15.7338228225708, 16.135908126831055, 16.537994384765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 11.0, 10.0, 18.0, 33.0, 46.0, 64.0, 85.0, 132.0, 186.0, 241.0, 395.0, 535.0, 843.0, 1251.0, 2034.0, 3160.0, 5031.0, 8184.0, 13754.0, 24060.0, 43321.0, 85234.0, 173394.0, 280582.0, 194843.0, 96457.0, 48706.0, 26406.0, 15303.0, 9048.0, 5470.0, 3413.0, 2105.0, 1394.0, 895.0, 603.0, 390.0, 283.0, 185.0, 116.0, 103.0, 72.0, 41.0, 31.0, 23.0, 18.0, 12.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.55078125, -4.4111328125, -4.271484375, -4.1318359375, -3.9921875, -3.8525390625, -3.712890625, -3.5732421875, -3.43359375, -3.2939453125, -3.154296875, -3.0146484375, -2.875, -2.7353515625, -2.595703125, -2.4560546875, -2.31640625, -2.1767578125, -2.037109375, -1.8974609375, -1.7578125, -1.6181640625, -1.478515625, -1.3388671875, -1.19921875, -1.0595703125, -0.919921875, -0.7802734375, -0.640625, -0.5009765625, -0.361328125, -0.2216796875, -0.08203125, 0.0576171875, 0.197265625, 0.3369140625, 0.4765625, 0.6162109375, 0.755859375, 0.8955078125, 1.03515625, 1.1748046875, 1.314453125, 1.4541015625, 1.59375, 1.7333984375, 1.873046875, 2.0126953125, 2.15234375, 2.2919921875, 2.431640625, 2.5712890625, 2.7109375, 2.8505859375, 2.990234375, 3.1298828125, 3.26953125, 3.4091796875, 3.548828125, 3.6884765625, 3.828125, 3.9677734375, 4.107421875, 4.2470703125, 4.38671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 8.0, 5.0, 5.0, 13.0, 17.0, 24.0, 16.0, 17.0, 25.0, 30.0, 27.0, 37.0, 42.0, 43.0, 52.0, 47.0, 52.0, 52.0, 59.0, 43.0, 43.0, 43.0, 48.0, 41.0, 33.0, 34.0, 30.0, 24.0, 16.0, 18.0, 11.0, 11.0, 5.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.6025390625, -1.554962158203125, -1.50738525390625, -1.459808349609375, -1.4122314453125, -1.364654541015625, -1.31707763671875, -1.269500732421875, -1.221923828125, -1.174346923828125, -1.12677001953125, -1.079193115234375, -1.0316162109375, -0.984039306640625, -0.93646240234375, -0.888885498046875, -0.84130859375, -0.793731689453125, -0.74615478515625, -0.698577880859375, -0.6510009765625, -0.603424072265625, -0.55584716796875, -0.508270263671875, -0.460693359375, -0.413116455078125, -0.36553955078125, -0.317962646484375, -0.2703857421875, -0.222808837890625, -0.17523193359375, -0.127655029296875, -0.080078125, -0.032501220703125, 0.01507568359375, 0.062652587890625, 0.1102294921875, 0.157806396484375, 0.20538330078125, 0.252960205078125, 0.300537109375, 0.348114013671875, 0.39569091796875, 0.443267822265625, 0.4908447265625, 0.538421630859375, 0.58599853515625, 0.633575439453125, 0.68115234375, 0.728729248046875, 0.77630615234375, 0.823883056640625, 0.8714599609375, 0.919036865234375, 0.96661376953125, 1.014190673828125, 1.061767578125, 1.109344482421875, 1.15692138671875, 1.204498291015625, 1.2520751953125, 1.299652099609375, 1.34722900390625, 1.394805908203125, 1.4423828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 10.0, 15.0, 9.0, 20.0, 35.0, 48.0, 71.0, 94.0, 166.0, 235.0, 348.0, 552.0, 937.0, 1579.0, 2639.0, 4700.0, 8998.0, 17793.0, 37961.0, 91595.0, 238537.0, 356015.0, 165090.0, 63666.0, 27754.0, 13524.0, 6843.0, 3755.0, 2157.0, 1300.0, 754.0, 472.0, 289.0, 194.0, 122.0, 96.0, 63.0, 40.0, 17.0, 17.0, 12.0, 8.0, 10.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.44140625, -5.267578125, -5.09375, -4.919921875, -4.74609375, -4.572265625, -4.3984375, -4.224609375, -4.05078125, -3.876953125, -3.703125, -3.529296875, -3.35546875, -3.181640625, -3.0078125, -2.833984375, -2.66015625, -2.486328125, -2.3125, -2.138671875, -1.96484375, -1.791015625, -1.6171875, -1.443359375, -1.26953125, -1.095703125, -0.921875, -0.748046875, -0.57421875, -0.400390625, -0.2265625, -0.052734375, 0.12109375, 0.294921875, 0.46875, 0.642578125, 0.81640625, 0.990234375, 1.1640625, 1.337890625, 1.51171875, 1.685546875, 1.859375, 2.033203125, 2.20703125, 2.380859375, 2.5546875, 2.728515625, 2.90234375, 3.076171875, 3.25, 3.423828125, 3.59765625, 3.771484375, 3.9453125, 4.119140625, 4.29296875, 4.466796875, 4.640625, 4.814453125, 4.98828125, 5.162109375, 5.3359375, 5.509765625, 5.68359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 16.0, 12.0, 19.0, 23.0, 24.0, 39.0, 32.0, 33.0, 46.0, 51.0, 47.0, 55.0, 58.0, 57.0, 65.0, 53.0, 42.0, 45.0, 45.0, 43.0, 36.0, 26.0, 24.0, 23.0, 16.0, 11.0, 9.0, 10.0, 4.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5313720703125, -8.250244140625, -7.9691162109375, -7.68798828125, -7.4068603515625, -7.125732421875, -6.8446044921875, -6.5634765625, -6.2823486328125, -6.001220703125, -5.7200927734375, -5.43896484375, -5.1578369140625, -4.876708984375, -4.5955810546875, -4.314453125, -4.0333251953125, -3.752197265625, -3.4710693359375, -3.18994140625, -2.9088134765625, -2.627685546875, -2.3465576171875, -2.0654296875, -1.7843017578125, -1.503173828125, -1.2220458984375, -0.94091796875, -0.6597900390625, -0.378662109375, -0.0975341796875, 0.18359375, 0.4647216796875, 0.745849609375, 1.0269775390625, 1.30810546875, 1.5892333984375, 1.870361328125, 2.1514892578125, 2.4326171875, 2.7137451171875, 2.994873046875, 3.2760009765625, 3.55712890625, 3.8382568359375, 4.119384765625, 4.4005126953125, 4.681640625, 4.9627685546875, 5.243896484375, 5.5250244140625, 5.80615234375, 6.0872802734375, 6.368408203125, 6.6495361328125, 6.9306640625, 7.2117919921875, 7.492919921875, 7.7740478515625, 8.05517578125, 8.3363037109375, 8.617431640625, 8.8985595703125, 9.1796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 12.0, 11.0, 10.0, 24.0, 20.0, 44.0, 48.0, 86.0, 118.0, 239.0, 530.0, 1175.0, 2616.0, 7197.0, 23242.0, 91179.0, 355174.0, 410539.0, 114202.0, 28158.0, 8482.0, 2858.0, 1199.0, 614.0, 308.0, 153.0, 98.0, 57.0, 44.0, 33.0, 20.0, 14.0, 8.0, 4.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.45703125, -2.38043212890625, -2.3038330078125, -2.22723388671875, -2.150634765625, -2.07403564453125, -1.9974365234375, -1.92083740234375, -1.84423828125, -1.76763916015625, -1.6910400390625, -1.61444091796875, -1.537841796875, -1.46124267578125, -1.3846435546875, -1.30804443359375, -1.2314453125, -1.15484619140625, -1.0782470703125, -1.00164794921875, -0.925048828125, -0.84844970703125, -0.7718505859375, -0.69525146484375, -0.61865234375, -0.54205322265625, -0.4654541015625, -0.38885498046875, -0.312255859375, -0.23565673828125, -0.1590576171875, -0.08245849609375, -0.005859375, 0.07073974609375, 0.1473388671875, 0.22393798828125, 0.300537109375, 0.37713623046875, 0.4537353515625, 0.53033447265625, 0.60693359375, 0.68353271484375, 0.7601318359375, 0.83673095703125, 0.913330078125, 0.98992919921875, 1.0665283203125, 1.14312744140625, 1.2197265625, 1.29632568359375, 1.3729248046875, 1.44952392578125, 1.526123046875, 1.60272216796875, 1.6793212890625, 1.75592041015625, 1.83251953125, 1.90911865234375, 1.9857177734375, 2.06231689453125, 2.138916015625, 2.21551513671875, 2.2921142578125, 2.36871337890625, 2.4453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 15.0, 12.0, 16.0, 17.0, 19.0, 22.0, 21.0, 13.0, 28.0, 30.0, 47.0, 44.0, 61.0, 83.0, 102.0, 75.0, 75.0, 61.0, 47.0, 29.0, 24.0, 21.0, 18.0, 22.0, 13.0, 15.0, 15.0, 8.0, 8.0, 10.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0003299713134765625, -0.0003207176923751831, -0.0003114640712738037, -0.0003022104501724243, -0.0002929568290710449, -0.00028370320796966553, -0.00027444958686828613, -0.00026519596576690674, -0.00025594234466552734, -0.00024668872356414795, -0.00023743510246276855, -0.00022818148136138916, -0.00021892786026000977, -0.00020967423915863037, -0.00020042061805725098, -0.00019116699695587158, -0.0001819133758544922, -0.0001726597547531128, -0.0001634061336517334, -0.000154152512550354, -0.0001448988914489746, -0.00013564527034759521, -0.00012639164924621582, -0.00011713802814483643, -0.00010788440704345703, -9.863078594207764e-05, -8.937716484069824e-05, -8.012354373931885e-05, -7.086992263793945e-05, -6.161630153656006e-05, -5.2362680435180664e-05, -4.310905933380127e-05, -3.3855438232421875e-05, -2.460181713104248e-05, -1.5348196029663086e-05, -6.094574928283691e-06, 3.159046173095703e-06, 1.2412667274475098e-05, 2.1666288375854492e-05, 3.091990947723389e-05, 4.017353057861328e-05, 4.9427151679992676e-05, 5.868077278137207e-05, 6.793439388275146e-05, 7.718801498413086e-05, 8.644163608551025e-05, 9.569525718688965e-05, 0.00010494887828826904, 0.00011420249938964844, 0.00012345612049102783, 0.00013270974159240723, 0.00014196336269378662, 0.00015121698379516602, 0.0001604706048965454, 0.0001697242259979248, 0.0001789778470993042, 0.0001882314682006836, 0.000197485089302063, 0.00020673871040344238, 0.00021599233150482178, 0.00022524595260620117, 0.00023449957370758057, 0.00024375319480895996, 0.00025300681591033936, 0.00026226043701171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 2.0, 4.0, 6.0, 10.0, 15.0, 16.0, 16.0, 32.0, 44.0, 57.0, 71.0, 88.0, 165.0, 263.0, 431.0, 634.0, 1057.0, 2039.0, 3967.0, 8892.0, 22763.0, 68886.0, 225524.0, 430436.0, 189728.0, 57883.0, 19427.0, 7868.0, 3585.0, 1899.0, 994.0, 602.0, 378.0, 240.0, 161.0, 93.0, 72.0, 47.0, 39.0, 34.0, 20.0, 11.0, 12.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.228515625, -2.1597900390625, -2.091064453125, -2.0223388671875, -1.95361328125, -1.8848876953125, -1.816162109375, -1.7474365234375, -1.6787109375, -1.6099853515625, -1.541259765625, -1.4725341796875, -1.40380859375, -1.3350830078125, -1.266357421875, -1.1976318359375, -1.12890625, -1.0601806640625, -0.991455078125, -0.9227294921875, -0.85400390625, -0.7852783203125, -0.716552734375, -0.6478271484375, -0.5791015625, -0.5103759765625, -0.441650390625, -0.3729248046875, -0.30419921875, -0.2354736328125, -0.166748046875, -0.0980224609375, -0.029296875, 0.0394287109375, 0.108154296875, 0.1768798828125, 0.24560546875, 0.3143310546875, 0.383056640625, 0.4517822265625, 0.5205078125, 0.5892333984375, 0.657958984375, 0.7266845703125, 0.79541015625, 0.8641357421875, 0.932861328125, 1.0015869140625, 1.0703125, 1.1390380859375, 1.207763671875, 1.2764892578125, 1.34521484375, 1.4139404296875, 1.482666015625, 1.5513916015625, 1.6201171875, 1.6888427734375, 1.757568359375, 1.8262939453125, 1.89501953125, 1.9637451171875, 2.032470703125, 2.1011962890625, 2.169921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 16.0, 18.0, 19.0, 30.0, 36.0, 52.0, 58.0, 58.0, 66.0, 92.0, 76.0, 91.0, 86.0, 62.0, 60.0, 37.0, 27.0, 22.0, 21.0, 17.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.6875, -2.6175079345703125, -2.547515869140625, -2.4775238037109375, -2.40753173828125, -2.3375396728515625, -2.267547607421875, -2.1975555419921875, -2.1275634765625, -2.0575714111328125, -1.987579345703125, -1.9175872802734375, -1.84759521484375, -1.7776031494140625, -1.707611083984375, -1.6376190185546875, -1.567626953125, -1.4976348876953125, -1.427642822265625, -1.3576507568359375, -1.28765869140625, -1.2176666259765625, -1.147674560546875, -1.0776824951171875, -1.0076904296875, -0.9376983642578125, -0.867706298828125, -0.7977142333984375, -0.72772216796875, -0.6577301025390625, -0.587738037109375, -0.5177459716796875, -0.44775390625, -0.3777618408203125, -0.307769775390625, -0.2377777099609375, -0.16778564453125, -0.0977935791015625, -0.027801513671875, 0.0421905517578125, 0.1121826171875, 0.1821746826171875, 0.252166748046875, 0.3221588134765625, 0.39215087890625, 0.4621429443359375, 0.532135009765625, 0.6021270751953125, 0.672119140625, 0.7421112060546875, 0.812103271484375, 0.8820953369140625, 0.95208740234375, 1.0220794677734375, 1.092071533203125, 1.1620635986328125, 1.2320556640625, 1.3020477294921875, 1.372039794921875, 1.4420318603515625, 1.51202392578125, 1.5820159912109375, 1.652008056640625, 1.7220001220703125, 1.7919921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 12.0, 18.0, 30.0, 55.0, 108.0, 173.0, 170.0, 156.0, 111.0, 57.0, 30.0, 22.0, 17.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.653076171875, -65.89630126953125, -64.1395263671875, -62.382747650146484, -60.62596893310547, -58.86919403076172, -57.11241912841797, -55.35564422607422, -53.5988655090332, -51.84209060668945, -50.08531188964844, -48.32853698730469, -46.57176208496094, -44.81498336791992, -43.05820846557617, -41.301429748535156, -39.544654846191406, -37.787879943847656, -36.03110122680664, -34.27432632446289, -32.517547607421875, -30.760772705078125, -29.003997802734375, -27.247220993041992, -25.49044418334961, -23.733667373657227, -21.976890563964844, -20.220115661621094, -18.46333885192871, -16.706562042236328, -14.949786186218262, -13.193010330200195, -11.436233520507812, -9.67945671081543, -7.922680854797363, -6.165904521942139, -4.409128189086914, -2.6523513793945312, -0.8955755233764648, 0.8612003326416016, 2.6179771423339844, 4.374753475189209, 6.131529808044434, 7.888306140899658, 9.645082473754883, 11.401859283447266, 13.158635139465332, 14.915410995483398, 16.67218780517578, 18.428964614868164, 20.185741424560547, 21.942516326904297, 23.69929313659668, 25.456069946289062, 27.212844848632812, 28.969621658325195, 30.726398468017578, 32.48317337036133, 34.239952087402344, 35.996726989746094, 37.753501892089844, 39.51028060913086, 41.26705551147461, 43.023834228515625, 44.780609130859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 10.0, 16.0, 12.0, 15.0, 17.0, 21.0, 20.0, 33.0, 28.0, 56.0, 57.0, 45.0, 52.0, 53.0, 46.0, 56.0, 56.0, 57.0, 58.0, 38.0, 31.0, 28.0, 25.0, 25.0, 26.0, 23.0, 17.0, 13.0, 13.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.121543884277344, -53.53910446166992, -51.9566650390625, -50.37422561645508, -48.791786193847656, -47.209346771240234, -45.62690734863281, -44.044464111328125, -42.46202850341797, -40.87958908081055, -39.297149658203125, -37.7147102355957, -36.13227081298828, -34.54983139038086, -32.96739196777344, -31.384950637817383, -29.802509307861328, -28.220069885253906, -26.637630462646484, -25.055191040039062, -23.47275161743164, -21.89031219482422, -20.307870864868164, -18.725431442260742, -17.14299201965332, -15.560552597045898, -13.978113174438477, -12.395672798156738, -10.813233375549316, -9.230793952941895, -7.648353576660156, -6.065914154052734, -4.483478546142578, -2.901038885116577, -1.3185992240905762, 0.2638406753540039, 1.8462800979614258, 3.4287195205688477, 5.011159896850586, 6.593599319458008, 8.17603874206543, 9.758478164672852, 11.340917587280273, 12.923357963562012, 14.505797386169434, 16.088237762451172, 17.670677185058594, 19.253116607666016, 20.835556030273438, 22.41799545288086, 24.00043487548828, 25.582874298095703, 27.165313720703125, 28.747753143310547, 30.3301944732666, 31.912633895874023, 33.49507141113281, 35.077510833740234, 36.659950256347656, 38.24238967895508, 39.8248291015625, 41.40726852416992, 42.989707946777344, 44.57215118408203, 46.15459060668945]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 12.0, 13.0, 13.0, 31.0, 42.0, 41.0, 61.0, 69.0, 121.0, 165.0, 254.0, 406.0, 563.0, 886.0, 1368.0, 2259.0, 4223.0, 8771.0, 21825.0, 82628.0, 3073782.0, 899992.0, 61265.0, 18182.0, 7639.0, 3800.0, 2168.0, 1221.0, 776.0, 518.0, 362.0, 228.0, 178.0, 111.0, 82.0, 51.0, 46.0, 34.0, 23.0, 11.0, 13.0, 7.0, 8.0, 8.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.2578125, -7.02301025390625, -6.7882080078125, -6.55340576171875, -6.318603515625, -6.08380126953125, -5.8489990234375, -5.61419677734375, -5.37939453125, -5.14459228515625, -4.9097900390625, -4.67498779296875, -4.440185546875, -4.20538330078125, -3.9705810546875, -3.73577880859375, -3.5009765625, -3.26617431640625, -3.0313720703125, -2.79656982421875, -2.561767578125, -2.32696533203125, -2.0921630859375, -1.85736083984375, -1.62255859375, -1.38775634765625, -1.1529541015625, -0.91815185546875, -0.683349609375, -0.44854736328125, -0.2137451171875, 0.02105712890625, 0.255859375, 0.49066162109375, 0.7254638671875, 0.96026611328125, 1.195068359375, 1.42987060546875, 1.6646728515625, 1.89947509765625, 2.13427734375, 2.36907958984375, 2.6038818359375, 2.83868408203125, 3.073486328125, 3.30828857421875, 3.5430908203125, 3.77789306640625, 4.0126953125, 4.24749755859375, 4.4822998046875, 4.71710205078125, 4.951904296875, 5.18670654296875, 5.4215087890625, 5.65631103515625, 5.89111328125, 6.12591552734375, 6.3607177734375, 6.59552001953125, 6.830322265625, 7.06512451171875, 7.2999267578125, 7.53472900390625, 7.76953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 7.0, 9.0, 8.0, 13.0, 14.0, 12.0, 26.0, 24.0, 29.0, 32.0, 31.0, 41.0, 46.0, 57.0, 53.0, 49.0, 47.0, 60.0, 53.0, 49.0, 55.0, 40.0, 42.0, 28.0, 30.0, 36.0, 22.0, 18.0, 18.0, 10.0, 14.0, 9.0, 2.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69921875, -1.645843505859375, -1.59246826171875, -1.539093017578125, -1.4857177734375, -1.432342529296875, -1.37896728515625, -1.325592041015625, -1.272216796875, -1.218841552734375, -1.16546630859375, -1.112091064453125, -1.0587158203125, -1.005340576171875, -0.95196533203125, -0.898590087890625, -0.84521484375, -0.791839599609375, -0.73846435546875, -0.685089111328125, -0.6317138671875, -0.578338623046875, -0.52496337890625, -0.471588134765625, -0.418212890625, -0.364837646484375, -0.31146240234375, -0.258087158203125, -0.2047119140625, -0.151336669921875, -0.09796142578125, -0.044586181640625, 0.0087890625, 0.062164306640625, 0.11553955078125, 0.168914794921875, 0.2222900390625, 0.275665283203125, 0.32904052734375, 0.382415771484375, 0.435791015625, 0.489166259765625, 0.54254150390625, 0.595916748046875, 0.6492919921875, 0.702667236328125, 0.75604248046875, 0.809417724609375, 0.86279296875, 0.916168212890625, 0.96954345703125, 1.022918701171875, 1.0762939453125, 1.129669189453125, 1.18304443359375, 1.236419677734375, 1.289794921875, 1.343170166015625, 1.39654541015625, 1.449920654296875, 1.5032958984375, 1.556671142578125, 1.61004638671875, 1.663421630859375, 1.716796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 10.0, 17.0, 17.0, 33.0, 47.0, 46.0, 80.0, 128.0, 191.0, 305.0, 468.0, 867.0, 1766.0, 3433.0, 7912.0, 21194.0, 76986.0, 756132.0, 3097989.0, 167674.0, 35590.0, 12440.0, 5239.0, 2587.0, 1271.0, 784.0, 387.0, 261.0, 156.0, 88.0, 64.0, 39.0, 19.0, 17.0, 10.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4609375, -6.2720947265625, -6.083251953125, -5.8944091796875, -5.70556640625, -5.5167236328125, -5.327880859375, -5.1390380859375, -4.9501953125, -4.7613525390625, -4.572509765625, -4.3836669921875, -4.19482421875, -4.0059814453125, -3.817138671875, -3.6282958984375, -3.439453125, -3.2506103515625, -3.061767578125, -2.8729248046875, -2.68408203125, -2.4952392578125, -2.306396484375, -2.1175537109375, -1.9287109375, -1.7398681640625, -1.551025390625, -1.3621826171875, -1.17333984375, -0.9844970703125, -0.795654296875, -0.6068115234375, -0.41796875, -0.2291259765625, -0.040283203125, 0.1485595703125, 0.33740234375, 0.5262451171875, 0.715087890625, 0.9039306640625, 1.0927734375, 1.2816162109375, 1.470458984375, 1.6593017578125, 1.84814453125, 2.0369873046875, 2.225830078125, 2.4146728515625, 2.603515625, 2.7923583984375, 2.981201171875, 3.1700439453125, 3.35888671875, 3.5477294921875, 3.736572265625, 3.9254150390625, 4.1142578125, 4.3031005859375, 4.491943359375, 4.6807861328125, 4.86962890625, 5.0584716796875, 5.247314453125, 5.4361572265625, 5.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 8.0, 5.0, 14.0, 29.0, 41.0, 51.0, 120.0, 245.0, 789.0, 1807.0, 503.0, 178.0, 90.0, 56.0, 37.0, 23.0, 23.0, 7.0, 9.0, 9.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.20281982421875, -3.1146240234375, -3.02642822265625, -2.938232421875, -2.85003662109375, -2.7618408203125, -2.67364501953125, -2.58544921875, -2.49725341796875, -2.4090576171875, -2.32086181640625, -2.232666015625, -2.14447021484375, -2.0562744140625, -1.96807861328125, -1.8798828125, -1.79168701171875, -1.7034912109375, -1.61529541015625, -1.527099609375, -1.43890380859375, -1.3507080078125, -1.26251220703125, -1.17431640625, -1.08612060546875, -0.9979248046875, -0.90972900390625, -0.821533203125, -0.73333740234375, -0.6451416015625, -0.55694580078125, -0.46875, -0.38055419921875, -0.2923583984375, -0.20416259765625, -0.115966796875, -0.02777099609375, 0.0604248046875, 0.14862060546875, 0.23681640625, 0.32501220703125, 0.4132080078125, 0.50140380859375, 0.589599609375, 0.67779541015625, 0.7659912109375, 0.85418701171875, 0.9423828125, 1.03057861328125, 1.1187744140625, 1.20697021484375, 1.295166015625, 1.38336181640625, 1.4715576171875, 1.55975341796875, 1.64794921875, 1.73614501953125, 1.8243408203125, 1.91253662109375, 2.000732421875, 2.08892822265625, 2.1771240234375, 2.26531982421875, 2.353515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 24.0, 84.0, 253.0, 321.0, 203.0, 68.0, 21.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.121868133544922, -15.285350799560547, -14.448834419250488, -13.612317085266113, -12.775799751281738, -11.93928337097168, -11.102766036987305, -10.26624870300293, -9.429731369018555, -8.59321403503418, -7.756697177886963, -6.920180320739746, -6.083662986755371, -5.247146129608154, -4.4106292724609375, -3.5741119384765625, -2.737595558166504, -1.901078462600708, -1.0645614862442017, -0.2280445098876953, 0.6084725856781006, 1.4449896812438965, 2.2815065383911133, 3.1180238723754883, 3.954540729522705, 4.791057586669922, 5.627574920654297, 6.464091777801514, 7.3006086349487305, 8.137125968933105, 8.973642349243164, 9.810159683227539, 10.646677017211914, 11.483194351196289, 12.319710731506348, 13.156228065490723, 13.992745399475098, 14.829261779785156, 15.665779113769531, 16.502296447753906, 17.33881378173828, 18.175331115722656, 19.01184844970703, 19.848365783691406, 20.68488121032715, 21.521398544311523, 22.3579158782959, 23.194433212280273, 24.030948638916016, 24.86746597290039, 25.703983306884766, 26.54050064086914, 27.377016067504883, 28.213533401489258, 29.050050735473633, 29.886568069458008, 30.723085403442383, 31.559602737426758, 32.3961181640625, 33.232635498046875, 34.06915283203125, 34.905670166015625, 35.7421875, 36.578704833984375, 37.41522216796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 13.0, 19.0, 23.0, 22.0, 46.0, 50.0, 52.0, 65.0, 69.0, 75.0, 65.0, 66.0, 86.0, 72.0, 58.0, 44.0, 29.0, 39.0, 33.0, 21.0, 13.0, 7.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.528582572937012, -11.146173477172852, -10.763764381408691, -10.381355285644531, -9.998945236206055, -9.616536140441895, -9.234127044677734, -8.851717948913574, -8.469308853149414, -8.086899757385254, -7.704490661621094, -7.322081089019775, -6.939671993255615, -6.557262897491455, -6.174853324890137, -5.792444229125977, -5.410035133361816, -5.027626037597656, -4.645216941833496, -4.262807369232178, -3.8803982734680176, -3.4979891777038574, -3.115579843521118, -2.733170509338379, -2.3507614135742188, -1.968352198600769, -1.5859429836273193, -1.2035337686538696, -0.8211245536804199, -0.4387153387069702, -0.05630612373352051, 0.32610321044921875, 0.7085113525390625, 1.0909205675125122, 1.473329782485962, 1.8557389974594116, 2.2381482124328613, 2.6205573081970215, 3.0029666423797607, 3.3853759765625, 3.76778507232666, 4.15019416809082, 4.5326032638549805, 4.915012836456299, 5.297421932220459, 5.679831027984619, 6.0622406005859375, 6.444649696350098, 6.827058792114258, 7.209467887878418, 7.591876983642578, 7.9742865562438965, 8.356695175170898, 8.739105224609375, 9.121514320373535, 9.503923416137695, 9.886332511901855, 10.268741607666016, 10.651150703430176, 11.033559799194336, 11.415969848632812, 11.798378944396973, 12.180788040161133, 12.563197135925293, 12.945606231689453]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 15.0, 15.0, 26.0, 34.0, 39.0, 62.0, 103.0, 136.0, 174.0, 253.0, 383.0, 520.0, 770.0, 1210.0, 1862.0, 2870.0, 4521.0, 7254.0, 11629.0, 19961.0, 34812.0, 64855.0, 125659.0, 236199.0, 244297.0, 132325.0, 68286.0, 36669.0, 20682.0, 12216.0, 7357.0, 4677.0, 2922.0, 1839.0, 1214.0, 802.0, 599.0, 378.0, 279.0, 189.0, 128.0, 96.0, 69.0, 53.0, 27.0, 25.0, 19.0, 10.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.5625, -3.447723388671875, -3.33294677734375, -3.218170166015625, -3.1033935546875, -2.988616943359375, -2.87384033203125, -2.759063720703125, -2.644287109375, -2.529510498046875, -2.41473388671875, -2.299957275390625, -2.1851806640625, -2.070404052734375, -1.95562744140625, -1.840850830078125, -1.72607421875, -1.611297607421875, -1.49652099609375, -1.381744384765625, -1.2669677734375, -1.152191162109375, -1.03741455078125, -0.922637939453125, -0.807861328125, -0.693084716796875, -0.57830810546875, -0.463531494140625, -0.3487548828125, -0.233978271484375, -0.11920166015625, -0.004425048828125, 0.1103515625, 0.225128173828125, 0.33990478515625, 0.454681396484375, 0.5694580078125, 0.684234619140625, 0.79901123046875, 0.913787841796875, 1.028564453125, 1.143341064453125, 1.25811767578125, 1.372894287109375, 1.4876708984375, 1.602447509765625, 1.71722412109375, 1.832000732421875, 1.94677734375, 2.061553955078125, 2.17633056640625, 2.291107177734375, 2.4058837890625, 2.520660400390625, 2.63543701171875, 2.750213623046875, 2.864990234375, 2.979766845703125, 3.09454345703125, 3.209320068359375, 3.3240966796875, 3.438873291015625, 3.55364990234375, 3.668426513671875, 3.783203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 12.0, 18.0, 13.0, 21.0, 29.0, 28.0, 48.0, 31.0, 30.0, 45.0, 67.0, 54.0, 55.0, 62.0, 53.0, 54.0, 49.0, 57.0, 36.0, 43.0, 28.0, 29.0, 26.0, 25.0, 21.0, 9.0, 8.0, 9.0, 6.0, 7.0, 8.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.631439208984375, -1.57635498046875, -1.521270751953125, -1.4661865234375, -1.411102294921875, -1.35601806640625, -1.300933837890625, -1.245849609375, -1.190765380859375, -1.13568115234375, -1.080596923828125, -1.0255126953125, -0.970428466796875, -0.91534423828125, -0.860260009765625, -0.80517578125, -0.750091552734375, -0.69500732421875, -0.639923095703125, -0.5848388671875, -0.529754638671875, -0.47467041015625, -0.419586181640625, -0.364501953125, -0.309417724609375, -0.25433349609375, -0.199249267578125, -0.1441650390625, -0.089080810546875, -0.03399658203125, 0.021087646484375, 0.076171875, 0.131256103515625, 0.18634033203125, 0.241424560546875, 0.2965087890625, 0.351593017578125, 0.40667724609375, 0.461761474609375, 0.516845703125, 0.571929931640625, 0.62701416015625, 0.682098388671875, 0.7371826171875, 0.792266845703125, 0.84735107421875, 0.902435302734375, 0.95751953125, 1.012603759765625, 1.06768798828125, 1.122772216796875, 1.1778564453125, 1.232940673828125, 1.28802490234375, 1.343109130859375, 1.398193359375, 1.453277587890625, 1.50836181640625, 1.563446044921875, 1.6185302734375, 1.673614501953125, 1.72869873046875, 1.783782958984375, 1.8388671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 5.0, 15.0, 14.0, 19.0, 29.0, 46.0, 66.0, 94.0, 158.0, 306.0, 504.0, 946.0, 1788.0, 3627.0, 7661.0, 17581.0, 43142.0, 118003.0, 346154.0, 327092.0, 108940.0, 40900.0, 16771.0, 7340.0, 3493.0, 1654.0, 904.0, 501.0, 292.0, 160.0, 107.0, 66.0, 52.0, 29.0, 25.0, 16.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.49609375, -5.318603515625, -5.14111328125, -4.963623046875, -4.7861328125, -4.608642578125, -4.43115234375, -4.253662109375, -4.076171875, -3.898681640625, -3.72119140625, -3.543701171875, -3.3662109375, -3.188720703125, -3.01123046875, -2.833740234375, -2.65625, -2.478759765625, -2.30126953125, -2.123779296875, -1.9462890625, -1.768798828125, -1.59130859375, -1.413818359375, -1.236328125, -1.058837890625, -0.88134765625, -0.703857421875, -0.5263671875, -0.348876953125, -0.17138671875, 0.006103515625, 0.18359375, 0.361083984375, 0.53857421875, 0.716064453125, 0.8935546875, 1.071044921875, 1.24853515625, 1.426025390625, 1.603515625, 1.781005859375, 1.95849609375, 2.135986328125, 2.3134765625, 2.490966796875, 2.66845703125, 2.845947265625, 3.0234375, 3.200927734375, 3.37841796875, 3.555908203125, 3.7333984375, 3.910888671875, 4.08837890625, 4.265869140625, 4.443359375, 4.620849609375, 4.79833984375, 4.975830078125, 5.1533203125, 5.330810546875, 5.50830078125, 5.685791015625, 5.86328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 2.0, 11.0, 9.0, 20.0, 11.0, 14.0, 16.0, 24.0, 21.0, 26.0, 26.0, 37.0, 42.0, 34.0, 39.0, 40.0, 42.0, 30.0, 45.0, 36.0, 41.0, 40.0, 30.0, 29.0, 36.0, 35.0, 28.0, 22.0, 31.0, 28.0, 25.0, 19.0, 22.0, 12.0, 13.0, 7.0, 14.0, 8.0, 6.0, 3.0, 12.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.62890625, -6.4327392578125, -6.236572265625, -6.0404052734375, -5.84423828125, -5.6480712890625, -5.451904296875, -5.2557373046875, -5.0595703125, -4.8634033203125, -4.667236328125, -4.4710693359375, -4.27490234375, -4.0787353515625, -3.882568359375, -3.6864013671875, -3.490234375, -3.2940673828125, -3.097900390625, -2.9017333984375, -2.70556640625, -2.5093994140625, -2.313232421875, -2.1170654296875, -1.9208984375, -1.7247314453125, -1.528564453125, -1.3323974609375, -1.13623046875, -0.9400634765625, -0.743896484375, -0.5477294921875, -0.3515625, -0.1553955078125, 0.040771484375, 0.2369384765625, 0.43310546875, 0.6292724609375, 0.825439453125, 1.0216064453125, 1.2177734375, 1.4139404296875, 1.610107421875, 1.8062744140625, 2.00244140625, 2.1986083984375, 2.394775390625, 2.5909423828125, 2.787109375, 2.9832763671875, 3.179443359375, 3.3756103515625, 3.57177734375, 3.7679443359375, 3.964111328125, 4.1602783203125, 4.3564453125, 4.5526123046875, 4.748779296875, 4.9449462890625, 5.14111328125, 5.3372802734375, 5.533447265625, 5.7296142578125, 5.92578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 9.0, 6.0, 9.0, 17.0, 18.0, 21.0, 27.0, 54.0, 62.0, 117.0, 190.0, 395.0, 838.0, 2304.0, 7920.0, 79450.0, 869947.0, 75514.0, 7669.0, 2287.0, 801.0, 390.0, 168.0, 95.0, 71.0, 46.0, 33.0, 21.0, 18.0, 10.0, 8.0, 11.0, 8.0, 9.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.42034912109375, -4.2469482421875, -4.07354736328125, -3.900146484375, -3.72674560546875, -3.5533447265625, -3.37994384765625, -3.20654296875, -3.03314208984375, -2.8597412109375, -2.68634033203125, -2.512939453125, -2.33953857421875, -2.1661376953125, -1.99273681640625, -1.8193359375, -1.64593505859375, -1.4725341796875, -1.29913330078125, -1.125732421875, -0.95233154296875, -0.7789306640625, -0.60552978515625, -0.43212890625, -0.25872802734375, -0.0853271484375, 0.08807373046875, 0.261474609375, 0.43487548828125, 0.6082763671875, 0.78167724609375, 0.955078125, 1.12847900390625, 1.3018798828125, 1.47528076171875, 1.648681640625, 1.82208251953125, 1.9954833984375, 2.16888427734375, 2.34228515625, 2.51568603515625, 2.6890869140625, 2.86248779296875, 3.035888671875, 3.20928955078125, 3.3826904296875, 3.55609130859375, 3.7294921875, 3.90289306640625, 4.0762939453125, 4.24969482421875, 4.423095703125, 4.59649658203125, 4.7698974609375, 4.94329833984375, 5.11669921875, 5.29010009765625, 5.4635009765625, 5.63690185546875, 5.810302734375, 5.98370361328125, 6.1571044921875, 6.33050537109375, 6.50390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 10.0, 18.0, 14.0, 32.0, 22.0, 36.0, 31.0, 62.0, 63.0, 78.0, 104.0, 101.0, 93.0, 81.0, 42.0, 43.0, 21.0, 27.0, 11.0, 15.0, 14.0, 14.0, 6.0, 8.0, 5.0, 1.0, 11.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003681182861328125, -0.00035691261291503906, -0.0003457069396972656, -0.0003345012664794922, -0.00032329559326171875, -0.0003120899200439453, -0.0003008842468261719, -0.00028967857360839844, -0.000278472900390625, -0.00026726722717285156, -0.0002560615539550781, -0.0002448558807373047, -0.00023365020751953125, -0.0002224445343017578, -0.00021123886108398438, -0.00020003318786621094, -0.0001888275146484375, -0.00017762184143066406, -0.00016641616821289062, -0.0001552104949951172, -0.00014400482177734375, -0.0001327991485595703, -0.00012159347534179688, -0.00011038780212402344, -9.918212890625e-05, -8.797645568847656e-05, -7.677078247070312e-05, -6.556510925292969e-05, -5.435943603515625e-05, -4.315376281738281e-05, -3.1948089599609375e-05, -2.0742416381835938e-05, -9.5367431640625e-06, 1.6689300537109375e-06, 1.2874603271484375e-05, 2.4080276489257812e-05, 3.528594970703125e-05, 4.649162292480469e-05, 5.7697296142578125e-05, 6.890296936035156e-05, 8.0108642578125e-05, 9.131431579589844e-05, 0.00010251998901367188, 0.00011372566223144531, 0.00012493133544921875, 0.0001361370086669922, 0.00014734268188476562, 0.00015854835510253906, 0.0001697540283203125, 0.00018095970153808594, 0.00019216537475585938, 0.0002033710479736328, 0.00021457672119140625, 0.0002257823944091797, 0.00023698806762695312, 0.00024819374084472656, 0.0002593994140625, 0.00027060508728027344, 0.0002818107604980469, 0.0002930164337158203, 0.00030422210693359375, 0.0003154277801513672, 0.0003266334533691406, 0.00033783912658691406, 0.0003490447998046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 5.0, 10.0, 13.0, 15.0, 26.0, 34.0, 44.0, 58.0, 95.0, 159.0, 236.0, 478.0, 824.0, 1537.0, 3531.0, 10377.0, 101099.0, 876871.0, 40134.0, 7275.0, 2749.0, 1259.0, 672.0, 375.0, 239.0, 140.0, 99.0, 57.0, 48.0, 28.0, 14.0, 12.0, 11.0, 5.0, 6.0, 2.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.30926513671875, -7.0833740234375, -6.85748291015625, -6.631591796875, -6.40570068359375, -6.1798095703125, -5.95391845703125, -5.72802734375, -5.50213623046875, -5.2762451171875, -5.05035400390625, -4.824462890625, -4.59857177734375, -4.3726806640625, -4.14678955078125, -3.9208984375, -3.69500732421875, -3.4691162109375, -3.24322509765625, -3.017333984375, -2.79144287109375, -2.5655517578125, -2.33966064453125, -2.11376953125, -1.88787841796875, -1.6619873046875, -1.43609619140625, -1.210205078125, -0.98431396484375, -0.7584228515625, -0.53253173828125, -0.306640625, -0.08074951171875, 0.1451416015625, 0.37103271484375, 0.596923828125, 0.82281494140625, 1.0487060546875, 1.27459716796875, 1.50048828125, 1.72637939453125, 1.9522705078125, 2.17816162109375, 2.404052734375, 2.62994384765625, 2.8558349609375, 3.08172607421875, 3.3076171875, 3.53350830078125, 3.7593994140625, 3.98529052734375, 4.211181640625, 4.43707275390625, 4.6629638671875, 4.88885498046875, 5.11474609375, 5.34063720703125, 5.5665283203125, 5.79241943359375, 6.018310546875, 6.24420166015625, 6.4700927734375, 6.69598388671875, 6.921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 12.0, 13.0, 10.0, 21.0, 68.0, 182.0, 305.0, 208.0, 82.0, 35.0, 18.0, 10.0, 4.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.44317626953125, -8.1988525390625, -7.95452880859375, -7.710205078125, -7.46588134765625, -7.2215576171875, -6.97723388671875, -6.73291015625, -6.48858642578125, -6.2442626953125, -5.99993896484375, -5.755615234375, -5.51129150390625, -5.2669677734375, -5.02264404296875, -4.7783203125, -4.53399658203125, -4.2896728515625, -4.04534912109375, -3.801025390625, -3.55670166015625, -3.3123779296875, -3.06805419921875, -2.82373046875, -2.57940673828125, -2.3350830078125, -2.09075927734375, -1.846435546875, -1.60211181640625, -1.3577880859375, -1.11346435546875, -0.869140625, -0.62481689453125, -0.3804931640625, -0.13616943359375, 0.108154296875, 0.35247802734375, 0.5968017578125, 0.84112548828125, 1.08544921875, 1.32977294921875, 1.5740966796875, 1.81842041015625, 2.062744140625, 2.30706787109375, 2.5513916015625, 2.79571533203125, 3.0400390625, 3.28436279296875, 3.5286865234375, 3.77301025390625, 4.017333984375, 4.26165771484375, 4.5059814453125, 4.75030517578125, 4.99462890625, 5.23895263671875, 5.4832763671875, 5.72760009765625, 5.971923828125, 6.21624755859375, 6.4605712890625, 6.70489501953125, 6.94921875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 8.0, 16.0, 36.0, 98.0, 252.0, 365.0, 150.0, 44.0, 21.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.34872436523438, -88.9442367553711, -85.53974914550781, -82.13526153564453, -78.73077392578125, -75.32628631591797, -71.92179870605469, -68.51731872558594, -65.11282348632812, -61.708335876464844, -58.30384826660156, -54.89936065673828, -51.494873046875, -48.09038543701172, -44.6859016418457, -41.28141403198242, -37.876930236816406, -34.472442626953125, -31.067955017089844, -27.663469314575195, -24.258981704711914, -20.854494094848633, -17.450008392333984, -14.045520782470703, -10.641033172607422, -7.236546039581299, -3.832058906555176, -0.42757225036621094, 2.9769153594970703, 6.381402969360352, 9.785888671875, 13.190376281738281, 16.594863891601562, 19.999351501464844, 23.403839111328125, 26.808324813842773, 30.212812423706055, 33.61730194091797, 37.021785736083984, 40.426273345947266, 43.83076095581055, 47.23524856567383, 50.63973617553711, 54.044219970703125, 57.448707580566406, 60.85319519042969, 64.25768280029297, 67.66217041015625, 71.06665802001953, 74.47114562988281, 77.8756332397461, 81.28012084960938, 84.68460845947266, 88.08909606933594, 91.49357604980469, 94.8980712890625, 98.30255126953125, 101.70703887939453, 105.11152648925781, 108.5160140991211, 111.92050170898438, 115.32498931884766, 118.72947692871094, 122.13395690917969, 125.5384521484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 8.0, 15.0, 13.0, 19.0, 14.0, 18.0, 20.0, 27.0, 30.0, 21.0, 30.0, 35.0, 50.0, 50.0, 48.0, 54.0, 40.0, 49.0, 45.0, 51.0, 39.0, 36.0, 28.0, 32.0, 35.0, 28.0, 25.0, 23.0, 22.0, 21.0, 11.0, 10.0, 9.0, 7.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71440887451172, -36.37226867675781, -35.03012466430664, -33.687984466552734, -32.34584045410156, -31.003700256347656, -29.661558151245117, -28.319416046142578, -26.977275848388672, -25.635133743286133, -24.292991638183594, -22.950851440429688, -21.60870933532715, -20.26656723022461, -18.92442512512207, -17.58228302001953, -16.240140914916992, -14.897998809814453, -13.55585765838623, -12.213715553283691, -10.871574401855469, -9.52943229675293, -8.18729019165039, -6.845149040222168, -5.503006935119629, -4.160865306854248, -2.818723440170288, -1.4765815734863281, -0.13443994522094727, 1.2077016830444336, 2.5498437881469727, 3.8919849395751953, 5.234127044677734, 6.576268672943115, 7.918410301208496, 9.260552406311035, 10.602693557739258, 11.944835662841797, 13.286977767944336, 14.629118919372559, 15.971261024475098, 17.31340217590332, 18.65554428100586, 19.9976863861084, 21.339828491210938, 22.681968688964844, 24.024112701416016, 25.366252899169922, 26.70839500427246, 28.050537109375, 29.39267921447754, 30.734821319580078, 32.076961517333984, 33.419105529785156, 34.76124572753906, 36.10338592529297, 37.44552993774414, 38.78767013549805, 40.12981414794922, 41.471954345703125, 42.8140983581543, 44.1562385559082, 45.498382568359375, 46.84052276611328, 48.18266296386719]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 22.0, 14.0, 26.0, 32.0, 46.0, 95.0, 112.0, 181.0, 256.0, 418.0, 651.0, 1153.0, 2056.0, 3689.0, 7947.0, 19873.0, 68689.0, 572536.0, 3305624.0, 152413.0, 33816.0, 12235.0, 5441.0, 2797.0, 1532.0, 944.0, 551.0, 357.0, 228.0, 144.0, 101.0, 85.0, 65.0, 25.0, 27.0, 20.0, 23.0, 10.0, 7.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.4932861328125, -5.275634765625, -5.0579833984375, -4.84033203125, -4.6226806640625, -4.405029296875, -4.1873779296875, -3.9697265625, -3.7520751953125, -3.534423828125, -3.3167724609375, -3.09912109375, -2.8814697265625, -2.663818359375, -2.4461669921875, -2.228515625, -2.0108642578125, -1.793212890625, -1.5755615234375, -1.35791015625, -1.1402587890625, -0.922607421875, -0.7049560546875, -0.4873046875, -0.2696533203125, -0.052001953125, 0.1656494140625, 0.38330078125, 0.6009521484375, 0.818603515625, 1.0362548828125, 1.25390625, 1.4715576171875, 1.689208984375, 1.9068603515625, 2.12451171875, 2.3421630859375, 2.559814453125, 2.7774658203125, 2.9951171875, 3.2127685546875, 3.430419921875, 3.6480712890625, 3.86572265625, 4.0833740234375, 4.301025390625, 4.5186767578125, 4.736328125, 4.9539794921875, 5.171630859375, 5.3892822265625, 5.60693359375, 5.8245849609375, 6.042236328125, 6.2598876953125, 6.4775390625, 6.6951904296875, 6.912841796875, 7.1304931640625, 7.34814453125, 7.5657958984375, 7.783447265625, 8.0010986328125, 8.21875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 3.0, 11.0, 17.0, 10.0, 22.0, 25.0, 27.0, 26.0, 35.0, 29.0, 46.0, 57.0, 49.0, 64.0, 54.0, 64.0, 58.0, 46.0, 43.0, 43.0, 50.0, 35.0, 35.0, 26.0, 28.0, 14.0, 28.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541015625, -1.484588623046875, -1.42816162109375, -1.371734619140625, -1.3153076171875, -1.258880615234375, -1.20245361328125, -1.146026611328125, -1.089599609375, -1.033172607421875, -0.97674560546875, -0.920318603515625, -0.8638916015625, -0.807464599609375, -0.75103759765625, -0.694610595703125, -0.63818359375, -0.581756591796875, -0.52532958984375, -0.468902587890625, -0.4124755859375, -0.356048583984375, -0.29962158203125, -0.243194580078125, -0.186767578125, -0.130340576171875, -0.07391357421875, -0.017486572265625, 0.0389404296875, 0.095367431640625, 0.15179443359375, 0.208221435546875, 0.2646484375, 0.321075439453125, 0.37750244140625, 0.433929443359375, 0.4903564453125, 0.546783447265625, 0.60321044921875, 0.659637451171875, 0.716064453125, 0.772491455078125, 0.82891845703125, 0.885345458984375, 0.9417724609375, 0.998199462890625, 1.05462646484375, 1.111053466796875, 1.16748046875, 1.223907470703125, 1.28033447265625, 1.336761474609375, 1.3931884765625, 1.449615478515625, 1.50604248046875, 1.562469482421875, 1.618896484375, 1.675323486328125, 1.73175048828125, 1.788177490234375, 1.8446044921875, 1.901031494140625, 1.95745849609375, 2.013885498046875, 2.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 5.0, 7.0, 13.0, 12.0, 10.0, 28.0, 32.0, 62.0, 76.0, 109.0, 224.0, 378.0, 881.0, 2254.0, 6766.0, 40505.0, 1353296.0, 2721411.0, 55410.0, 8476.0, 2443.0, 927.0, 419.0, 217.0, 149.0, 59.0, 39.0, 21.0, 19.0, 11.0, 10.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.159423828125, -7.85791015625, -7.556396484375, -7.2548828125, -6.953369140625, -6.65185546875, -6.350341796875, -6.048828125, -5.747314453125, -5.44580078125, -5.144287109375, -4.8427734375, -4.541259765625, -4.23974609375, -3.938232421875, -3.63671875, -3.335205078125, -3.03369140625, -2.732177734375, -2.4306640625, -2.129150390625, -1.82763671875, -1.526123046875, -1.224609375, -0.923095703125, -0.62158203125, -0.320068359375, -0.0185546875, 0.282958984375, 0.58447265625, 0.885986328125, 1.1875, 1.489013671875, 1.79052734375, 2.092041015625, 2.3935546875, 2.695068359375, 2.99658203125, 3.298095703125, 3.599609375, 3.901123046875, 4.20263671875, 4.504150390625, 4.8056640625, 5.107177734375, 5.40869140625, 5.710205078125, 6.01171875, 6.313232421875, 6.61474609375, 6.916259765625, 7.2177734375, 7.519287109375, 7.82080078125, 8.122314453125, 8.423828125, 8.725341796875, 9.02685546875, 9.328369140625, 9.6298828125, 9.931396484375, 10.23291015625, 10.534423828125, 10.8359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 23.0, 42.0, 93.0, 174.0, 500.0, 1818.0, 874.0, 253.0, 111.0, 57.0, 38.0, 31.0, 14.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.375, -6.225677490234375, -6.07635498046875, -5.927032470703125, -5.7777099609375, -5.628387451171875, -5.47906494140625, -5.329742431640625, -5.180419921875, -5.031097412109375, -4.88177490234375, -4.732452392578125, -4.5831298828125, -4.433807373046875, -4.28448486328125, -4.135162353515625, -3.98583984375, -3.836517333984375, -3.68719482421875, -3.537872314453125, -3.3885498046875, -3.239227294921875, -3.08990478515625, -2.940582275390625, -2.791259765625, -2.641937255859375, -2.49261474609375, -2.343292236328125, -2.1939697265625, -2.044647216796875, -1.89532470703125, -1.746002197265625, -1.5966796875, -1.447357177734375, -1.29803466796875, -1.148712158203125, -0.9993896484375, -0.850067138671875, -0.70074462890625, -0.551422119140625, -0.402099609375, -0.252777099609375, -0.10345458984375, 0.045867919921875, 0.1951904296875, 0.344512939453125, 0.49383544921875, 0.643157958984375, 0.79248046875, 0.941802978515625, 1.09112548828125, 1.240447998046875, 1.3897705078125, 1.539093017578125, 1.68841552734375, 1.837738037109375, 1.987060546875, 2.136383056640625, 2.28570556640625, 2.435028076171875, 2.5843505859375, 2.733673095703125, 2.88299560546875, 3.032318115234375, 3.181640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 11.0, 24.0, 19.0, 48.0, 72.0, 119.0, 160.0, 177.0, 150.0, 93.0, 62.0, 28.0, 10.0, 13.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.470561981201172, -10.867326736450195, -10.264092445373535, -9.660857200622559, -9.057621955871582, -8.454387664794922, -7.851152420043945, -7.247917175292969, -6.64468240737915, -6.041447639465332, -5.4382123947143555, -4.834977626800537, -4.231742858886719, -3.628507614135742, -3.025272846221924, -2.4220376014709473, -1.818802833557129, -1.2155678272247314, -0.6123329401016235, -0.009098052978515625, 0.5941369533538818, 1.1973719596862793, 1.8006067276000977, 2.403841972351074, 3.0070767402648926, 3.61031174659729, 4.2135467529296875, 4.816781520843506, 5.420016288757324, 6.023251533508301, 6.626486301422119, 7.229721546173096, 7.832956314086914, 8.43619155883789, 9.03942584991455, 9.642661094665527, 10.245896339416504, 10.849130630493164, 11.45236587524414, 12.055601119995117, 12.658836364746094, 13.26207160949707, 13.86530590057373, 14.468541145324707, 15.071776390075684, 15.675010681152344, 16.27824592590332, 16.881481170654297, 17.48471450805664, 18.087949752807617, 18.691184997558594, 19.294418334960938, 19.897653579711914, 20.50088882446289, 21.104124069213867, 21.707359313964844, 22.31059455871582, 22.913829803466797, 23.517065048217773, 24.12030029296875, 24.723533630371094, 25.32676887512207, 25.930004119873047, 26.533239364624023, 27.136474609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 7.0, 12.0, 11.0, 13.0, 18.0, 26.0, 27.0, 22.0, 53.0, 50.0, 44.0, 54.0, 59.0, 65.0, 57.0, 61.0, 59.0, 68.0, 44.0, 42.0, 31.0, 42.0, 27.0, 20.0, 23.0, 18.0, 9.0, 4.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.177499771118164, -10.747265815734863, -10.317030906677246, -9.886796951293945, -9.456562042236328, -9.026328086853027, -8.59609317779541, -8.16585922241211, -7.735624313354492, -7.305389881134033, -6.875155448913574, -6.444921016693115, -6.014686584472656, -5.5844526290893555, -5.154217720031738, -4.7239837646484375, -4.2937493324279785, -3.8635149002075195, -3.4332804679870605, -3.0030460357666016, -2.5728116035461426, -2.1425774097442627, -1.7123429775238037, -1.2821085453033447, -0.8518741130828857, -0.42163971066474915, 0.008594691753387451, 0.43882906436920166, 0.8690634965896606, 1.29929780960083, 1.729532241821289, 2.159766674041748, 2.590001106262207, 3.020235538482666, 3.450469970703125, 3.880704402923584, 4.310938835144043, 4.741172790527344, 5.171407699584961, 5.601641654968262, 6.031876564025879, 6.462110996246338, 6.892345428466797, 7.322579860687256, 7.752814292907715, 8.183048248291016, 8.613283157348633, 9.043517112731934, 9.473751068115234, 9.903985023498535, 10.334219932556152, 10.764453887939453, 11.19468879699707, 11.624922752380371, 12.055157661437988, 12.485391616821289, 12.915626525878906, 13.345860481262207, 13.776095390319824, 14.206329345703125, 14.636564254760742, 15.066798210144043, 15.49703311920166, 15.927267074584961, 16.357501983642578]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 12.0, 11.0, 16.0, 16.0, 40.0, 38.0, 62.0, 102.0, 156.0, 238.0, 326.0, 575.0, 989.0, 1607.0, 2892.0, 5386.0, 10685.0, 22433.0, 52225.0, 137431.0, 365907.0, 274086.0, 98162.0, 38924.0, 17389.0, 8430.0, 4407.0, 2398.0, 1400.0, 757.0, 525.0, 323.0, 211.0, 137.0, 82.0, 56.0, 33.0, 27.0, 14.0, 11.0, 9.0, 8.0, 3.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.73736572265625, -5.5450439453125, -5.35272216796875, -5.160400390625, -4.96807861328125, -4.7757568359375, -4.58343505859375, -4.39111328125, -4.19879150390625, -4.0064697265625, -3.81414794921875, -3.621826171875, -3.42950439453125, -3.2371826171875, -3.04486083984375, -2.8525390625, -2.66021728515625, -2.4678955078125, -2.27557373046875, -2.083251953125, -1.89093017578125, -1.6986083984375, -1.50628662109375, -1.31396484375, -1.12164306640625, -0.9293212890625, -0.73699951171875, -0.544677734375, -0.35235595703125, -0.1600341796875, 0.03228759765625, 0.224609375, 0.41693115234375, 0.6092529296875, 0.80157470703125, 0.993896484375, 1.18621826171875, 1.3785400390625, 1.57086181640625, 1.76318359375, 1.95550537109375, 2.1478271484375, 2.34014892578125, 2.532470703125, 2.72479248046875, 2.9171142578125, 3.10943603515625, 3.3017578125, 3.49407958984375, 3.6864013671875, 3.87872314453125, 4.071044921875, 4.26336669921875, 4.4556884765625, 4.64801025390625, 4.84033203125, 5.03265380859375, 5.2249755859375, 5.41729736328125, 5.609619140625, 5.80194091796875, 5.9942626953125, 6.18658447265625, 6.37890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 5.0, 5.0, 10.0, 17.0, 16.0, 13.0, 30.0, 24.0, 32.0, 32.0, 34.0, 49.0, 59.0, 60.0, 70.0, 69.0, 51.0, 53.0, 42.0, 42.0, 39.0, 47.0, 37.0, 25.0, 32.0, 20.0, 13.0, 18.0, 12.0, 6.0, 10.0, 5.0, 2.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6630859375, -1.6072998046875, -1.551513671875, -1.4957275390625, -1.43994140625, -1.3841552734375, -1.328369140625, -1.2725830078125, -1.216796875, -1.1610107421875, -1.105224609375, -1.0494384765625, -0.99365234375, -0.9378662109375, -0.882080078125, -0.8262939453125, -0.7705078125, -0.7147216796875, -0.658935546875, -0.6031494140625, -0.54736328125, -0.4915771484375, -0.435791015625, -0.3800048828125, -0.32421875, -0.2684326171875, -0.212646484375, -0.1568603515625, -0.10107421875, -0.0452880859375, 0.010498046875, 0.0662841796875, 0.1220703125, 0.1778564453125, 0.233642578125, 0.2894287109375, 0.34521484375, 0.4010009765625, 0.456787109375, 0.5125732421875, 0.568359375, 0.6241455078125, 0.679931640625, 0.7357177734375, 0.79150390625, 0.8472900390625, 0.903076171875, 0.9588623046875, 1.0146484375, 1.0704345703125, 1.126220703125, 1.1820068359375, 1.23779296875, 1.2935791015625, 1.349365234375, 1.4051513671875, 1.4609375, 1.5167236328125, 1.572509765625, 1.6282958984375, 1.68408203125, 1.7398681640625, 1.795654296875, 1.8514404296875, 1.9072265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 7.0, 14.0, 24.0, 33.0, 48.0, 55.0, 85.0, 150.0, 184.0, 271.0, 463.0, 724.0, 1197.0, 2080.0, 3784.0, 6854.0, 13964.0, 29140.0, 66386.0, 174161.0, 378924.0, 218757.0, 81974.0, 34673.0, 16363.0, 8019.0, 4184.0, 2388.0, 1350.0, 816.0, 467.0, 344.0, 214.0, 154.0, 83.0, 74.0, 43.0, 25.0, 25.0, 9.0, 11.0, 9.0, 9.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.75390625, -4.608154296875, -4.46240234375, -4.316650390625, -4.1708984375, -4.025146484375, -3.87939453125, -3.733642578125, -3.587890625, -3.442138671875, -3.29638671875, -3.150634765625, -3.0048828125, -2.859130859375, -2.71337890625, -2.567626953125, -2.421875, -2.276123046875, -2.13037109375, -1.984619140625, -1.8388671875, -1.693115234375, -1.54736328125, -1.401611328125, -1.255859375, -1.110107421875, -0.96435546875, -0.818603515625, -0.6728515625, -0.527099609375, -0.38134765625, -0.235595703125, -0.08984375, 0.055908203125, 0.20166015625, 0.347412109375, 0.4931640625, 0.638916015625, 0.78466796875, 0.930419921875, 1.076171875, 1.221923828125, 1.36767578125, 1.513427734375, 1.6591796875, 1.804931640625, 1.95068359375, 2.096435546875, 2.2421875, 2.387939453125, 2.53369140625, 2.679443359375, 2.8251953125, 2.970947265625, 3.11669921875, 3.262451171875, 3.408203125, 3.553955078125, 3.69970703125, 3.845458984375, 3.9912109375, 4.136962890625, 4.28271484375, 4.428466796875, 4.57421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 6.0, 5.0, 12.0, 20.0, 17.0, 21.0, 30.0, 33.0, 44.0, 38.0, 43.0, 57.0, 52.0, 62.0, 50.0, 51.0, 44.0, 61.0, 44.0, 49.0, 49.0, 40.0, 27.0, 27.0, 26.0, 19.0, 17.0, 9.0, 12.0, 10.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.74658203125, -7.4853515625, -7.22412109375, -6.962890625, -6.70166015625, -6.4404296875, -6.17919921875, -5.91796875, -5.65673828125, -5.3955078125, -5.13427734375, -4.873046875, -4.61181640625, -4.3505859375, -4.08935546875, -3.828125, -3.56689453125, -3.3056640625, -3.04443359375, -2.783203125, -2.52197265625, -2.2607421875, -1.99951171875, -1.73828125, -1.47705078125, -1.2158203125, -0.95458984375, -0.693359375, -0.43212890625, -0.1708984375, 0.09033203125, 0.3515625, 0.61279296875, 0.8740234375, 1.13525390625, 1.396484375, 1.65771484375, 1.9189453125, 2.18017578125, 2.44140625, 2.70263671875, 2.9638671875, 3.22509765625, 3.486328125, 3.74755859375, 4.0087890625, 4.27001953125, 4.53125, 4.79248046875, 5.0537109375, 5.31494140625, 5.576171875, 5.83740234375, 6.0986328125, 6.35986328125, 6.62109375, 6.88232421875, 7.1435546875, 7.40478515625, 7.666015625, 7.92724609375, 8.1884765625, 8.44970703125, 8.7109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 8.0, 5.0, 9.0, 10.0, 11.0, 13.0, 18.0, 27.0, 47.0, 57.0, 101.0, 194.0, 360.0, 821.0, 2004.0, 8010.0, 62755.0, 762294.0, 190562.0, 15815.0, 3214.0, 1102.0, 483.0, 259.0, 131.0, 79.0, 44.0, 33.0, 20.0, 15.0, 7.0, 13.0, 4.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.4453125, -4.3050537109375, -4.164794921875, -4.0245361328125, -3.88427734375, -3.7440185546875, -3.603759765625, -3.4635009765625, -3.3232421875, -3.1829833984375, -3.042724609375, -2.9024658203125, -2.76220703125, -2.6219482421875, -2.481689453125, -2.3414306640625, -2.201171875, -2.0609130859375, -1.920654296875, -1.7803955078125, -1.64013671875, -1.4998779296875, -1.359619140625, -1.2193603515625, -1.0791015625, -0.9388427734375, -0.798583984375, -0.6583251953125, -0.51806640625, -0.3778076171875, -0.237548828125, -0.0972900390625, 0.04296875, 0.1832275390625, 0.323486328125, 0.4637451171875, 0.60400390625, 0.7442626953125, 0.884521484375, 1.0247802734375, 1.1650390625, 1.3052978515625, 1.445556640625, 1.5858154296875, 1.72607421875, 1.8663330078125, 2.006591796875, 2.1468505859375, 2.287109375, 2.4273681640625, 2.567626953125, 2.7078857421875, 2.84814453125, 2.9884033203125, 3.128662109375, 3.2689208984375, 3.4091796875, 3.5494384765625, 3.689697265625, 3.8299560546875, 3.97021484375, 4.1104736328125, 4.250732421875, 4.3909912109375, 4.53125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 12.0, 18.0, 28.0, 32.0, 69.0, 88.0, 171.0, 214.0, 134.0, 77.0, 48.0, 25.0, 16.0, 14.0, 8.0, 11.0, 7.0, 1.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034046173095703125, -0.0003227442502975464, -0.0003050267696380615, -0.00028730928897857666, -0.0002695918083190918, -0.00025187432765960693, -0.00023415684700012207, -0.0002164393663406372, -0.00019872188568115234, -0.00018100440502166748, -0.00016328692436218262, -0.00014556944370269775, -0.0001278519630432129, -0.00011013448238372803, -9.241700172424316e-05, -7.46995210647583e-05, -5.698204040527344e-05, -3.9264559745788574e-05, -2.154707908630371e-05, -3.829598426818848e-06, 1.3887882232666016e-05, 3.160536289215088e-05, 4.932284355163574e-05, 6.70403242111206e-05, 8.475780487060547e-05, 0.00010247528553009033, 0.0001201927661895752, 0.00013791024684906006, 0.00015562772750854492, 0.00017334520816802979, 0.00019106268882751465, 0.0002087801694869995, 0.00022649765014648438, 0.00024421513080596924, 0.0002619326114654541, 0.00027965009212493896, 0.00029736757278442383, 0.0003150850534439087, 0.00033280253410339355, 0.0003505200147628784, 0.0003682374954223633, 0.00038595497608184814, 0.000403672456741333, 0.00042138993740081787, 0.00043910741806030273, 0.0004568248987197876, 0.00047454237937927246, 0.0004922598600387573, 0.0005099773406982422, 0.000527694821357727, 0.0005454123020172119, 0.0005631297826766968, 0.0005808472633361816, 0.0005985647439956665, 0.0006162822246551514, 0.0006339997053146362, 0.0006517171859741211, 0.000669434666633606, 0.0006871521472930908, 0.0007048696279525757, 0.0007225871086120605, 0.0007403045892715454, 0.0007580220699310303, 0.0007757395505905151, 0.00079345703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 10.0, 9.0, 14.0, 20.0, 27.0, 53.0, 69.0, 87.0, 147.0, 250.0, 429.0, 741.0, 1219.0, 2728.0, 7452.0, 32689.0, 440364.0, 511730.0, 37031.0, 7592.0, 2786.0, 1322.0, 689.0, 367.0, 273.0, 157.0, 84.0, 51.0, 51.0, 27.0, 13.0, 22.0, 11.0, 11.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.83203125, -3.6953125, -3.55859375, -3.421875, -3.28515625, -3.1484375, -3.01171875, -2.875, -2.73828125, -2.6015625, -2.46484375, -2.328125, -2.19140625, -2.0546875, -1.91796875, -1.78125, -1.64453125, -1.5078125, -1.37109375, -1.234375, -1.09765625, -0.9609375, -0.82421875, -0.6875, -0.55078125, -0.4140625, -0.27734375, -0.140625, -0.00390625, 0.1328125, 0.26953125, 0.40625, 0.54296875, 0.6796875, 0.81640625, 0.953125, 1.08984375, 1.2265625, 1.36328125, 1.5, 1.63671875, 1.7734375, 1.91015625, 2.046875, 2.18359375, 2.3203125, 2.45703125, 2.59375, 2.73046875, 2.8671875, 3.00390625, 3.140625, 3.27734375, 3.4140625, 3.55078125, 3.6875, 3.82421875, 3.9609375, 4.09765625, 4.234375, 4.37109375, 4.5078125, 4.64453125, 4.78125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 12.0, 23.0, 42.0, 79.0, 168.0, 292.0, 185.0, 90.0, 42.0, 18.0, 10.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.86444091796875, -4.6741943359375, -4.48394775390625, -4.293701171875, -4.10345458984375, -3.9132080078125, -3.72296142578125, -3.53271484375, -3.34246826171875, -3.1522216796875, -2.96197509765625, -2.771728515625, -2.58148193359375, -2.3912353515625, -2.20098876953125, -2.0107421875, -1.82049560546875, -1.6302490234375, -1.44000244140625, -1.249755859375, -1.05950927734375, -0.8692626953125, -0.67901611328125, -0.48876953125, -0.29852294921875, -0.1082763671875, 0.08197021484375, 0.272216796875, 0.46246337890625, 0.6527099609375, 0.84295654296875, 1.033203125, 1.22344970703125, 1.4136962890625, 1.60394287109375, 1.794189453125, 1.98443603515625, 2.1746826171875, 2.36492919921875, 2.55517578125, 2.74542236328125, 2.9356689453125, 3.12591552734375, 3.316162109375, 3.50640869140625, 3.6966552734375, 3.88690185546875, 4.0771484375, 4.26739501953125, 4.4576416015625, 4.64788818359375, 4.838134765625, 5.02838134765625, 5.2186279296875, 5.40887451171875, 5.59912109375, 5.78936767578125, 5.9796142578125, 6.16986083984375, 6.360107421875, 6.55035400390625, 6.7406005859375, 6.93084716796875, 7.12109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 7.0, 4.0, 12.0, 29.0, 39.0, 63.0, 100.0, 170.0, 176.0, 141.0, 84.0, 75.0, 23.0, 28.0, 9.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.101444244384766, -31.63323211669922, -30.165019989013672, -28.696807861328125, -27.228595733642578, -25.76038360595703, -24.292171478271484, -22.823959350585938, -21.35574722290039, -19.887535095214844, -18.419322967529297, -16.95111083984375, -15.482898712158203, -14.014686584472656, -12.54647445678711, -11.078262329101562, -9.610050201416016, -8.141838073730469, -6.673625946044922, -5.205413818359375, -3.737201690673828, -2.2689895629882812, -0.8007774353027344, 0.6674346923828125, 2.1356468200683594, 3.6038589477539062, 5.072071075439453, 6.540283203125, 8.008495330810547, 9.476707458496094, 10.94491958618164, 12.413131713867188, 13.88134765625, 15.349559783935547, 16.817771911621094, 18.28598403930664, 19.754196166992188, 21.222408294677734, 22.69062042236328, 24.158832550048828, 25.627044677734375, 27.095256805419922, 28.56346893310547, 30.031681060791016, 31.499893188476562, 32.96810531616211, 34.436317443847656, 35.9045295715332, 37.37274169921875, 38.8409538269043, 40.309165954589844, 41.77737808227539, 43.24559020996094, 44.713802337646484, 46.18201446533203, 47.65022659301758, 49.118438720703125, 50.58665084838867, 52.05486297607422, 53.523075103759766, 54.99128723144531, 56.45949935913086, 57.927711486816406, 59.39592361450195, 60.8641357421875]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 10.0, 12.0, 19.0, 20.0, 20.0, 20.0, 31.0, 35.0, 25.0, 41.0, 38.0, 38.0, 46.0, 47.0, 55.0, 49.0, 43.0, 41.0, 39.0, 39.0, 33.0, 45.0, 32.0, 32.0, 29.0, 25.0, 28.0, 16.0, 11.0, 17.0, 10.0, 6.0, 10.0, 4.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03066635131836, -38.79706573486328, -37.5634651184082, -36.329864501953125, -35.09626388549805, -33.86266326904297, -32.62906265258789, -31.395462036132812, -30.161861419677734, -28.928260803222656, -27.694660186767578, -26.4610595703125, -25.227458953857422, -23.993858337402344, -22.760257720947266, -21.526657104492188, -20.29305648803711, -19.05945587158203, -17.825855255126953, -16.592254638671875, -15.358654022216797, -14.125053405761719, -12.89145278930664, -11.657852172851562, -10.424251556396484, -9.190650939941406, -7.957050323486328, -6.72344970703125, -5.489849090576172, -4.256248474121094, -3.0226478576660156, -1.7890472412109375, -0.5554428100585938, 0.6781578063964844, 1.9117584228515625, 3.1453590393066406, 4.378959655761719, 5.612560272216797, 6.846160888671875, 8.079761505126953, 9.313362121582031, 10.54696273803711, 11.780563354492188, 13.014163970947266, 14.247764587402344, 15.481365203857422, 16.7149658203125, 17.948566436767578, 19.182167053222656, 20.415767669677734, 21.649368286132812, 22.88296890258789, 24.11656951904297, 25.350170135498047, 26.583770751953125, 27.817371368408203, 29.05097198486328, 30.28457260131836, 31.518173217773438, 32.751773834228516, 33.985374450683594, 35.21897506713867, 36.45257568359375, 37.68617630004883, 38.919776916503906]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 13.0, 13.0, 16.0, 35.0, 41.0, 47.0, 71.0, 98.0, 149.0, 215.0, 319.0, 481.0, 705.0, 1161.0, 1943.0, 3586.0, 7310.0, 16565.0, 56258.0, 740597.0, 3239716.0, 84135.0, 21534.0, 8670.0, 4195.0, 2387.0, 1409.0, 831.0, 571.0, 362.0, 233.0, 166.0, 122.0, 93.0, 56.0, 50.0, 35.0, 17.0, 26.0, 18.0, 9.0, 8.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.888671875, -4.71484375, -4.541015625, -4.3671875, -4.193359375, -4.01953125, -3.845703125, -3.671875, -3.498046875, -3.32421875, -3.150390625, -2.9765625, -2.802734375, -2.62890625, -2.455078125, -2.28125, -2.107421875, -1.93359375, -1.759765625, -1.5859375, -1.412109375, -1.23828125, -1.064453125, -0.890625, -0.716796875, -0.54296875, -0.369140625, -0.1953125, -0.021484375, 0.15234375, 0.326171875, 0.5, 0.673828125, 0.84765625, 1.021484375, 1.1953125, 1.369140625, 1.54296875, 1.716796875, 1.890625, 2.064453125, 2.23828125, 2.412109375, 2.5859375, 2.759765625, 2.93359375, 3.107421875, 3.28125, 3.455078125, 3.62890625, 3.802734375, 3.9765625, 4.150390625, 4.32421875, 4.498046875, 4.671875, 4.845703125, 5.01953125, 5.193359375, 5.3671875, 5.541015625, 5.71484375, 5.888671875, 6.0625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 4.0, 11.0, 13.0, 14.0, 14.0, 25.0, 25.0, 20.0, 28.0, 38.0, 40.0, 59.0, 44.0, 47.0, 53.0, 51.0, 50.0, 54.0, 53.0, 42.0, 40.0, 41.0, 29.0, 42.0, 29.0, 20.0, 22.0, 18.0, 16.0, 7.0, 11.0, 5.0, 7.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.6767425537109375, -1.621063232421875, -1.5653839111328125, -1.50970458984375, -1.4540252685546875, -1.398345947265625, -1.3426666259765625, -1.2869873046875, -1.2313079833984375, -1.175628662109375, -1.1199493408203125, -1.06427001953125, -1.0085906982421875, -0.952911376953125, -0.8972320556640625, -0.841552734375, -0.7858734130859375, -0.730194091796875, -0.6745147705078125, -0.61883544921875, -0.5631561279296875, -0.507476806640625, -0.4517974853515625, -0.3961181640625, -0.3404388427734375, -0.284759521484375, -0.2290802001953125, -0.17340087890625, -0.1177215576171875, -0.062042236328125, -0.0063629150390625, 0.04931640625, 0.1049957275390625, 0.160675048828125, 0.2163543701171875, 0.27203369140625, 0.3277130126953125, 0.383392333984375, 0.4390716552734375, 0.4947509765625, 0.5504302978515625, 0.606109619140625, 0.6617889404296875, 0.71746826171875, 0.7731475830078125, 0.828826904296875, 0.8845062255859375, 0.940185546875, 0.9958648681640625, 1.051544189453125, 1.1072235107421875, 1.16290283203125, 1.2185821533203125, 1.274261474609375, 1.3299407958984375, 1.3856201171875, 1.4412994384765625, 1.496978759765625, 1.5526580810546875, 1.60833740234375, 1.6640167236328125, 1.719696044921875, 1.7753753662109375, 1.8310546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 9.0, 14.0, 17.0, 16.0, 22.0, 23.0, 24.0, 28.0, 41.0, 47.0, 68.0, 82.0, 234.0, 466.0, 1443.0, 7320.0, 162105.0, 3979771.0, 37381.0, 3491.0, 868.0, 350.0, 142.0, 78.0, 41.0, 27.0, 35.0, 20.0, 26.0, 16.0, 13.0, 13.0, 9.0, 4.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.268798828125, -11.88916015625, -11.509521484375, -11.1298828125, -10.750244140625, -10.37060546875, -9.990966796875, -9.611328125, -9.231689453125, -8.85205078125, -8.472412109375, -8.0927734375, -7.713134765625, -7.33349609375, -6.953857421875, -6.57421875, -6.194580078125, -5.81494140625, -5.435302734375, -5.0556640625, -4.676025390625, -4.29638671875, -3.916748046875, -3.537109375, -3.157470703125, -2.77783203125, -2.398193359375, -2.0185546875, -1.638916015625, -1.25927734375, -0.879638671875, -0.5, -0.120361328125, 0.25927734375, 0.638916015625, 1.0185546875, 1.398193359375, 1.77783203125, 2.157470703125, 2.537109375, 2.916748046875, 3.29638671875, 3.676025390625, 4.0556640625, 4.435302734375, 4.81494140625, 5.194580078125, 5.57421875, 5.953857421875, 6.33349609375, 6.713134765625, 7.0927734375, 7.472412109375, 7.85205078125, 8.231689453125, 8.611328125, 8.990966796875, 9.37060546875, 9.750244140625, 10.1298828125, 10.509521484375, 10.88916015625, 11.268798828125, 11.6484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 6.0, 10.0, 29.0, 57.0, 210.0, 2406.0, 1190.0, 115.0, 29.0, 19.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -9.125701904296875, -8.93109130859375, -8.736480712890625, -8.5418701171875, -8.347259521484375, -8.15264892578125, -7.958038330078125, -7.763427734375, -7.568817138671875, -7.37420654296875, -7.179595947265625, -6.9849853515625, -6.790374755859375, -6.59576416015625, -6.401153564453125, -6.20654296875, -6.011932373046875, -5.81732177734375, -5.622711181640625, -5.4281005859375, -5.233489990234375, -5.03887939453125, -4.844268798828125, -4.649658203125, -4.455047607421875, -4.26043701171875, -4.065826416015625, -3.8712158203125, -3.676605224609375, -3.48199462890625, -3.287384033203125, -3.0927734375, -2.898162841796875, -2.70355224609375, -2.508941650390625, -2.3143310546875, -2.119720458984375, -1.92510986328125, -1.730499267578125, -1.535888671875, -1.341278076171875, -1.14666748046875, -0.952056884765625, -0.7574462890625, -0.562835693359375, -0.36822509765625, -0.173614501953125, 0.02099609375, 0.215606689453125, 0.41021728515625, 0.604827880859375, 0.7994384765625, 0.994049072265625, 1.18865966796875, 1.383270263671875, 1.577880859375, 1.772491455078125, 1.96710205078125, 2.161712646484375, 2.3563232421875, 2.550933837890625, 2.74554443359375, 2.940155029296875, 3.134765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 17.0, 27.0, 50.0, 94.0, 181.0, 213.0, 187.0, 129.0, 51.0, 24.0, 11.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.377098083496094, -17.820680618286133, -17.264263153076172, -16.70784568786621, -16.15142822265625, -15.595010757446289, -15.038594245910645, -14.482176780700684, -13.925759315490723, -13.369341850280762, -12.8129243850708, -12.25650691986084, -11.700090408325195, -11.143672943115234, -10.587255477905273, -10.030838012695312, -9.474420547485352, -8.91800308227539, -8.36158561706543, -7.805168628692627, -7.248751163482666, -6.692333698272705, -6.135916709899902, -5.579499244689941, -5.0230817794799805, -4.4666643142700195, -3.9102470874786377, -3.353829860687256, -2.797412395477295, -2.240994930267334, -1.6845777034759521, -1.1281604766845703, -0.5717449188232422, -0.0153275728225708, 0.5410897731781006, 1.097507119178772, 1.6539244651794434, 2.2103419303894043, 2.766759157180786, 3.323176383972168, 3.879593849182129, 4.43601131439209, 4.992428779602051, 5.5488457679748535, 6.1052632331848145, 6.661680698394775, 7.218097686767578, 7.774515151977539, 8.3309326171875, 8.887350082397461, 9.443767547607422, 10.000185012817383, 10.556602478027344, 11.113019943237305, 11.66943645477295, 12.22585391998291, 12.782271385192871, 13.338688850402832, 13.895106315612793, 14.451523780822754, 15.007940292358398, 15.56435775756836, 16.12077522277832, 16.67719268798828, 17.233610153198242]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 12.0, 16.0, 18.0, 37.0, 37.0, 51.0, 54.0, 85.0, 99.0, 99.0, 86.0, 67.0, 77.0, 66.0, 54.0, 51.0, 26.0, 30.0, 11.0, 10.0, 4.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.301892280578613, -11.808430671691895, -11.314970016479492, -10.821508407592773, -10.328046798706055, -9.834585189819336, -9.341124534606934, -8.847662925720215, -8.354202270507812, -7.860741138458252, -7.367279529571533, -6.873818397521973, -6.380356788635254, -5.886895656585693, -5.393434524536133, -4.899972915649414, -4.406511306762695, -3.9130499362945557, -3.419588565826416, -2.9261274337768555, -2.432666063308716, -1.9392046928405762, -1.4457435607910156, -0.952282190322876, -0.45882081985473633, 0.034640491008758545, 0.5281018018722534, 1.0215630531311035, 1.5150244235992432, 2.008485794067383, 2.5019469261169434, 2.995408296585083, 3.488870620727539, 3.9823319911956787, 4.475793361663818, 4.969254493713379, 5.462716102600098, 5.956177234649658, 6.449638366699219, 6.9430999755859375, 7.436561107635498, 7.930022239685059, 8.423483848571777, 8.91694450378418, 9.410406112670898, 9.903867721557617, 10.397329330444336, 10.890789985656738, 11.384251594543457, 11.877713203430176, 12.371173858642578, 12.864635467529297, 13.358097076416016, 13.851558685302734, 14.345019340515137, 14.838480949401855, 15.331941604614258, 15.825403213500977, 16.318864822387695, 16.81232452392578, 17.3057861328125, 17.79924774169922, 18.292709350585938, 18.786170959472656, 19.279632568359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 22.0, 21.0, 17.0, 42.0, 53.0, 77.0, 97.0, 160.0, 242.0, 360.0, 566.0, 846.0, 1252.0, 2076.0, 3239.0, 5132.0, 8935.0, 15282.0, 28325.0, 55729.0, 115440.0, 236786.0, 277914.0, 145516.0, 69953.0, 35218.0, 18492.0, 10411.0, 6094.0, 3636.0, 2317.0, 1491.0, 949.0, 631.0, 392.0, 238.0, 190.0, 124.0, 81.0, 59.0, 51.0, 30.0, 21.0, 15.0, 13.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.640625, -4.5047607421875, -4.368896484375, -4.2330322265625, -4.09716796875, -3.9613037109375, -3.825439453125, -3.6895751953125, -3.5537109375, -3.4178466796875, -3.281982421875, -3.1461181640625, -3.01025390625, -2.8743896484375, -2.738525390625, -2.6026611328125, -2.466796875, -2.3309326171875, -2.195068359375, -2.0592041015625, -1.92333984375, -1.7874755859375, -1.651611328125, -1.5157470703125, -1.3798828125, -1.2440185546875, -1.108154296875, -0.9722900390625, -0.83642578125, -0.7005615234375, -0.564697265625, -0.4288330078125, -0.29296875, -0.1571044921875, -0.021240234375, 0.1146240234375, 0.25048828125, 0.3863525390625, 0.522216796875, 0.6580810546875, 0.7939453125, 0.9298095703125, 1.065673828125, 1.2015380859375, 1.33740234375, 1.4732666015625, 1.609130859375, 1.7449951171875, 1.880859375, 2.0167236328125, 2.152587890625, 2.2884521484375, 2.42431640625, 2.5601806640625, 2.696044921875, 2.8319091796875, 2.9677734375, 3.1036376953125, 3.239501953125, 3.3753662109375, 3.51123046875, 3.6470947265625, 3.782958984375, 3.9188232421875, 4.0546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 2.0, 6.0, 9.0, 13.0, 22.0, 9.0, 23.0, 27.0, 20.0, 30.0, 34.0, 37.0, 57.0, 57.0, 58.0, 46.0, 48.0, 56.0, 57.0, 57.0, 46.0, 45.0, 32.0, 24.0, 34.0, 24.0, 25.0, 19.0, 16.0, 10.0, 8.0, 8.0, 7.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.79901123046875, -1.7425537109375, -1.68609619140625, -1.629638671875, -1.57318115234375, -1.5167236328125, -1.46026611328125, -1.40380859375, -1.34735107421875, -1.2908935546875, -1.23443603515625, -1.177978515625, -1.12152099609375, -1.0650634765625, -1.00860595703125, -0.9521484375, -0.89569091796875, -0.8392333984375, -0.78277587890625, -0.726318359375, -0.66986083984375, -0.6134033203125, -0.55694580078125, -0.50048828125, -0.44403076171875, -0.3875732421875, -0.33111572265625, -0.274658203125, -0.21820068359375, -0.1617431640625, -0.10528564453125, -0.048828125, 0.00762939453125, 0.0640869140625, 0.12054443359375, 0.177001953125, 0.23345947265625, 0.2899169921875, 0.34637451171875, 0.40283203125, 0.45928955078125, 0.5157470703125, 0.57220458984375, 0.628662109375, 0.68511962890625, 0.7415771484375, 0.79803466796875, 0.8544921875, 0.91094970703125, 0.9674072265625, 1.02386474609375, 1.080322265625, 1.13677978515625, 1.1932373046875, 1.24969482421875, 1.30615234375, 1.36260986328125, 1.4190673828125, 1.47552490234375, 1.531982421875, 1.58843994140625, 1.6448974609375, 1.70135498046875, 1.7578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 8.0, 8.0, 15.0, 15.0, 20.0, 29.0, 56.0, 80.0, 82.0, 124.0, 175.0, 273.0, 364.0, 594.0, 1047.0, 1920.0, 3942.0, 8286.0, 20045.0, 54640.0, 174177.0, 423776.0, 238551.0, 74043.0, 25502.0, 10467.0, 4722.0, 2291.0, 1198.0, 738.0, 423.0, 284.0, 174.0, 140.0, 100.0, 64.0, 53.0, 43.0, 25.0, 19.0, 9.0, 10.0, 5.0, 6.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6484375, -4.4915771484375, -4.334716796875, -4.1778564453125, -4.02099609375, -3.8641357421875, -3.707275390625, -3.5504150390625, -3.3935546875, -3.2366943359375, -3.079833984375, -2.9229736328125, -2.76611328125, -2.6092529296875, -2.452392578125, -2.2955322265625, -2.138671875, -1.9818115234375, -1.824951171875, -1.6680908203125, -1.51123046875, -1.3543701171875, -1.197509765625, -1.0406494140625, -0.8837890625, -0.7269287109375, -0.570068359375, -0.4132080078125, -0.25634765625, -0.0994873046875, 0.057373046875, 0.2142333984375, 0.37109375, 0.5279541015625, 0.684814453125, 0.8416748046875, 0.99853515625, 1.1553955078125, 1.312255859375, 1.4691162109375, 1.6259765625, 1.7828369140625, 1.939697265625, 2.0965576171875, 2.25341796875, 2.4102783203125, 2.567138671875, 2.7239990234375, 2.880859375, 3.0377197265625, 3.194580078125, 3.3514404296875, 3.50830078125, 3.6651611328125, 3.822021484375, 3.9788818359375, 4.1357421875, 4.2926025390625, 4.449462890625, 4.6063232421875, 4.76318359375, 4.9200439453125, 5.076904296875, 5.2337646484375, 5.390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 2.0, 7.0, 15.0, 10.0, 6.0, 17.0, 16.0, 22.0, 22.0, 24.0, 37.0, 39.0, 50.0, 41.0, 44.0, 46.0, 45.0, 57.0, 43.0, 50.0, 38.0, 40.0, 48.0, 35.0, 32.0, 30.0, 30.0, 29.0, 25.0, 20.0, 15.0, 11.0, 21.0, 6.0, 4.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.42156982421875, -5.1986083984375, -4.97564697265625, -4.752685546875, -4.52972412109375, -4.3067626953125, -4.08380126953125, -3.86083984375, -3.63787841796875, -3.4149169921875, -3.19195556640625, -2.968994140625, -2.74603271484375, -2.5230712890625, -2.30010986328125, -2.0771484375, -1.85418701171875, -1.6312255859375, -1.40826416015625, -1.185302734375, -0.96234130859375, -0.7393798828125, -0.51641845703125, -0.29345703125, -0.07049560546875, 0.1524658203125, 0.37542724609375, 0.598388671875, 0.82135009765625, 1.0443115234375, 1.26727294921875, 1.490234375, 1.71319580078125, 1.9361572265625, 2.15911865234375, 2.382080078125, 2.60504150390625, 2.8280029296875, 3.05096435546875, 3.27392578125, 3.49688720703125, 3.7198486328125, 3.94281005859375, 4.165771484375, 4.38873291015625, 4.6116943359375, 4.83465576171875, 5.0576171875, 5.28057861328125, 5.5035400390625, 5.72650146484375, 5.949462890625, 6.17242431640625, 6.3953857421875, 6.61834716796875, 6.84130859375, 7.06427001953125, 7.2872314453125, 7.51019287109375, 7.733154296875, 7.95611572265625, 8.1790771484375, 8.40203857421875, 8.625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 9.0, 15.0, 31.0, 37.0, 72.0, 98.0, 198.0, 365.0, 684.0, 1644.0, 4100.0, 11432.0, 41209.0, 239092.0, 587312.0, 123321.0, 25503.0, 7839.0, 2973.0, 1254.0, 613.0, 308.0, 183.0, 78.0, 44.0, 28.0, 31.0, 12.0, 13.0, 10.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.85125732421875, -2.7630615234375, -2.67486572265625, -2.586669921875, -2.49847412109375, -2.4102783203125, -2.32208251953125, -2.23388671875, -2.14569091796875, -2.0574951171875, -1.96929931640625, -1.881103515625, -1.79290771484375, -1.7047119140625, -1.61651611328125, -1.5283203125, -1.44012451171875, -1.3519287109375, -1.26373291015625, -1.175537109375, -1.08734130859375, -0.9991455078125, -0.91094970703125, -0.82275390625, -0.73455810546875, -0.6463623046875, -0.55816650390625, -0.469970703125, -0.38177490234375, -0.2935791015625, -0.20538330078125, -0.1171875, -0.02899169921875, 0.0592041015625, 0.14739990234375, 0.235595703125, 0.32379150390625, 0.4119873046875, 0.50018310546875, 0.58837890625, 0.67657470703125, 0.7647705078125, 0.85296630859375, 0.941162109375, 1.02935791015625, 1.1175537109375, 1.20574951171875, 1.2939453125, 1.38214111328125, 1.4703369140625, 1.55853271484375, 1.646728515625, 1.73492431640625, 1.8231201171875, 1.91131591796875, 1.99951171875, 2.08770751953125, 2.1759033203125, 2.26409912109375, 2.352294921875, 2.44049072265625, 2.5286865234375, 2.61688232421875, 2.705078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 6.0, 6.0, 8.0, 8.0, 15.0, 19.0, 29.0, 27.0, 23.0, 41.0, 52.0, 72.0, 104.0, 102.0, 119.0, 80.0, 67.0, 49.0, 25.0, 25.0, 20.0, 24.0, 14.0, 8.0, 11.0, 13.0, 8.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034689903259277344, -0.0003348439931869507, -0.00032278895378112793, -0.0003107339143753052, -0.0002986788749694824, -0.00028662383556365967, -0.0002745687961578369, -0.00026251375675201416, -0.0002504587173461914, -0.00023840367794036865, -0.0002263486385345459, -0.00021429359912872314, -0.0002022385597229004, -0.00019018352031707764, -0.00017812848091125488, -0.00016607344150543213, -0.00015401840209960938, -0.00014196336269378662, -0.00012990832328796387, -0.00011785328388214111, -0.00010579824447631836, -9.37432050704956e-05, -8.168816566467285e-05, -6.96331262588501e-05, -5.7578086853027344e-05, -4.552304744720459e-05, -3.3468008041381836e-05, -2.1412968635559082e-05, -9.357929229736328e-06, 2.6971101760864258e-06, 1.475214958190918e-05, 2.6807188987731934e-05, 3.886222839355469e-05, 5.091726779937744e-05, 6.29723072052002e-05, 7.502734661102295e-05, 8.70823860168457e-05, 9.913742542266846e-05, 0.00011119246482849121, 0.00012324750423431396, 0.00013530254364013672, 0.00014735758304595947, 0.00015941262245178223, 0.00017146766185760498, 0.00018352270126342773, 0.0001955777406692505, 0.00020763278007507324, 0.000219687819480896, 0.00023174285888671875, 0.0002437978982925415, 0.00025585293769836426, 0.000267907977104187, 0.00027996301651000977, 0.0002920180559158325, 0.0003040730953216553, 0.00031612813472747803, 0.0003281831741333008, 0.00034023821353912354, 0.0003522932529449463, 0.00036434829235076904, 0.0003764033317565918, 0.00038845837116241455, 0.0004005134105682373, 0.00041256844997406006, 0.0004246234893798828]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 5.0, 13.0, 9.0, 25.0, 32.0, 59.0, 110.0, 185.0, 404.0, 779.0, 1934.0, 6279.0, 30625.0, 434856.0, 527866.0, 34613.0, 6932.0, 2156.0, 773.0, 389.0, 212.0, 125.0, 68.0, 29.0, 18.0, 14.0, 11.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.5540771484375, -4.397216796875, -4.2403564453125, -4.08349609375, -3.9266357421875, -3.769775390625, -3.6129150390625, -3.4560546875, -3.2991943359375, -3.142333984375, -2.9854736328125, -2.82861328125, -2.6717529296875, -2.514892578125, -2.3580322265625, -2.201171875, -2.0443115234375, -1.887451171875, -1.7305908203125, -1.57373046875, -1.4168701171875, -1.260009765625, -1.1031494140625, -0.9462890625, -0.7894287109375, -0.632568359375, -0.4757080078125, -0.31884765625, -0.1619873046875, -0.005126953125, 0.1517333984375, 0.30859375, 0.4654541015625, 0.622314453125, 0.7791748046875, 0.93603515625, 1.0928955078125, 1.249755859375, 1.4066162109375, 1.5634765625, 1.7203369140625, 1.877197265625, 2.0340576171875, 2.19091796875, 2.3477783203125, 2.504638671875, 2.6614990234375, 2.818359375, 2.9752197265625, 3.132080078125, 3.2889404296875, 3.44580078125, 3.6026611328125, 3.759521484375, 3.9163818359375, 4.0732421875, 4.2301025390625, 4.386962890625, 4.5438232421875, 4.70068359375, 4.8575439453125, 5.014404296875, 5.1712646484375, 5.328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 6.0, 9.0, 16.0, 22.0, 34.0, 68.0, 153.0, 208.0, 180.0, 116.0, 60.0, 31.0, 18.0, 20.0, 8.0, 9.0, 10.0, 4.0, 7.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.2581787109375, -4.110107421875, -3.9620361328125, -3.81396484375, -3.6658935546875, -3.517822265625, -3.3697509765625, -3.2216796875, -3.0736083984375, -2.925537109375, -2.7774658203125, -2.62939453125, -2.4813232421875, -2.333251953125, -2.1851806640625, -2.037109375, -1.8890380859375, -1.740966796875, -1.5928955078125, -1.44482421875, -1.2967529296875, -1.148681640625, -1.0006103515625, -0.8525390625, -0.7044677734375, -0.556396484375, -0.4083251953125, -0.26025390625, -0.1121826171875, 0.035888671875, 0.1839599609375, 0.33203125, 0.4801025390625, 0.628173828125, 0.7762451171875, 0.92431640625, 1.0723876953125, 1.220458984375, 1.3685302734375, 1.5166015625, 1.6646728515625, 1.812744140625, 1.9608154296875, 2.10888671875, 2.2569580078125, 2.405029296875, 2.5531005859375, 2.701171875, 2.8492431640625, 2.997314453125, 3.1453857421875, 3.29345703125, 3.4415283203125, 3.589599609375, 3.7376708984375, 3.8857421875, 4.0338134765625, 4.181884765625, 4.3299560546875, 4.47802734375, 4.6260986328125, 4.774169921875, 4.9222412109375, 5.0703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 9.0, 9.0, 25.0, 24.0, 44.0, 84.0, 130.0, 185.0, 202.0, 127.0, 71.0, 40.0, 23.0, 7.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.56689453125, -21.887048721313477, -20.207202911376953, -18.527359008789062, -16.847511291503906, -15.1676664352417, -13.487821578979492, -11.807975769042969, -10.128129959106445, -8.448284149169922, -6.768438816070557, -5.088593482971191, -3.408747673034668, -1.7289018630981445, -0.0490570068359375, 1.630788803100586, 3.3106346130371094, 4.990480422973633, 6.670325756072998, 8.350171089172363, 10.030016899108887, 11.70986270904541, 13.389707565307617, 15.06955337524414, 16.749399185180664, 18.429244995117188, 20.10909080505371, 21.788936614990234, 23.468780517578125, 25.14862823486328, 26.828472137451172, 28.508317947387695, 30.18816375732422, 31.868009567260742, 33.547855377197266, 35.227699279785156, 36.90754699707031, 38.5873908996582, 40.267234802246094, 41.94708251953125, 43.626930236816406, 45.3067741394043, 46.98662185668945, 48.666465759277344, 50.3463134765625, 52.02615737915039, 53.70600128173828, 55.38584899902344, 57.06569290161133, 58.74553680419922, 60.425384521484375, 62.105228424072266, 63.78507614135742, 65.46492004394531, 67.14476776123047, 68.82461547851562, 70.50445556640625, 72.1843032836914, 73.86414337158203, 75.54399108886719, 77.22383880615234, 78.9036865234375, 80.58352661132812, 82.26337432861328, 83.94322204589844]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 3.0, 11.0, 12.0, 12.0, 17.0, 11.0, 17.0, 15.0, 19.0, 18.0, 28.0, 25.0, 29.0, 26.0, 25.0, 37.0, 35.0, 32.0, 34.0, 38.0, 41.0, 44.0, 46.0, 22.0, 46.0, 34.0, 34.0, 34.0, 27.0, 30.0, 27.0, 23.0, 23.0, 19.0, 19.0, 19.0, 12.0, 3.0, 7.0, 7.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-32.294132232666016, -31.28063201904297, -30.267131805419922, -29.253631591796875, -28.24013328552246, -27.226633071899414, -26.213132858276367, -25.19963264465332, -24.186134338378906, -23.17263412475586, -22.159133911132812, -21.145633697509766, -20.13213539123535, -19.118635177612305, -18.105134963989258, -17.09163475036621, -16.078134536743164, -15.064634323120117, -14.051135063171387, -13.03763484954834, -12.02413558959961, -11.010635375976562, -9.997135162353516, -8.983634948730469, -7.970135688781738, -6.95663595199585, -5.943136215209961, -4.929636001586914, -3.9161362648010254, -2.9026365280151367, -1.8891363143920898, -0.8756365776062012, 0.1378631591796875, 1.1513630151748657, 2.164862871170044, 3.1783628463745117, 4.1918625831604, 5.205362319946289, 6.218862533569336, 7.232362270355225, 8.245862007141113, 9.25936222076416, 10.27286148071289, 11.286361694335938, 12.299861907958984, 13.313361167907715, 14.326861381530762, 15.340360641479492, 16.35386085510254, 17.367361068725586, 18.380861282348633, 19.394359588623047, 20.407859802246094, 21.42136001586914, 22.434860229492188, 23.448360443115234, 24.46186065673828, 25.475360870361328, 26.488861083984375, 27.502361297607422, 28.515859603881836, 29.529359817504883, 30.54286003112793, 31.556360244750977, 32.56985855102539]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 8.0, 20.0, 11.0, 38.0, 41.0, 70.0, 80.0, 119.0, 173.0, 315.0, 474.0, 835.0, 1605.0, 3067.0, 6764.0, 18756.0, 69487.0, 1084767.0, 2879607.0, 90730.0, 21585.0, 8014.0, 3389.0, 1723.0, 984.0, 564.0, 347.0, 226.0, 154.0, 85.0, 79.0, 35.0, 28.0, 35.0, 18.0, 9.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.8828125, -6.68084716796875, -6.4788818359375, -6.27691650390625, -6.074951171875, -5.87298583984375, -5.6710205078125, -5.46905517578125, -5.26708984375, -5.06512451171875, -4.8631591796875, -4.66119384765625, -4.459228515625, -4.25726318359375, -4.0552978515625, -3.85333251953125, -3.6513671875, -3.44940185546875, -3.2474365234375, -3.04547119140625, -2.843505859375, -2.64154052734375, -2.4395751953125, -2.23760986328125, -2.03564453125, -1.83367919921875, -1.6317138671875, -1.42974853515625, -1.227783203125, -1.02581787109375, -0.8238525390625, -0.62188720703125, -0.419921875, -0.21795654296875, -0.0159912109375, 0.18597412109375, 0.387939453125, 0.58990478515625, 0.7918701171875, 0.99383544921875, 1.19580078125, 1.39776611328125, 1.5997314453125, 1.80169677734375, 2.003662109375, 2.20562744140625, 2.4075927734375, 2.60955810546875, 2.8115234375, 3.01348876953125, 3.2154541015625, 3.41741943359375, 3.619384765625, 3.82135009765625, 4.0233154296875, 4.22528076171875, 4.42724609375, 4.62921142578125, 4.8311767578125, 5.03314208984375, 5.235107421875, 5.43707275390625, 5.6390380859375, 5.84100341796875, 6.04296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 3.0, 11.0, 10.0, 13.0, 19.0, 23.0, 28.0, 22.0, 27.0, 36.0, 33.0, 44.0, 49.0, 59.0, 53.0, 56.0, 53.0, 52.0, 56.0, 56.0, 39.0, 39.0, 49.0, 33.0, 29.0, 13.0, 15.0, 24.0, 11.0, 8.0, 6.0, 8.0, 3.0, 7.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.1518707275390625, -2.088897705078125, -2.0259246826171875, -1.96295166015625, -1.8999786376953125, -1.837005615234375, -1.7740325927734375, -1.7110595703125, -1.6480865478515625, -1.585113525390625, -1.5221405029296875, -1.45916748046875, -1.3961944580078125, -1.333221435546875, -1.2702484130859375, -1.207275390625, -1.1443023681640625, -1.081329345703125, -1.0183563232421875, -0.95538330078125, -0.8924102783203125, -0.829437255859375, -0.7664642333984375, -0.7034912109375, -0.6405181884765625, -0.577545166015625, -0.5145721435546875, -0.45159912109375, -0.3886260986328125, -0.325653076171875, -0.2626800537109375, -0.19970703125, -0.1367340087890625, -0.073760986328125, -0.0107879638671875, 0.05218505859375, 0.1151580810546875, 0.178131103515625, 0.2411041259765625, 0.3040771484375, 0.3670501708984375, 0.430023193359375, 0.4929962158203125, 0.55596923828125, 0.6189422607421875, 0.681915283203125, 0.7448883056640625, 0.807861328125, 0.8708343505859375, 0.933807373046875, 0.9967803955078125, 1.05975341796875, 1.1227264404296875, 1.185699462890625, 1.2486724853515625, 1.3116455078125, 1.3746185302734375, 1.437591552734375, 1.5005645751953125, 1.56353759765625, 1.6265106201171875, 1.689483642578125, 1.7524566650390625, 1.8154296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 14.0, 16.0, 18.0, 24.0, 37.0, 47.0, 53.0, 103.0, 201.0, 362.0, 721.0, 1867.0, 4990.0, 19677.0, 155702.0, 3630404.0, 340445.0, 29219.0, 6457.0, 2162.0, 852.0, 340.0, 185.0, 114.0, 79.0, 54.0, 29.0, 35.0, 26.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.48162841796875, -5.2757568359375, -5.06988525390625, -4.864013671875, -4.65814208984375, -4.4522705078125, -4.24639892578125, -4.04052734375, -3.83465576171875, -3.6287841796875, -3.42291259765625, -3.217041015625, -3.01116943359375, -2.8052978515625, -2.59942626953125, -2.3935546875, -2.18768310546875, -1.9818115234375, -1.77593994140625, -1.570068359375, -1.36419677734375, -1.1583251953125, -0.95245361328125, -0.74658203125, -0.54071044921875, -0.3348388671875, -0.12896728515625, 0.076904296875, 0.28277587890625, 0.4886474609375, 0.69451904296875, 0.900390625, 1.10626220703125, 1.3121337890625, 1.51800537109375, 1.723876953125, 1.92974853515625, 2.1356201171875, 2.34149169921875, 2.54736328125, 2.75323486328125, 2.9591064453125, 3.16497802734375, 3.370849609375, 3.57672119140625, 3.7825927734375, 3.98846435546875, 4.1943359375, 4.40020751953125, 4.6060791015625, 4.81195068359375, 5.017822265625, 5.22369384765625, 5.4295654296875, 5.63543701171875, 5.84130859375, 6.04718017578125, 6.2530517578125, 6.45892333984375, 6.664794921875, 6.87066650390625, 7.0765380859375, 7.28240966796875, 7.48828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 11.0, 20.0, 36.0, 51.0, 102.0, 286.0, 1120.0, 1830.0, 357.0, 128.0, 53.0, 24.0, 20.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5390625, -5.401092529296875, -5.26312255859375, -5.125152587890625, -4.9871826171875, -4.849212646484375, -4.71124267578125, -4.573272705078125, -4.435302734375, -4.297332763671875, -4.15936279296875, -4.021392822265625, -3.8834228515625, -3.745452880859375, -3.60748291015625, -3.469512939453125, -3.33154296875, -3.193572998046875, -3.05560302734375, -2.917633056640625, -2.7796630859375, -2.641693115234375, -2.50372314453125, -2.365753173828125, -2.227783203125, -2.089813232421875, -1.95184326171875, -1.813873291015625, -1.6759033203125, -1.537933349609375, -1.39996337890625, -1.261993408203125, -1.1240234375, -0.986053466796875, -0.84808349609375, -0.710113525390625, -0.5721435546875, -0.434173583984375, -0.29620361328125, -0.158233642578125, -0.020263671875, 0.117706298828125, 0.25567626953125, 0.393646240234375, 0.5316162109375, 0.669586181640625, 0.80755615234375, 0.945526123046875, 1.08349609375, 1.221466064453125, 1.35943603515625, 1.497406005859375, 1.6353759765625, 1.773345947265625, 1.91131591796875, 2.049285888671875, 2.187255859375, 2.325225830078125, 2.46319580078125, 2.601165771484375, 2.7391357421875, 2.877105712890625, 3.01507568359375, 3.153045654296875, 3.291015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 10.0, 23.0, 25.0, 69.0, 78.0, 121.0, 155.0, 135.0, 110.0, 100.0, 60.0, 39.0, 17.0, 12.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.33620262145996, -15.902386665344238, -15.468570709228516, -15.03475570678711, -14.600939750671387, -14.167123794555664, -13.733307838439941, -13.299491882324219, -12.865676879882812, -12.43186092376709, -11.998044967651367, -11.564229965209961, -11.130414009094238, -10.696598052978516, -10.262782096862793, -9.82896614074707, -9.395150184631348, -8.961334228515625, -8.527518272399902, -8.09370231628418, -7.659887313842773, -7.226071357727051, -6.792255401611328, -6.3584394454956055, -5.924623966217041, -5.490808010101318, -5.056992530822754, -4.623176574707031, -4.189360618591309, -3.755545139312744, -3.3217291831970215, -2.887913465499878, -2.4540977478027344, -2.020282030105591, -1.5864661931991577, -1.1526503562927246, -0.718834638595581, -0.2850189208984375, 0.14879703521728516, 0.5826127529144287, 1.0164284706115723, 1.4502441883087158, 1.884060025215149, 2.317875862121582, 2.7516915798187256, 3.185507297515869, 3.619323253631592, 4.053138732910156, 4.486954689025879, 4.920770645141602, 5.354586124420166, 5.788402080535889, 6.222217559814453, 6.656033515930176, 7.089849472045898, 7.523665428161621, 7.9574809074401855, 8.39129638671875, 8.825112342834473, 9.258928298950195, 9.692744255065918, 10.12656021118164, 10.560375213623047, 10.99419116973877, 11.428007125854492]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 4.0, 8.0, 5.0, 6.0, 13.0, 11.0, 20.0, 28.0, 26.0, 23.0, 15.0, 28.0, 28.0, 37.0, 38.0, 42.0, 40.0, 41.0, 40.0, 61.0, 51.0, 63.0, 32.0, 28.0, 39.0, 42.0, 24.0, 37.0, 29.0, 27.0, 15.0, 25.0, 10.0, 20.0, 14.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.42820930480957, -9.1572847366333, -8.886359214782715, -8.615434646606445, -8.34450912475586, -8.07358455657959, -7.802659511566162, -7.531734466552734, -7.260809421539307, -6.989884376525879, -6.718959331512451, -6.448034286499023, -6.177109718322754, -5.906184196472168, -5.635259628295898, -5.364334583282471, -5.093409538269043, -4.822484493255615, -4.5515594482421875, -4.28063440322876, -4.009709358215332, -3.7387845516204834, -3.4678597450256348, -3.196934700012207, -2.9260096549987793, -2.6550846099853516, -2.384159564971924, -2.113234758377075, -1.8423097133636475, -1.5713846683502197, -1.3004597425460815, -1.0295348167419434, -0.7586097717285156, -0.48768478631973267, -0.2167598009109497, 0.05416518449783325, 0.3250901699066162, 0.596015214920044, 0.8669401407241821, 1.1378650665283203, 1.408790111541748, 1.6797151565551758, 1.950640082359314, 2.221565008163452, 2.49249005317688, 2.7634150981903076, 3.0343399047851562, 3.305264949798584, 3.5761899948120117, 3.8471150398254395, 4.118040084838867, 4.388965129852295, 4.659890174865723, 4.930814743041992, 5.20173978805542, 5.472664833068848, 5.743589878082275, 6.014514923095703, 6.285439968109131, 6.556365013122559, 6.827289581298828, 7.098215103149414, 7.369139671325684, 7.640064716339111, 7.910989761352539]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 11.0, 11.0, 25.0, 25.0, 53.0, 64.0, 66.0, 110.0, 223.0, 339.0, 572.0, 932.0, 1804.0, 3515.0, 7539.0, 17064.0, 44673.0, 131026.0, 433020.0, 271445.0, 82883.0, 29596.0, 12099.0, 5530.0, 2628.0, 1398.0, 724.0, 429.0, 245.0, 151.0, 106.0, 67.0, 47.0, 39.0, 20.0, 15.0, 20.0, 12.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.10675048828125, -5.9205322265625, -5.73431396484375, -5.548095703125, -5.36187744140625, -5.1756591796875, -4.98944091796875, -4.80322265625, -4.61700439453125, -4.4307861328125, -4.24456787109375, -4.058349609375, -3.87213134765625, -3.6859130859375, -3.49969482421875, -3.3134765625, -3.12725830078125, -2.9410400390625, -2.75482177734375, -2.568603515625, -2.38238525390625, -2.1961669921875, -2.00994873046875, -1.82373046875, -1.63751220703125, -1.4512939453125, -1.26507568359375, -1.078857421875, -0.89263916015625, -0.7064208984375, -0.52020263671875, -0.333984375, -0.14776611328125, 0.0384521484375, 0.22467041015625, 0.410888671875, 0.59710693359375, 0.7833251953125, 0.96954345703125, 1.15576171875, 1.34197998046875, 1.5281982421875, 1.71441650390625, 1.900634765625, 2.08685302734375, 2.2730712890625, 2.45928955078125, 2.6455078125, 2.83172607421875, 3.0179443359375, 3.20416259765625, 3.390380859375, 3.57659912109375, 3.7628173828125, 3.94903564453125, 4.13525390625, 4.32147216796875, 4.5076904296875, 4.69390869140625, 4.880126953125, 5.06634521484375, 5.2525634765625, 5.43878173828125, 5.625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 14.0, 15.0, 5.0, 14.0, 19.0, 24.0, 21.0, 35.0, 27.0, 32.0, 39.0, 47.0, 45.0, 60.0, 49.0, 49.0, 66.0, 47.0, 56.0, 41.0, 49.0, 36.0, 36.0, 31.0, 21.0, 25.0, 16.0, 14.0, 9.0, 9.0, 10.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.095703125, -2.0369873046875, -1.978271484375, -1.9195556640625, -1.86083984375, -1.8021240234375, -1.743408203125, -1.6846923828125, -1.6259765625, -1.5672607421875, -1.508544921875, -1.4498291015625, -1.39111328125, -1.3323974609375, -1.273681640625, -1.2149658203125, -1.15625, -1.0975341796875, -1.038818359375, -0.9801025390625, -0.92138671875, -0.8626708984375, -0.803955078125, -0.7452392578125, -0.6865234375, -0.6278076171875, -0.569091796875, -0.5103759765625, -0.45166015625, -0.3929443359375, -0.334228515625, -0.2755126953125, -0.216796875, -0.1580810546875, -0.099365234375, -0.0406494140625, 0.01806640625, 0.0767822265625, 0.135498046875, 0.1942138671875, 0.2529296875, 0.3116455078125, 0.370361328125, 0.4290771484375, 0.48779296875, 0.5465087890625, 0.605224609375, 0.6639404296875, 0.72265625, 0.7813720703125, 0.840087890625, 0.8988037109375, 0.95751953125, 1.0162353515625, 1.074951171875, 1.1336669921875, 1.1923828125, 1.2510986328125, 1.309814453125, 1.3685302734375, 1.42724609375, 1.4859619140625, 1.544677734375, 1.6033935546875, 1.662109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 8.0, 11.0, 9.0, 16.0, 22.0, 29.0, 30.0, 41.0, 59.0, 74.0, 102.0, 170.0, 269.0, 394.0, 683.0, 1214.0, 2718.0, 7335.0, 25030.0, 113747.0, 605440.0, 229543.0, 42407.0, 11478.0, 3913.0, 1568.0, 811.0, 450.0, 284.0, 190.0, 124.0, 89.0, 67.0, 61.0, 40.0, 28.0, 28.0, 17.0, 11.0, 10.0, 5.0, 9.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5546875, -7.3236083984375, -7.092529296875, -6.8614501953125, -6.63037109375, -6.3992919921875, -6.168212890625, -5.9371337890625, -5.7060546875, -5.4749755859375, -5.243896484375, -5.0128173828125, -4.78173828125, -4.5506591796875, -4.319580078125, -4.0885009765625, -3.857421875, -3.6263427734375, -3.395263671875, -3.1641845703125, -2.93310546875, -2.7020263671875, -2.470947265625, -2.2398681640625, -2.0087890625, -1.7777099609375, -1.546630859375, -1.3155517578125, -1.08447265625, -0.8533935546875, -0.622314453125, -0.3912353515625, -0.16015625, 0.0709228515625, 0.302001953125, 0.5330810546875, 0.76416015625, 0.9952392578125, 1.226318359375, 1.4573974609375, 1.6884765625, 1.9195556640625, 2.150634765625, 2.3817138671875, 2.61279296875, 2.8438720703125, 3.074951171875, 3.3060302734375, 3.537109375, 3.7681884765625, 3.999267578125, 4.2303466796875, 4.46142578125, 4.6925048828125, 4.923583984375, 5.1546630859375, 5.3857421875, 5.6168212890625, 5.847900390625, 6.0789794921875, 6.31005859375, 6.5411376953125, 6.772216796875, 7.0032958984375, 7.234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 7.0, 14.0, 15.0, 18.0, 16.0, 19.0, 33.0, 28.0, 28.0, 42.0, 40.0, 41.0, 42.0, 55.0, 57.0, 48.0, 50.0, 54.0, 42.0, 52.0, 44.0, 32.0, 38.0, 27.0, 20.0, 18.0, 20.0, 16.0, 15.0, 8.0, 18.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.7236328125, -7.486328125, -7.2490234375, -7.01171875, -6.7744140625, -6.537109375, -6.2998046875, -6.0625, -5.8251953125, -5.587890625, -5.3505859375, -5.11328125, -4.8759765625, -4.638671875, -4.4013671875, -4.1640625, -3.9267578125, -3.689453125, -3.4521484375, -3.21484375, -2.9775390625, -2.740234375, -2.5029296875, -2.265625, -2.0283203125, -1.791015625, -1.5537109375, -1.31640625, -1.0791015625, -0.841796875, -0.6044921875, -0.3671875, -0.1298828125, 0.107421875, 0.3447265625, 0.58203125, 0.8193359375, 1.056640625, 1.2939453125, 1.53125, 1.7685546875, 2.005859375, 2.2431640625, 2.48046875, 2.7177734375, 2.955078125, 3.1923828125, 3.4296875, 3.6669921875, 3.904296875, 4.1416015625, 4.37890625, 4.6162109375, 4.853515625, 5.0908203125, 5.328125, 5.5654296875, 5.802734375, 6.0400390625, 6.27734375, 6.5146484375, 6.751953125, 6.9892578125, 7.2265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 7.0, 10.0, 12.0, 14.0, 22.0, 33.0, 50.0, 69.0, 113.0, 214.0, 430.0, 1227.0, 4450.0, 27013.0, 330593.0, 634871.0, 40308.0, 6396.0, 1539.0, 543.0, 276.0, 116.0, 74.0, 48.0, 32.0, 22.0, 15.0, 12.0, 11.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.805389404296875, -3.68304443359375, -3.560699462890625, -3.4383544921875, -3.316009521484375, -3.19366455078125, -3.071319580078125, -2.948974609375, -2.826629638671875, -2.70428466796875, -2.581939697265625, -2.4595947265625, -2.337249755859375, -2.21490478515625, -2.092559814453125, -1.97021484375, -1.847869873046875, -1.72552490234375, -1.603179931640625, -1.4808349609375, -1.358489990234375, -1.23614501953125, -1.113800048828125, -0.991455078125, -0.869110107421875, -0.74676513671875, -0.624420166015625, -0.5020751953125, -0.379730224609375, -0.25738525390625, -0.135040283203125, -0.0126953125, 0.109649658203125, 0.23199462890625, 0.354339599609375, 0.4766845703125, 0.599029541015625, 0.72137451171875, 0.843719482421875, 0.966064453125, 1.088409423828125, 1.21075439453125, 1.333099365234375, 1.4554443359375, 1.577789306640625, 1.70013427734375, 1.822479248046875, 1.94482421875, 2.067169189453125, 2.18951416015625, 2.311859130859375, 2.4342041015625, 2.556549072265625, 2.67889404296875, 2.801239013671875, 2.923583984375, 3.045928955078125, 3.16827392578125, 3.290618896484375, 3.4129638671875, 3.535308837890625, 3.65765380859375, 3.779998779296875, 3.90234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 10.0, 11.0, 17.0, 26.0, 30.0, 40.0, 81.0, 195.0, 248.0, 134.0, 69.0, 30.0, 26.0, 17.0, 14.0, 10.0, 10.0, 1.0, 8.0, 2.0, 2.0, 8.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008015632629394531, -0.0007816553115844727, -0.0007617473602294922, -0.0007418394088745117, -0.0007219314575195312, -0.0007020235061645508, -0.0006821155548095703, -0.0006622076034545898, -0.0006422996520996094, -0.0006223917007446289, -0.0006024837493896484, -0.000582575798034668, -0.0005626678466796875, -0.000542759895324707, -0.0005228519439697266, -0.0005029439926147461, -0.0004830360412597656, -0.00046312808990478516, -0.0004432201385498047, -0.0004233121871948242, -0.00040340423583984375, -0.0003834962844848633, -0.0003635883331298828, -0.00034368038177490234, -0.0003237724304199219, -0.0003038644790649414, -0.00028395652770996094, -0.00026404857635498047, -0.000244140625, -0.00022423267364501953, -0.00020432472229003906, -0.0001844167709350586, -0.00016450881958007812, -0.00014460086822509766, -0.0001246929168701172, -0.00010478496551513672, -8.487701416015625e-05, -6.496906280517578e-05, -4.506111145019531e-05, -2.5153160095214844e-05, -5.245208740234375e-06, 1.4662742614746094e-05, 3.457069396972656e-05, 5.447864532470703e-05, 7.43865966796875e-05, 9.429454803466797e-05, 0.00011420249938964844, 0.0001341104507446289, 0.00015401840209960938, 0.00017392635345458984, 0.0001938343048095703, 0.00021374225616455078, 0.00023365020751953125, 0.0002535581588745117, 0.0002734661102294922, 0.00029337406158447266, 0.0003132820129394531, 0.0003331899642944336, 0.00035309791564941406, 0.00037300586700439453, 0.000392913818359375, 0.00041282176971435547, 0.00043272972106933594, 0.0004526376724243164, 0.0004725456237792969]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 0.0, 8.0, 6.0, 9.0, 13.0, 20.0, 34.0, 68.0, 99.0, 164.0, 318.0, 644.0, 1745.0, 6917.0, 51239.0, 830936.0, 136904.0, 14685.0, 2798.0, 984.0, 445.0, 197.0, 107.0, 75.0, 46.0, 30.0, 19.0, 9.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.33984375, -5.1943359375, -5.048828125, -4.9033203125, -4.7578125, -4.6123046875, -4.466796875, -4.3212890625, -4.17578125, -4.0302734375, -3.884765625, -3.7392578125, -3.59375, -3.4482421875, -3.302734375, -3.1572265625, -3.01171875, -2.8662109375, -2.720703125, -2.5751953125, -2.4296875, -2.2841796875, -2.138671875, -1.9931640625, -1.84765625, -1.7021484375, -1.556640625, -1.4111328125, -1.265625, -1.1201171875, -0.974609375, -0.8291015625, -0.68359375, -0.5380859375, -0.392578125, -0.2470703125, -0.1015625, 0.0439453125, 0.189453125, 0.3349609375, 0.48046875, 0.6259765625, 0.771484375, 0.9169921875, 1.0625, 1.2080078125, 1.353515625, 1.4990234375, 1.64453125, 1.7900390625, 1.935546875, 2.0810546875, 2.2265625, 2.3720703125, 2.517578125, 2.6630859375, 2.80859375, 2.9541015625, 3.099609375, 3.2451171875, 3.390625, 3.5361328125, 3.681640625, 3.8271484375, 3.97265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 9.0, 8.0, 10.0, 20.0, 29.0, 78.0, 142.0, 225.0, 223.0, 99.0, 60.0, 21.0, 15.0, 13.0, 10.0, 10.0, 3.0, 9.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.88671875, -4.757232666015625, -4.62774658203125, -4.498260498046875, -4.3687744140625, -4.239288330078125, -4.10980224609375, -3.980316162109375, -3.850830078125, -3.721343994140625, -3.59185791015625, -3.462371826171875, -3.3328857421875, -3.203399658203125, -3.07391357421875, -2.944427490234375, -2.81494140625, -2.685455322265625, -2.55596923828125, -2.426483154296875, -2.2969970703125, -2.167510986328125, -2.03802490234375, -1.908538818359375, -1.779052734375, -1.649566650390625, -1.52008056640625, -1.390594482421875, -1.2611083984375, -1.131622314453125, -1.00213623046875, -0.872650146484375, -0.7431640625, -0.613677978515625, -0.48419189453125, -0.354705810546875, -0.2252197265625, -0.095733642578125, 0.03375244140625, 0.163238525390625, 0.292724609375, 0.422210693359375, 0.55169677734375, 0.681182861328125, 0.8106689453125, 0.940155029296875, 1.06964111328125, 1.199127197265625, 1.32861328125, 1.458099365234375, 1.58758544921875, 1.717071533203125, 1.8465576171875, 1.976043701171875, 2.10552978515625, 2.235015869140625, 2.364501953125, 2.493988037109375, 2.62347412109375, 2.752960205078125, 2.8824462890625, 3.011932373046875, 3.14141845703125, 3.270904541015625, 3.400390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 19.0, 47.0, 176.0, 414.0, 244.0, 71.0, 24.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.41777038574219, -92.81172180175781, -89.2056655883789, -85.59961700439453, -81.99356842041016, -78.38751220703125, -74.78146362304688, -71.1754150390625, -67.56936645507812, -63.963314056396484, -60.35726547241211, -56.75121307373047, -53.145164489746094, -49.53911209106445, -45.93305969238281, -42.32701110839844, -38.7209587097168, -35.114906311035156, -31.50885772705078, -27.90280532836914, -24.296756744384766, -20.690704345703125, -17.084653854370117, -13.47860336303711, -9.872552871704102, -6.266502380371094, -2.6604514122009277, 0.9455995559692383, 4.551650047302246, 8.15770149230957, 11.763751983642578, 15.369802474975586, 18.975852966308594, 22.5819034576416, 26.18795394897461, 29.79400634765625, 33.400054931640625, 37.006107330322266, 40.612159729003906, 44.21820831298828, 47.824256896972656, 51.4303092956543, 55.03635787963867, 58.64241027832031, 62.24845886230469, 65.85450744628906, 69.46056365966797, 73.06661224365234, 76.67266845703125, 80.27871704101562, 83.88477325439453, 87.4908218383789, 91.09687042236328, 94.70292663574219, 98.30897521972656, 101.91502380371094, 105.52107238769531, 109.12712097167969, 112.7331771850586, 116.33922576904297, 119.94527435302734, 123.55133056640625, 127.15737915039062, 130.763427734375, 134.36947631835938]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 12.0, 6.0, 8.0, 10.0, 20.0, 10.0, 11.0, 19.0, 16.0, 16.0, 19.0, 20.0, 36.0, 33.0, 27.0, 38.0, 44.0, 40.0, 40.0, 42.0, 34.0, 38.0, 38.0, 47.0, 43.0, 37.0, 28.0, 31.0, 24.0, 18.0, 25.0, 26.0, 28.0, 14.0, 12.0, 12.0, 14.0, 17.0, 12.0, 3.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.675559997558594, -31.67898941040039, -30.682416915893555, -29.68584632873535, -28.689273834228516, -27.692703247070312, -26.69613265991211, -25.699560165405273, -24.702987670898438, -23.706417083740234, -22.7098445892334, -21.713274002075195, -20.71670150756836, -19.720130920410156, -18.723560333251953, -17.726987838745117, -16.730417251586914, -15.733845710754395, -14.737274169921875, -13.740703582763672, -12.744131088256836, -11.747560501098633, -10.750988960266113, -9.754417419433594, -8.757845878601074, -7.761274337768555, -6.764702796936035, -5.768131732940674, -4.771560192108154, -3.7749886512756348, -2.7784175872802734, -1.781846046447754, -0.7852725982666016, 0.21129882335662842, 1.2078702449798584, 2.204441547393799, 3.2010130882263184, 4.197584629058838, 5.194155693054199, 6.190727233886719, 7.187298774719238, 8.183870315551758, 9.180441856384277, 10.177013397216797, 11.173583984375, 12.170156478881836, 13.166727066040039, 14.163298606872559, 15.159870147705078, 16.15644073486328, 17.153013229370117, 18.14958381652832, 19.146156311035156, 20.14272689819336, 21.139297485351562, 22.1358699798584, 23.132442474365234, 24.129013061523438, 25.125585556030273, 26.122156143188477, 27.118728637695312, 28.115299224853516, 29.11186981201172, 30.108442306518555, 31.105012893676758]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 11.0, 12.0, 22.0, 23.0, 38.0, 56.0, 74.0, 105.0, 153.0, 185.0, 281.0, 455.0, 674.0, 1107.0, 1664.0, 2954.0, 5397.0, 11035.0, 25870.0, 84205.0, 1005973.0, 2885413.0, 110660.0, 31239.0, 12220.0, 5936.0, 3216.0, 1891.0, 1127.0, 686.0, 467.0, 321.0, 223.0, 157.0, 111.0, 80.0, 65.0, 53.0, 27.0, 23.0, 13.0, 11.0, 11.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.23046875, -5.0770263671875, -4.923583984375, -4.7701416015625, -4.61669921875, -4.4632568359375, -4.309814453125, -4.1563720703125, -4.0029296875, -3.8494873046875, -3.696044921875, -3.5426025390625, -3.38916015625, -3.2357177734375, -3.082275390625, -2.9288330078125, -2.775390625, -2.6219482421875, -2.468505859375, -2.3150634765625, -2.16162109375, -2.0081787109375, -1.854736328125, -1.7012939453125, -1.5478515625, -1.3944091796875, -1.240966796875, -1.0875244140625, -0.93408203125, -0.7806396484375, -0.627197265625, -0.4737548828125, -0.3203125, -0.1668701171875, -0.013427734375, 0.1400146484375, 0.29345703125, 0.4468994140625, 0.600341796875, 0.7537841796875, 0.9072265625, 1.0606689453125, 1.214111328125, 1.3675537109375, 1.52099609375, 1.6744384765625, 1.827880859375, 1.9813232421875, 2.134765625, 2.2882080078125, 2.441650390625, 2.5950927734375, 2.74853515625, 2.9019775390625, 3.055419921875, 3.2088623046875, 3.3623046875, 3.5157470703125, 3.669189453125, 3.8226318359375, 3.97607421875, 4.1295166015625, 4.282958984375, 4.4364013671875, 4.58984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 12.0, 15.0, 18.0, 22.0, 12.0, 22.0, 26.0, 33.0, 28.0, 38.0, 40.0, 39.0, 38.0, 46.0, 63.0, 38.0, 43.0, 49.0, 42.0, 38.0, 34.0, 42.0, 43.0, 44.0, 37.0, 27.0, 22.0, 16.0, 9.0, 17.0, 9.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.189453125, -2.12860107421875, -2.0677490234375, -2.00689697265625, -1.946044921875, -1.88519287109375, -1.8243408203125, -1.76348876953125, -1.70263671875, -1.64178466796875, -1.5809326171875, -1.52008056640625, -1.459228515625, -1.39837646484375, -1.3375244140625, -1.27667236328125, -1.2158203125, -1.15496826171875, -1.0941162109375, -1.03326416015625, -0.972412109375, -0.91156005859375, -0.8507080078125, -0.78985595703125, -0.72900390625, -0.66815185546875, -0.6072998046875, -0.54644775390625, -0.485595703125, -0.42474365234375, -0.3638916015625, -0.30303955078125, -0.2421875, -0.18133544921875, -0.1204833984375, -0.05963134765625, 0.001220703125, 0.06207275390625, 0.1229248046875, 0.18377685546875, 0.24462890625, 0.30548095703125, 0.3663330078125, 0.42718505859375, 0.488037109375, 0.54888916015625, 0.6097412109375, 0.67059326171875, 0.7314453125, 0.79229736328125, 0.8531494140625, 0.91400146484375, 0.974853515625, 1.03570556640625, 1.0965576171875, 1.15740966796875, 1.21826171875, 1.27911376953125, 1.3399658203125, 1.40081787109375, 1.461669921875, 1.52252197265625, 1.5833740234375, 1.64422607421875, 1.705078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 4.0, 21.0, 13.0, 13.0, 24.0, 29.0, 36.0, 60.0, 62.0, 84.0, 117.0, 152.0, 296.0, 554.0, 1205.0, 3173.0, 10906.0, 60579.0, 3178753.0, 888676.0, 37306.0, 7783.0, 2372.0, 926.0, 419.0, 232.0, 116.0, 77.0, 80.0, 48.0, 37.0, 37.0, 17.0, 19.0, 11.0, 13.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78515625, -6.56549072265625, -6.3458251953125, -6.12615966796875, -5.906494140625, -5.68682861328125, -5.4671630859375, -5.24749755859375, -5.02783203125, -4.80816650390625, -4.5885009765625, -4.36883544921875, -4.149169921875, -3.92950439453125, -3.7098388671875, -3.49017333984375, -3.2705078125, -3.05084228515625, -2.8311767578125, -2.61151123046875, -2.391845703125, -2.17218017578125, -1.9525146484375, -1.73284912109375, -1.51318359375, -1.29351806640625, -1.0738525390625, -0.85418701171875, -0.634521484375, -0.41485595703125, -0.1951904296875, 0.02447509765625, 0.244140625, 0.46380615234375, 0.6834716796875, 0.90313720703125, 1.122802734375, 1.34246826171875, 1.5621337890625, 1.78179931640625, 2.00146484375, 2.22113037109375, 2.4407958984375, 2.66046142578125, 2.880126953125, 3.09979248046875, 3.3194580078125, 3.53912353515625, 3.7587890625, 3.97845458984375, 4.1981201171875, 4.41778564453125, 4.637451171875, 4.85711669921875, 5.0767822265625, 5.29644775390625, 5.51611328125, 5.73577880859375, 5.9554443359375, 6.17510986328125, 6.394775390625, 6.61444091796875, 6.8341064453125, 7.05377197265625, 7.2734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 7.0, 10.0, 19.0, 27.0, 44.0, 88.0, 240.0, 1392.0, 1768.0, 282.0, 103.0, 33.0, 18.0, 17.0, 11.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.533447265625, -5.41064453125, -5.287841796875, -5.1650390625, -5.042236328125, -4.91943359375, -4.796630859375, -4.673828125, -4.551025390625, -4.42822265625, -4.305419921875, -4.1826171875, -4.059814453125, -3.93701171875, -3.814208984375, -3.69140625, -3.568603515625, -3.44580078125, -3.322998046875, -3.2001953125, -3.077392578125, -2.95458984375, -2.831787109375, -2.708984375, -2.586181640625, -2.46337890625, -2.340576171875, -2.2177734375, -2.094970703125, -1.97216796875, -1.849365234375, -1.7265625, -1.603759765625, -1.48095703125, -1.358154296875, -1.2353515625, -1.112548828125, -0.98974609375, -0.866943359375, -0.744140625, -0.621337890625, -0.49853515625, -0.375732421875, -0.2529296875, -0.130126953125, -0.00732421875, 0.115478515625, 0.23828125, 0.361083984375, 0.48388671875, 0.606689453125, 0.7294921875, 0.852294921875, 0.97509765625, 1.097900390625, 1.220703125, 1.343505859375, 1.46630859375, 1.589111328125, 1.7119140625, 1.834716796875, 1.95751953125, 2.080322265625, 2.203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 26.0, 33.0, 72.0, 118.0, 162.0, 186.0, 174.0, 123.0, 50.0, 17.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.00313377380371, -18.516788482666016, -18.03044319152832, -17.544097900390625, -17.057750701904297, -16.5714054107666, -16.085060119628906, -15.598714828491211, -15.1123685836792, -14.626023292541504, -14.139677047729492, -13.653331756591797, -13.166986465454102, -12.68064022064209, -12.194294929504395, -11.707948684692383, -11.221603393554688, -10.735258102416992, -10.24891185760498, -9.762566566467285, -9.27622127532959, -8.789875030517578, -8.303529739379883, -7.817183971405029, -7.330839157104492, -6.844493389129639, -6.358148097991943, -5.87180233001709, -5.385456562042236, -4.899110794067383, -4.4127655029296875, -3.926419734954834, -3.4400739669799805, -2.953728437423706, -2.4673826694488525, -1.9810371398925781, -1.4946914911270142, -1.0083458423614502, -0.5220003128051758, -0.035654544830322266, 0.45069098472595215, 0.9370366334915161, 1.42338228225708, 1.9097278118133545, 2.396073341369629, 2.8824191093444824, 3.368764638900757, 3.8551104068756104, 4.341455936431885, 4.827801704406738, 5.314146995544434, 5.800492763519287, 6.286838531494141, 6.773183822631836, 7.2595295906066895, 7.745875358581543, 8.232220649719238, 8.718565940856934, 9.204912185668945, 9.69125747680664, 10.177602767944336, 10.663949012756348, 11.150294303894043, 11.636640548706055, 12.12298583984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 14.0, 16.0, 21.0, 27.0, 23.0, 44.0, 70.0, 62.0, 58.0, 77.0, 72.0, 93.0, 78.0, 67.0, 60.0, 51.0, 47.0, 38.0, 26.0, 17.0, 14.0, 14.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.701298713684082, -8.281000137329102, -7.860701560974121, -7.440403461456299, -7.020104885101318, -6.599806308746338, -6.179508209228516, -5.759209632873535, -5.338911056518555, -4.918612480163574, -4.498313903808594, -4.0780158042907715, -3.657717227935791, -3.2374186515808105, -2.817120313644409, -2.396821975708008, -1.9765233993530273, -1.5562249422073364, -1.1359264850616455, -0.7156280279159546, -0.29532957077026367, 0.1249690055847168, 0.5452673435211182, 0.9655656814575195, 1.3858642578125, 1.806162714958191, 2.226461172103882, 2.646759510040283, 3.0670580863952637, 3.487356662750244, 3.9076550006866455, 4.327953338623047, 4.748252868652344, 5.168551445007324, 5.588850021362305, 6.009148120880127, 6.429446697235107, 6.849745273590088, 7.27004337310791, 7.690341949462891, 8.110640525817871, 8.530939102172852, 8.951237678527832, 9.371536254882812, 9.791833877563477, 10.212133407592773, 10.632431030273438, 11.052729606628418, 11.473028182983398, 11.893326759338379, 12.31362533569336, 12.73392391204834, 13.15422248840332, 13.574520111083984, 13.994818687438965, 14.415117263793945, 14.835415840148926, 15.255714416503906, 15.676012992858887, 16.096311569213867, 16.51660919189453, 16.936908721923828, 17.357206344604492, 17.777503967285156, 18.197803497314453]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 5.0, 14.0, 12.0, 23.0, 25.0, 35.0, 54.0, 74.0, 96.0, 148.0, 243.0, 512.0, 839.0, 1789.0, 3819.0, 8773.0, 23054.0, 65780.0, 212059.0, 477486.0, 166809.0, 53967.0, 18916.0, 7368.0, 3223.0, 1518.0, 777.0, 405.0, 253.0, 163.0, 100.0, 53.0, 42.0, 28.0, 20.0, 15.0, 13.0, 5.0, 10.0, 5.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0], "bins": [-6.72265625, -6.53277587890625, -6.3428955078125, -6.15301513671875, -5.963134765625, -5.77325439453125, -5.5833740234375, -5.39349365234375, -5.20361328125, -5.01373291015625, -4.8238525390625, -4.63397216796875, -4.444091796875, -4.25421142578125, -4.0643310546875, -3.87445068359375, -3.6845703125, -3.49468994140625, -3.3048095703125, -3.11492919921875, -2.925048828125, -2.73516845703125, -2.5452880859375, -2.35540771484375, -2.16552734375, -1.97564697265625, -1.7857666015625, -1.59588623046875, -1.406005859375, -1.21612548828125, -1.0262451171875, -0.83636474609375, -0.646484375, -0.45660400390625, -0.2667236328125, -0.07684326171875, 0.113037109375, 0.30291748046875, 0.4927978515625, 0.68267822265625, 0.87255859375, 1.06243896484375, 1.2523193359375, 1.44219970703125, 1.632080078125, 1.82196044921875, 2.0118408203125, 2.20172119140625, 2.3916015625, 2.58148193359375, 2.7713623046875, 2.96124267578125, 3.151123046875, 3.34100341796875, 3.5308837890625, 3.72076416015625, 3.91064453125, 4.10052490234375, 4.2904052734375, 4.48028564453125, 4.670166015625, 4.86004638671875, 5.0499267578125, 5.23980712890625, 5.4296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 11.0, 4.0, 7.0, 14.0, 14.0, 29.0, 23.0, 20.0, 22.0, 34.0, 37.0, 32.0, 39.0, 39.0, 55.0, 46.0, 50.0, 42.0, 55.0, 40.0, 34.0, 51.0, 58.0, 32.0, 36.0, 36.0, 30.0, 26.0, 11.0, 14.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.26953125, -2.2071685791015625, -2.144805908203125, -2.0824432373046875, -2.02008056640625, -1.9577178955078125, -1.895355224609375, -1.8329925537109375, -1.7706298828125, -1.7082672119140625, -1.645904541015625, -1.5835418701171875, -1.52117919921875, -1.4588165283203125, -1.396453857421875, -1.3340911865234375, -1.271728515625, -1.2093658447265625, -1.147003173828125, -1.0846405029296875, -1.02227783203125, -0.9599151611328125, -0.897552490234375, -0.8351898193359375, -0.7728271484375, -0.7104644775390625, -0.648101806640625, -0.5857391357421875, -0.52337646484375, -0.4610137939453125, -0.398651123046875, -0.3362884521484375, -0.27392578125, -0.2115631103515625, -0.149200439453125, -0.0868377685546875, -0.02447509765625, 0.0378875732421875, 0.100250244140625, 0.1626129150390625, 0.2249755859375, 0.2873382568359375, 0.349700927734375, 0.4120635986328125, 0.47442626953125, 0.5367889404296875, 0.599151611328125, 0.6615142822265625, 0.723876953125, 0.7862396240234375, 0.848602294921875, 0.9109649658203125, 0.97332763671875, 1.0356903076171875, 1.098052978515625, 1.1604156494140625, 1.2227783203125, 1.2851409912109375, 1.347503662109375, 1.4098663330078125, 1.47222900390625, 1.5345916748046875, 1.596954345703125, 1.6593170166015625, 1.7216796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 1.0, 10.0, 5.0, 11.0, 15.0, 9.0, 22.0, 35.0, 38.0, 60.0, 72.0, 102.0, 166.0, 271.0, 516.0, 947.0, 2092.0, 5184.0, 13959.0, 49028.0, 251805.0, 577667.0, 105638.0, 26047.0, 8331.0, 3254.0, 1511.0, 705.0, 361.0, 229.0, 115.0, 102.0, 51.0, 56.0, 26.0, 19.0, 19.0, 19.0, 8.0, 10.0, 8.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.68359375, -7.4716796875, -7.259765625, -7.0478515625, -6.8359375, -6.6240234375, -6.412109375, -6.2001953125, -5.98828125, -5.7763671875, -5.564453125, -5.3525390625, -5.140625, -4.9287109375, -4.716796875, -4.5048828125, -4.29296875, -4.0810546875, -3.869140625, -3.6572265625, -3.4453125, -3.2333984375, -3.021484375, -2.8095703125, -2.59765625, -2.3857421875, -2.173828125, -1.9619140625, -1.75, -1.5380859375, -1.326171875, -1.1142578125, -0.90234375, -0.6904296875, -0.478515625, -0.2666015625, -0.0546875, 0.1572265625, 0.369140625, 0.5810546875, 0.79296875, 1.0048828125, 1.216796875, 1.4287109375, 1.640625, 1.8525390625, 2.064453125, 2.2763671875, 2.48828125, 2.7001953125, 2.912109375, 3.1240234375, 3.3359375, 3.5478515625, 3.759765625, 3.9716796875, 4.18359375, 4.3955078125, 4.607421875, 4.8193359375, 5.03125, 5.2431640625, 5.455078125, 5.6669921875, 5.87890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 1.0, 6.0, 2.0, 10.0, 10.0, 12.0, 10.0, 15.0, 16.0, 19.0, 30.0, 24.0, 35.0, 41.0, 53.0, 55.0, 42.0, 60.0, 49.0, 44.0, 66.0, 53.0, 68.0, 53.0, 46.0, 39.0, 28.0, 20.0, 16.0, 13.0, 12.0, 12.0, 7.0, 8.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.484375, -10.20281982421875, -9.9212646484375, -9.63970947265625, -9.358154296875, -9.07659912109375, -8.7950439453125, -8.51348876953125, -8.23193359375, -7.95037841796875, -7.6688232421875, -7.38726806640625, -7.105712890625, -6.82415771484375, -6.5426025390625, -6.26104736328125, -5.9794921875, -5.69793701171875, -5.4163818359375, -5.13482666015625, -4.853271484375, -4.57171630859375, -4.2901611328125, -4.00860595703125, -3.72705078125, -3.44549560546875, -3.1639404296875, -2.88238525390625, -2.600830078125, -2.31927490234375, -2.0377197265625, -1.75616455078125, -1.474609375, -1.19305419921875, -0.9114990234375, -0.62994384765625, -0.348388671875, -0.06683349609375, 0.2147216796875, 0.49627685546875, 0.77783203125, 1.05938720703125, 1.3409423828125, 1.62249755859375, 1.904052734375, 2.18560791015625, 2.4671630859375, 2.74871826171875, 3.0302734375, 3.31182861328125, 3.5933837890625, 3.87493896484375, 4.156494140625, 4.43804931640625, 4.7196044921875, 5.00115966796875, 5.28271484375, 5.56427001953125, 5.8458251953125, 6.12738037109375, 6.408935546875, 6.69049072265625, 6.9720458984375, 7.25360107421875, 7.53515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 7.0, 5.0, 8.0, 22.0, 25.0, 48.0, 89.0, 174.0, 425.0, 1340.0, 5695.0, 27496.0, 204932.0, 730752.0, 61719.0, 12068.0, 2464.0, 749.0, 263.0, 134.0, 63.0, 20.0, 16.0, 17.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.79718017578125, -2.7076416015625, -2.61810302734375, -2.528564453125, -2.43902587890625, -2.3494873046875, -2.25994873046875, -2.17041015625, -2.08087158203125, -1.9913330078125, -1.90179443359375, -1.812255859375, -1.72271728515625, -1.6331787109375, -1.54364013671875, -1.4541015625, -1.36456298828125, -1.2750244140625, -1.18548583984375, -1.095947265625, -1.00640869140625, -0.9168701171875, -0.82733154296875, -0.73779296875, -0.64825439453125, -0.5587158203125, -0.46917724609375, -0.379638671875, -0.29010009765625, -0.2005615234375, -0.11102294921875, -0.021484375, 0.06805419921875, 0.1575927734375, 0.24713134765625, 0.336669921875, 0.42620849609375, 0.5157470703125, 0.60528564453125, 0.69482421875, 0.78436279296875, 0.8739013671875, 0.96343994140625, 1.052978515625, 1.14251708984375, 1.2320556640625, 1.32159423828125, 1.4111328125, 1.50067138671875, 1.5902099609375, 1.67974853515625, 1.769287109375, 1.85882568359375, 1.9483642578125, 2.03790283203125, 2.12744140625, 2.21697998046875, 2.3065185546875, 2.39605712890625, 2.485595703125, 2.57513427734375, 2.6646728515625, 2.75421142578125, 2.84375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 13.0, 12.0, 13.0, 11.0, 19.0, 21.0, 37.0, 95.0, 185.0, 244.0, 141.0, 60.0, 35.0, 22.0, 15.0, 9.0, 6.0, 13.0, 6.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.0006427764892578125, -0.000628247857093811, -0.0006137192249298096, -0.0005991905927658081, -0.0005846619606018066, -0.0005701333284378052, -0.0005556046962738037, -0.0005410760641098022, -0.0005265474319458008, -0.0005120187997817993, -0.0004974901676177979, -0.0004829615354537964, -0.0004684329032897949, -0.00045390427112579346, -0.000439375638961792, -0.00042484700679779053, -0.00041031837463378906, -0.0003957897424697876, -0.00038126111030578613, -0.00036673247814178467, -0.0003522038459777832, -0.00033767521381378174, -0.0003231465816497803, -0.0003086179494857788, -0.00029408931732177734, -0.0002795606851577759, -0.0002650320529937744, -0.00025050342082977295, -0.00023597478866577148, -0.00022144615650177002, -0.00020691752433776855, -0.0001923888921737671, -0.00017786026000976562, -0.00016333162784576416, -0.0001488029956817627, -0.00013427436351776123, -0.00011974573135375977, -0.0001052170991897583, -9.068846702575684e-05, -7.615983486175537e-05, -6.16312026977539e-05, -4.710257053375244e-05, -3.2573938369750977e-05, -1.8045306205749512e-05, -3.516674041748047e-06, 1.1011958122253418e-05, 2.5540590286254883e-05, 4.006922245025635e-05, 5.459785461425781e-05, 6.912648677825928e-05, 8.365511894226074e-05, 9.818375110626221e-05, 0.00011271238327026367, 0.00012724101543426514, 0.0001417696475982666, 0.00015629827976226807, 0.00017082691192626953, 0.000185355544090271, 0.00019988417625427246, 0.00021441280841827393, 0.0002289414405822754, 0.00024347007274627686, 0.0002579987049102783, 0.0002725273370742798, 0.00028705596923828125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 12.0, 9.0, 26.0, 34.0, 65.0, 119.0, 255.0, 573.0, 1827.0, 8741.0, 60894.0, 833741.0, 123495.0, 14601.0, 2755.0, 791.0, 310.0, 124.0, 75.0, 43.0, 28.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.906036376953125, -3.79644775390625, -3.686859130859375, -3.5772705078125, -3.467681884765625, -3.35809326171875, -3.248504638671875, -3.138916015625, -3.029327392578125, -2.91973876953125, -2.810150146484375, -2.7005615234375, -2.590972900390625, -2.48138427734375, -2.371795654296875, -2.26220703125, -2.152618408203125, -2.04302978515625, -1.933441162109375, -1.8238525390625, -1.714263916015625, -1.60467529296875, -1.495086669921875, -1.385498046875, -1.275909423828125, -1.16632080078125, -1.056732177734375, -0.9471435546875, -0.837554931640625, -0.72796630859375, -0.618377685546875, -0.5087890625, -0.399200439453125, -0.28961181640625, -0.180023193359375, -0.0704345703125, 0.039154052734375, 0.14874267578125, 0.258331298828125, 0.367919921875, 0.477508544921875, 0.58709716796875, 0.696685791015625, 0.8062744140625, 0.915863037109375, 1.02545166015625, 1.135040283203125, 1.24462890625, 1.354217529296875, 1.46380615234375, 1.573394775390625, 1.6829833984375, 1.792572021484375, 1.90216064453125, 2.011749267578125, 2.121337890625, 2.230926513671875, 2.34051513671875, 2.450103759765625, 2.5596923828125, 2.669281005859375, 2.77886962890625, 2.888458251953125, 2.998046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 11.0, 6.0, 11.0, 16.0, 22.0, 37.0, 53.0, 100.0, 154.0, 208.0, 134.0, 94.0, 49.0, 37.0, 18.0, 20.0, 10.0, 9.0, 4.0, 5.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.306640625, -2.208221435546875, -2.10980224609375, -2.011383056640625, -1.9129638671875, -1.814544677734375, -1.71612548828125, -1.617706298828125, -1.519287109375, -1.420867919921875, -1.32244873046875, -1.224029541015625, -1.1256103515625, -1.027191162109375, -0.92877197265625, -0.830352783203125, -0.73193359375, -0.633514404296875, -0.53509521484375, -0.436676025390625, -0.3382568359375, -0.239837646484375, -0.14141845703125, -0.042999267578125, 0.055419921875, 0.153839111328125, 0.25225830078125, 0.350677490234375, 0.4490966796875, 0.547515869140625, 0.64593505859375, 0.744354248046875, 0.8427734375, 0.941192626953125, 1.03961181640625, 1.138031005859375, 1.2364501953125, 1.334869384765625, 1.43328857421875, 1.531707763671875, 1.630126953125, 1.728546142578125, 1.82696533203125, 1.925384521484375, 2.0238037109375, 2.122222900390625, 2.22064208984375, 2.319061279296875, 2.41748046875, 2.515899658203125, 2.61431884765625, 2.712738037109375, 2.8111572265625, 2.909576416015625, 3.00799560546875, 3.106414794921875, 3.204833984375, 3.303253173828125, 3.40167236328125, 3.500091552734375, 3.5985107421875, 3.696929931640625, 3.79534912109375, 3.893768310546875, 3.9921875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 8.0, 19.0, 26.0, 64.0, 117.0, 184.0, 208.0, 176.0, 105.0, 40.0, 27.0, 15.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-79.7020263671875, -78.09283447265625, -76.48363494873047, -74.87444305419922, -73.26524353027344, -71.65605163574219, -70.0468521118164, -68.43766021728516, -66.82846069335938, -65.21926879882812, -63.610069274902344, -62.00087356567383, -60.39167785644531, -58.78248596191406, -57.17329025268555, -55.56409454345703, -53.95490264892578, -52.345706939697266, -50.73651123046875, -49.127315521240234, -47.51811981201172, -45.90892791748047, -44.29973220825195, -42.69053649902344, -41.08134078979492, -39.472145080566406, -37.86294937133789, -36.253753662109375, -34.644561767578125, -33.035362243652344, -31.426170349121094, -29.816974639892578, -28.207782745361328, -26.598587036132812, -24.989391326904297, -23.380197525024414, -21.7710018157959, -20.161806106567383, -18.5526123046875, -16.943416595458984, -15.334220886230469, -13.725025177001953, -12.115830421447754, -10.506635665893555, -8.897439956665039, -7.288244247436523, -5.679049491882324, -4.069854736328125, -2.4606590270996094, -0.851463794708252, 0.7577314376831055, 2.366926670074463, 3.9761219024658203, 5.585317611694336, 7.194512367248535, 8.803707122802734, 10.41290283203125, 12.022098541259766, 13.631293296813965, 15.240488052368164, 16.84968376159668, 18.458879470825195, 20.068073272705078, 21.677268981933594, 23.28646469116211]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 10.0, 15.0, 20.0, 15.0, 13.0, 22.0, 15.0, 21.0, 24.0, 22.0, 34.0, 34.0, 27.0, 31.0, 44.0, 35.0, 30.0, 34.0, 47.0, 39.0, 47.0, 28.0, 35.0, 39.0, 26.0, 26.0, 27.0, 35.0, 18.0, 24.0, 20.0, 13.0, 18.0, 20.0, 9.0, 19.0, 6.0, 9.0, 7.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.196887969970703, -26.303001403808594, -25.40911293029785, -24.51522445678711, -23.621337890625, -22.72745132446289, -21.83356285095215, -20.939674377441406, -20.045787811279297, -19.151901245117188, -18.258012771606445, -17.364124298095703, -16.470237731933594, -15.576350212097168, -14.682462692260742, -13.788575172424316, -12.89468765258789, -12.000800132751465, -11.106912612915039, -10.213025093078613, -9.319137573242188, -8.425250053405762, -7.531362533569336, -6.63747501373291, -5.743587493896484, -4.849699974060059, -3.955812454223633, -3.061924934387207, -2.1680374145507812, -1.2741498947143555, -0.3802623748779297, 0.5136251449584961, 1.4075145721435547, 2.3014020919799805, 3.1952896118164062, 4.089177131652832, 4.983064651489258, 5.876952171325684, 6.770839691162109, 7.664727210998535, 8.558614730834961, 9.452502250671387, 10.346389770507812, 11.240277290344238, 12.134164810180664, 13.02805233001709, 13.921939849853516, 14.815827369689941, 15.709714889526367, 16.60360336303711, 17.49748992919922, 18.391376495361328, 19.28526496887207, 20.179153442382812, 21.073040008544922, 21.96692657470703, 22.860815048217773, 23.754703521728516, 24.648590087890625, 25.542476654052734, 26.436365127563477, 27.33025360107422, 28.224140167236328, 29.118026733398438, 30.01191520690918]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 20.0, 23.0, 33.0, 45.0, 84.0, 90.0, 162.0, 278.0, 371.0, 527.0, 819.0, 1337.0, 2088.0, 3476.0, 6307.0, 12851.0, 33502.0, 165526.0, 3618411.0, 272041.0, 43625.0, 15456.0, 7026.0, 3878.0, 2223.0, 1406.0, 888.0, 564.0, 373.0, 225.0, 182.0, 126.0, 83.0, 67.0, 44.0, 35.0, 14.0, 14.0, 13.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.26171875, -7.0577392578125, -6.853759765625, -6.6497802734375, -6.44580078125, -6.2418212890625, -6.037841796875, -5.8338623046875, -5.6298828125, -5.4259033203125, -5.221923828125, -5.0179443359375, -4.81396484375, -4.6099853515625, -4.406005859375, -4.2020263671875, -3.998046875, -3.7940673828125, -3.590087890625, -3.3861083984375, -3.18212890625, -2.9781494140625, -2.774169921875, -2.5701904296875, -2.3662109375, -2.1622314453125, -1.958251953125, -1.7542724609375, -1.55029296875, -1.3463134765625, -1.142333984375, -0.9383544921875, -0.734375, -0.5303955078125, -0.326416015625, -0.1224365234375, 0.08154296875, 0.2855224609375, 0.489501953125, 0.6934814453125, 0.8974609375, 1.1014404296875, 1.305419921875, 1.5093994140625, 1.71337890625, 1.9173583984375, 2.121337890625, 2.3253173828125, 2.529296875, 2.7332763671875, 2.937255859375, 3.1412353515625, 3.34521484375, 3.5491943359375, 3.753173828125, 3.9571533203125, 4.1611328125, 4.3651123046875, 4.569091796875, 4.7730712890625, 4.97705078125, 5.1810302734375, 5.385009765625, 5.5889892578125, 5.79296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 10.0, 8.0, 9.0, 12.0, 10.0, 11.0, 19.0, 21.0, 16.0, 24.0, 38.0, 33.0, 27.0, 30.0, 44.0, 47.0, 44.0, 40.0, 58.0, 42.0, 51.0, 43.0, 36.0, 44.0, 33.0, 37.0, 51.0, 29.0, 27.0, 22.0, 14.0, 16.0, 16.0, 8.0, 12.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.380859375, -2.3166656494140625, -2.252471923828125, -2.1882781982421875, -2.12408447265625, -2.0598907470703125, -1.995697021484375, -1.9315032958984375, -1.8673095703125, -1.8031158447265625, -1.738922119140625, -1.6747283935546875, -1.61053466796875, -1.5463409423828125, -1.482147216796875, -1.4179534912109375, -1.353759765625, -1.2895660400390625, -1.225372314453125, -1.1611785888671875, -1.09698486328125, -1.0327911376953125, -0.968597412109375, -0.9044036865234375, -0.8402099609375, -0.7760162353515625, -0.711822509765625, -0.6476287841796875, -0.58343505859375, -0.5192413330078125, -0.455047607421875, -0.3908538818359375, -0.32666015625, -0.2624664306640625, -0.198272705078125, -0.1340789794921875, -0.06988525390625, -0.0056915283203125, 0.058502197265625, 0.1226959228515625, 0.1868896484375, 0.2510833740234375, 0.315277099609375, 0.3794708251953125, 0.44366455078125, 0.5078582763671875, 0.572052001953125, 0.6362457275390625, 0.700439453125, 0.7646331787109375, 0.828826904296875, 0.8930206298828125, 0.95721435546875, 1.0214080810546875, 1.085601806640625, 1.1497955322265625, 1.2139892578125, 1.2781829833984375, 1.342376708984375, 1.4065704345703125, 1.47076416015625, 1.5349578857421875, 1.599151611328125, 1.6633453369140625, 1.7275390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 9.0, 13.0, 13.0, 22.0, 28.0, 40.0, 76.0, 118.0, 159.0, 254.0, 396.0, 589.0, 1005.0, 1837.0, 3352.0, 7085.0, 16662.0, 51572.0, 308890.0, 3479182.0, 248458.0, 45536.0, 15082.0, 6413.0, 3158.0, 1745.0, 946.0, 584.0, 356.0, 249.0, 158.0, 97.0, 60.0, 37.0, 29.0, 22.0, 10.0, 14.0, 11.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18023681640625, -5.0206298828125, -4.86102294921875, -4.701416015625, -4.54180908203125, -4.3822021484375, -4.22259521484375, -4.06298828125, -3.90338134765625, -3.7437744140625, -3.58416748046875, -3.424560546875, -3.26495361328125, -3.1053466796875, -2.94573974609375, -2.7861328125, -2.62652587890625, -2.4669189453125, -2.30731201171875, -2.147705078125, -1.98809814453125, -1.8284912109375, -1.66888427734375, -1.50927734375, -1.34967041015625, -1.1900634765625, -1.03045654296875, -0.870849609375, -0.71124267578125, -0.5516357421875, -0.39202880859375, -0.232421875, -0.07281494140625, 0.0867919921875, 0.24639892578125, 0.406005859375, 0.56561279296875, 0.7252197265625, 0.88482666015625, 1.04443359375, 1.20404052734375, 1.3636474609375, 1.52325439453125, 1.682861328125, 1.84246826171875, 2.0020751953125, 2.16168212890625, 2.3212890625, 2.48089599609375, 2.6405029296875, 2.80010986328125, 2.959716796875, 3.11932373046875, 3.2789306640625, 3.43853759765625, 3.59814453125, 3.75775146484375, 3.9173583984375, 4.07696533203125, 4.236572265625, 4.39617919921875, 4.5557861328125, 4.71539306640625, 4.875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 12.0, 12.0, 15.0, 12.0, 33.0, 36.0, 82.0, 196.0, 680.0, 2326.0, 391.0, 101.0, 63.0, 34.0, 13.0, 16.0, 2.0, 11.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.99609375, -3.8797607421875, -3.763427734375, -3.6470947265625, -3.53076171875, -3.4144287109375, -3.298095703125, -3.1817626953125, -3.0654296875, -2.9490966796875, -2.832763671875, -2.7164306640625, -2.60009765625, -2.4837646484375, -2.367431640625, -2.2510986328125, -2.134765625, -2.0184326171875, -1.902099609375, -1.7857666015625, -1.66943359375, -1.5531005859375, -1.436767578125, -1.3204345703125, -1.2041015625, -1.0877685546875, -0.971435546875, -0.8551025390625, -0.73876953125, -0.6224365234375, -0.506103515625, -0.3897705078125, -0.2734375, -0.1571044921875, -0.040771484375, 0.0755615234375, 0.19189453125, 0.3082275390625, 0.424560546875, 0.5408935546875, 0.6572265625, 0.7735595703125, 0.889892578125, 1.0062255859375, 1.12255859375, 1.2388916015625, 1.355224609375, 1.4715576171875, 1.587890625, 1.7042236328125, 1.820556640625, 1.9368896484375, 2.05322265625, 2.1695556640625, 2.285888671875, 2.4022216796875, 2.5185546875, 2.6348876953125, 2.751220703125, 2.8675537109375, 2.98388671875, 3.1002197265625, 3.216552734375, 3.3328857421875, 3.44921875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 16.0, 27.0, 51.0, 69.0, 99.0, 130.0, 160.0, 143.0, 115.0, 61.0, 48.0, 30.0, 18.0, 6.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.109806060791016, -16.68512725830078, -16.26045036315918, -15.835771560668945, -15.411092758178711, -14.986414909362793, -14.561737060546875, -14.13705825805664, -13.712380409240723, -13.287702560424805, -12.86302375793457, -12.438345909118652, -12.013668060302734, -11.5889892578125, -11.164311408996582, -10.739633560180664, -10.31495475769043, -9.890276908874512, -9.465598106384277, -9.04092025756836, -8.616241455078125, -8.191563606262207, -7.766885757446289, -7.342207431793213, -6.917529106140137, -6.4928507804870605, -6.068172454833984, -5.643494606018066, -5.21881628036499, -4.794137954711914, -4.369460105895996, -3.94478178024292, -3.5201025009155273, -3.095424175262451, -2.670746088027954, -2.246068000793457, -1.8213896751403809, -1.3967113494873047, -0.9720332622528076, -0.5473551750183105, -0.12267684936523438, 0.30200135707855225, 0.7266795635223389, 1.1513577699661255, 1.576035976409912, 2.0007143020629883, 2.4253923892974854, 2.8500704765319824, 3.2747488021850586, 3.6994271278381348, 4.124105453491211, 4.548783302307129, 4.973461627960205, 5.398139953613281, 5.822817802429199, 6.247496128082275, 6.672174453735352, 7.096852779388428, 7.521531105041504, 7.946208953857422, 8.370887756347656, 8.795565605163574, 9.220243453979492, 9.644922256469727, 10.069600105285645]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 4.0, 9.0, 15.0, 11.0, 24.0, 20.0, 31.0, 24.0, 42.0, 38.0, 33.0, 47.0, 47.0, 53.0, 53.0, 43.0, 55.0, 40.0, 52.0, 52.0, 40.0, 44.0, 30.0, 34.0, 25.0, 28.0, 24.0, 9.0, 18.0, 11.0, 4.0, 8.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.83294153213501, -7.537915229797363, -7.242889404296875, -6.9478631019592285, -6.652836799621582, -6.357810974121094, -6.062784671783447, -5.767758369445801, -5.4727325439453125, -5.177706241607666, -4.882680416107178, -4.587654113769531, -4.292627811431885, -3.9976017475128174, -3.70257568359375, -3.4075493812561035, -3.112523078918457, -2.8174970149993896, -2.522470712661743, -2.227444648742676, -1.9324184656143188, -1.637392282485962, -1.3423662185668945, -1.047339916229248, -0.7523138523101807, -0.4572876989841461, -0.16226154565811157, 0.13276457786560059, 0.4277907609939575, 0.7228169441223145, 1.0178430080413818, 1.3128693103790283, 1.607895851135254, 1.9029220342636108, 2.1979482173919678, 2.492974281311035, 2.7880005836486816, 3.083026647567749, 3.3780527114868164, 3.673079013824463, 3.9681050777435303, 4.263131141662598, 4.558157444000244, 4.853183746337891, 5.148209571838379, 5.443235874176025, 5.738262176513672, 6.03328800201416, 6.328314304351807, 6.623340606689453, 6.918366432189941, 7.213392734527588, 7.508419036865234, 7.803444862365723, 8.098470687866211, 8.393497467041016, 8.688523292541504, 8.983549118041992, 9.278575897216797, 9.573601722717285, 9.868627548217773, 10.163654327392578, 10.458680152893066, 10.753705978393555, 11.04873275756836]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 4.0, 8.0, 12.0, 10.0, 28.0, 29.0, 36.0, 45.0, 63.0, 104.0, 163.0, 227.0, 371.0, 635.0, 1040.0, 1741.0, 3168.0, 6579.0, 13621.0, 29573.0, 69949.0, 170603.0, 357143.0, 226384.0, 93291.0, 38757.0, 17164.0, 8330.0, 4135.0, 2099.0, 1232.0, 737.0, 426.0, 265.0, 165.0, 120.0, 86.0, 61.0, 50.0, 29.0, 19.0, 21.0, 14.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.42578125, -4.2713623046875, -4.116943359375, -3.9625244140625, -3.80810546875, -3.6536865234375, -3.499267578125, -3.3448486328125, -3.1904296875, -3.0360107421875, -2.881591796875, -2.7271728515625, -2.57275390625, -2.4183349609375, -2.263916015625, -2.1094970703125, -1.955078125, -1.8006591796875, -1.646240234375, -1.4918212890625, -1.33740234375, -1.1829833984375, -1.028564453125, -0.8741455078125, -0.7197265625, -0.5653076171875, -0.410888671875, -0.2564697265625, -0.10205078125, 0.0523681640625, 0.206787109375, 0.3612060546875, 0.515625, 0.6700439453125, 0.824462890625, 0.9788818359375, 1.13330078125, 1.2877197265625, 1.442138671875, 1.5965576171875, 1.7509765625, 1.9053955078125, 2.059814453125, 2.2142333984375, 2.36865234375, 2.5230712890625, 2.677490234375, 2.8319091796875, 2.986328125, 3.1407470703125, 3.295166015625, 3.4495849609375, 3.60400390625, 3.7584228515625, 3.912841796875, 4.0672607421875, 4.2216796875, 4.3760986328125, 4.530517578125, 4.6849365234375, 4.83935546875, 4.9937744140625, 5.148193359375, 5.3026123046875, 5.45703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 8.0, 12.0, 15.0, 11.0, 16.0, 23.0, 22.0, 28.0, 34.0, 31.0, 38.0, 38.0, 26.0, 52.0, 51.0, 47.0, 45.0, 63.0, 43.0, 47.0, 49.0, 32.0, 29.0, 35.0, 30.0, 26.0, 26.0, 16.0, 20.0, 12.0, 16.0, 9.0, 9.0, 8.0, 5.0, 3.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.30078125, -2.237640380859375, -2.17449951171875, -2.111358642578125, -2.0482177734375, -1.985076904296875, -1.92193603515625, -1.858795166015625, -1.795654296875, -1.732513427734375, -1.66937255859375, -1.606231689453125, -1.5430908203125, -1.479949951171875, -1.41680908203125, -1.353668212890625, -1.29052734375, -1.227386474609375, -1.16424560546875, -1.101104736328125, -1.0379638671875, -0.974822998046875, -0.91168212890625, -0.848541259765625, -0.785400390625, -0.722259521484375, -0.65911865234375, -0.595977783203125, -0.5328369140625, -0.469696044921875, -0.40655517578125, -0.343414306640625, -0.2802734375, -0.217132568359375, -0.15399169921875, -0.090850830078125, -0.0277099609375, 0.035430908203125, 0.09857177734375, 0.161712646484375, 0.224853515625, 0.287994384765625, 0.35113525390625, 0.414276123046875, 0.4774169921875, 0.540557861328125, 0.60369873046875, 0.666839599609375, 0.72998046875, 0.793121337890625, 0.85626220703125, 0.919403076171875, 0.9825439453125, 1.045684814453125, 1.10882568359375, 1.171966552734375, 1.235107421875, 1.298248291015625, 1.36138916015625, 1.424530029296875, 1.4876708984375, 1.550811767578125, 1.61395263671875, 1.677093505859375, 1.740234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 16.0, 10.0, 18.0, 23.0, 37.0, 51.0, 70.0, 108.0, 183.0, 318.0, 521.0, 1112.0, 3065.0, 13098.0, 109272.0, 738631.0, 158459.0, 17213.0, 3624.0, 1274.0, 562.0, 317.0, 190.0, 106.0, 76.0, 53.0, 44.0, 24.0, 17.0, 10.0, 4.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.4453125, -9.102783203125, -8.76025390625, -8.417724609375, -8.0751953125, -7.732666015625, -7.39013671875, -7.047607421875, -6.705078125, -6.362548828125, -6.02001953125, -5.677490234375, -5.3349609375, -4.992431640625, -4.64990234375, -4.307373046875, -3.96484375, -3.622314453125, -3.27978515625, -2.937255859375, -2.5947265625, -2.252197265625, -1.90966796875, -1.567138671875, -1.224609375, -0.882080078125, -0.53955078125, -0.197021484375, 0.1455078125, 0.488037109375, 0.83056640625, 1.173095703125, 1.515625, 1.858154296875, 2.20068359375, 2.543212890625, 2.8857421875, 3.228271484375, 3.57080078125, 3.913330078125, 4.255859375, 4.598388671875, 4.94091796875, 5.283447265625, 5.6259765625, 5.968505859375, 6.31103515625, 6.653564453125, 6.99609375, 7.338623046875, 7.68115234375, 8.023681640625, 8.3662109375, 8.708740234375, 9.05126953125, 9.393798828125, 9.736328125, 10.078857421875, 10.42138671875, 10.763916015625, 11.1064453125, 11.448974609375, 11.79150390625, 12.134033203125, 12.4765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 4.0, 14.0, 11.0, 12.0, 24.0, 31.0, 22.0, 34.0, 42.0, 64.0, 46.0, 55.0, 56.0, 51.0, 76.0, 61.0, 60.0, 55.0, 47.0, 31.0, 31.0, 32.0, 24.0, 24.0, 20.0, 15.0, 8.0, 12.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0], "bins": [-15.8125, -15.439208984375, -15.06591796875, -14.692626953125, -14.3193359375, -13.946044921875, -13.57275390625, -13.199462890625, -12.826171875, -12.452880859375, -12.07958984375, -11.706298828125, -11.3330078125, -10.959716796875, -10.58642578125, -10.213134765625, -9.83984375, -9.466552734375, -9.09326171875, -8.719970703125, -8.3466796875, -7.973388671875, -7.60009765625, -7.226806640625, -6.853515625, -6.480224609375, -6.10693359375, -5.733642578125, -5.3603515625, -4.987060546875, -4.61376953125, -4.240478515625, -3.8671875, -3.493896484375, -3.12060546875, -2.747314453125, -2.3740234375, -2.000732421875, -1.62744140625, -1.254150390625, -0.880859375, -0.507568359375, -0.13427734375, 0.239013671875, 0.6123046875, 0.985595703125, 1.35888671875, 1.732177734375, 2.10546875, 2.478759765625, 2.85205078125, 3.225341796875, 3.5986328125, 3.971923828125, 4.34521484375, 4.718505859375, 5.091796875, 5.465087890625, 5.83837890625, 6.211669921875, 6.5849609375, 6.958251953125, 7.33154296875, 7.704833984375, 8.078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 15.0, 27.0, 36.0, 44.0, 94.0, 146.0, 319.0, 595.0, 1862.0, 8993.0, 97841.0, 810311.0, 114870.0, 10082.0, 1950.0, 637.0, 318.0, 150.0, 89.0, 53.0, 42.0, 29.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.23828125, -5.0721435546875, -4.906005859375, -4.7398681640625, -4.57373046875, -4.4075927734375, -4.241455078125, -4.0753173828125, -3.9091796875, -3.7430419921875, -3.576904296875, -3.4107666015625, -3.24462890625, -3.0784912109375, -2.912353515625, -2.7462158203125, -2.580078125, -2.4139404296875, -2.247802734375, -2.0816650390625, -1.91552734375, -1.7493896484375, -1.583251953125, -1.4171142578125, -1.2509765625, -1.0848388671875, -0.918701171875, -0.7525634765625, -0.58642578125, -0.4202880859375, -0.254150390625, -0.0880126953125, 0.078125, 0.2442626953125, 0.410400390625, 0.5765380859375, 0.74267578125, 0.9088134765625, 1.074951171875, 1.2410888671875, 1.4072265625, 1.5733642578125, 1.739501953125, 1.9056396484375, 2.07177734375, 2.2379150390625, 2.404052734375, 2.5701904296875, 2.736328125, 2.9024658203125, 3.068603515625, 3.2347412109375, 3.40087890625, 3.5670166015625, 3.733154296875, 3.8992919921875, 4.0654296875, 4.2315673828125, 4.397705078125, 4.5638427734375, 4.72998046875, 4.8961181640625, 5.062255859375, 5.2283935546875, 5.39453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 7.0, 16.0, 12.0, 22.0, 20.0, 36.0, 28.0, 32.0, 38.0, 52.0, 99.0, 205.0, 93.0, 56.0, 46.0, 43.0, 38.0, 38.0, 24.0, 10.0, 17.0, 15.0, 11.0, 6.0, 4.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0005006790161132812, -0.0004853159189224243, -0.0004699528217315674, -0.00045458972454071045, -0.0004392266273498535, -0.0004238635301589966, -0.00040850043296813965, -0.0003931373357772827, -0.0003777742385864258, -0.00036241114139556885, -0.0003470480442047119, -0.000331684947013855, -0.00031632184982299805, -0.0003009587526321411, -0.0002855956554412842, -0.00027023255825042725, -0.0002548694610595703, -0.00023950636386871338, -0.00022414326667785645, -0.0002087801694869995, -0.00019341707229614258, -0.00017805397510528564, -0.0001626908779144287, -0.00014732778072357178, -0.00013196468353271484, -0.00011660158634185791, -0.00010123848915100098, -8.587539196014404e-05, -7.051229476928711e-05, -5.5149197578430176e-05, -3.978610038757324e-05, -2.442300319671631e-05, -9.059906005859375e-06, 6.303191184997559e-06, 2.1666288375854492e-05, 3.7029385566711426e-05, 5.239248275756836e-05, 6.775557994842529e-05, 8.311867713928223e-05, 9.848177433013916e-05, 0.0001138448715209961, 0.00012920796871185303, 0.00014457106590270996, 0.0001599341630935669, 0.00017529726028442383, 0.00019066035747528076, 0.0002060234546661377, 0.00022138655185699463, 0.00023674964904785156, 0.0002521127462387085, 0.00026747584342956543, 0.00028283894062042236, 0.0002982020378112793, 0.00031356513500213623, 0.00032892823219299316, 0.0003442913293838501, 0.00035965442657470703, 0.00037501752376556396, 0.0003903806209564209, 0.00040574371814727783, 0.00042110681533813477, 0.0004364699125289917, 0.00045183300971984863, 0.00046719610691070557, 0.0004825592041015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 2.0, 14.0, 17.0, 18.0, 19.0, 42.0, 61.0, 96.0, 155.0, 243.0, 526.0, 903.0, 2275.0, 10398.0, 91895.0, 756860.0, 163140.0, 16277.0, 3145.0, 1114.0, 563.0, 284.0, 168.0, 124.0, 55.0, 42.0, 21.0, 26.0, 10.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.3828125, -5.231689453125, -5.08056640625, -4.929443359375, -4.7783203125, -4.627197265625, -4.47607421875, -4.324951171875, -4.173828125, -4.022705078125, -3.87158203125, -3.720458984375, -3.5693359375, -3.418212890625, -3.26708984375, -3.115966796875, -2.96484375, -2.813720703125, -2.66259765625, -2.511474609375, -2.3603515625, -2.209228515625, -2.05810546875, -1.906982421875, -1.755859375, -1.604736328125, -1.45361328125, -1.302490234375, -1.1513671875, -1.000244140625, -0.84912109375, -0.697998046875, -0.546875, -0.395751953125, -0.24462890625, -0.093505859375, 0.0576171875, 0.208740234375, 0.35986328125, 0.510986328125, 0.662109375, 0.813232421875, 0.96435546875, 1.115478515625, 1.2666015625, 1.417724609375, 1.56884765625, 1.719970703125, 1.87109375, 2.022216796875, 2.17333984375, 2.324462890625, 2.4755859375, 2.626708984375, 2.77783203125, 2.928955078125, 3.080078125, 3.231201171875, 3.38232421875, 3.533447265625, 3.6845703125, 3.835693359375, 3.98681640625, 4.137939453125, 4.2890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 8.0, 7.0, 20.0, 19.0, 20.0, 36.0, 41.0, 57.0, 75.0, 126.0, 141.0, 116.0, 102.0, 55.0, 48.0, 36.0, 22.0, 17.0, 14.0, 5.0, 8.0, 7.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.235687255859375, -3.11004638671875, -2.984405517578125, -2.8587646484375, -2.733123779296875, -2.60748291015625, -2.481842041015625, -2.356201171875, -2.230560302734375, -2.10491943359375, -1.979278564453125, -1.8536376953125, -1.727996826171875, -1.60235595703125, -1.476715087890625, -1.35107421875, -1.225433349609375, -1.09979248046875, -0.974151611328125, -0.8485107421875, -0.722869873046875, -0.59722900390625, -0.471588134765625, -0.345947265625, -0.220306396484375, -0.09466552734375, 0.030975341796875, 0.1566162109375, 0.282257080078125, 0.40789794921875, 0.533538818359375, 0.6591796875, 0.784820556640625, 0.91046142578125, 1.036102294921875, 1.1617431640625, 1.287384033203125, 1.41302490234375, 1.538665771484375, 1.664306640625, 1.789947509765625, 1.91558837890625, 2.041229248046875, 2.1668701171875, 2.292510986328125, 2.41815185546875, 2.543792724609375, 2.66943359375, 2.795074462890625, 2.92071533203125, 3.046356201171875, 3.1719970703125, 3.297637939453125, 3.42327880859375, 3.548919677734375, 3.674560546875, 3.800201416015625, 3.92584228515625, 4.051483154296875, 4.1771240234375, 4.302764892578125, 4.42840576171875, 4.554046630859375, 4.6796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 18.0, 23.0, 50.0, 133.0, 178.0, 209.0, 169.0, 125.0, 51.0, 21.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.34636688232422, -64.7073745727539, -62.068382263183594, -59.42938995361328, -56.79039764404297, -54.151405334472656, -51.51241683959961, -48.8734245300293, -46.234432220458984, -43.59543991088867, -40.95644760131836, -38.31745529174805, -35.678466796875, -33.03947448730469, -30.400482177734375, -27.761489868164062, -25.12249755859375, -22.483505249023438, -19.844512939453125, -17.205522537231445, -14.566530227661133, -11.92753791809082, -9.288546562194824, -6.649555206298828, -4.010562896728516, -1.3715710639953613, 1.267420768737793, 3.9064126014709473, 6.545404434204102, 9.184396743774414, 11.82338809967041, 14.462379455566406, 17.101364135742188, 19.7403564453125, 22.379348754882812, 25.018339157104492, 27.657331466674805, 30.296323776245117, 32.9353141784668, 35.57430648803711, 38.21329879760742, 40.852291107177734, 43.49128341674805, 46.13027572631836, 48.769264221191406, 51.40825653076172, 54.04724884033203, 56.686241149902344, 59.325233459472656, 61.96422576904297, 64.60321807861328, 67.2422103881836, 69.8812026977539, 72.52019500732422, 75.15918731689453, 77.79817199707031, 80.43716430664062, 83.07615661621094, 85.71514892578125, 88.35414123535156, 90.99313354492188, 93.63212585449219, 96.2711181640625, 98.91011047363281, 101.54910278320312]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 8.0, 5.0, 13.0, 10.0, 12.0, 13.0, 20.0, 13.0, 27.0, 26.0, 32.0, 26.0, 36.0, 34.0, 51.0, 54.0, 51.0, 44.0, 56.0, 44.0, 45.0, 33.0, 55.0, 37.0, 31.0, 32.0, 22.0, 23.0, 27.0, 23.0, 23.0, 11.0, 9.0, 10.0, 8.0, 15.0, 0.0, 4.0, 9.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.828792572021484, -46.032745361328125, -44.23670196533203, -42.44065475463867, -40.64460754394531, -38.84856414794922, -37.05251693725586, -35.2564697265625, -33.460426330566406, -31.66438102722168, -29.868335723876953, -28.072288513183594, -26.276243209838867, -24.48019790649414, -22.68415069580078, -20.888105392456055, -19.092060089111328, -17.2960147857666, -15.499968528747559, -13.703922271728516, -11.907876968383789, -10.111831665039062, -8.31578540802002, -6.519739151000977, -4.72369384765625, -2.9276480674743652, -1.1316022872924805, 0.6644434928894043, 2.460489273071289, 4.256534576416016, 6.052580833435059, 7.848627090454102, 9.644668579101562, 11.440713882446289, 13.236760139465332, 15.032806396484375, 16.8288516998291, 18.624897003173828, 20.420944213867188, 22.216989517211914, 24.01303482055664, 25.809080123901367, 27.605125427246094, 29.401172637939453, 31.19721794128418, 32.993263244628906, 34.789310455322266, 36.585357666015625, 38.38140106201172, 40.17744827270508, 41.97349166870117, 43.76953887939453, 45.565582275390625, 47.361629486083984, 49.157676696777344, 50.95372009277344, 52.7497673034668, 54.545814514160156, 56.34185791015625, 58.13790512084961, 59.93395233154297, 61.72999572753906, 63.52604293823242, 65.32209014892578, 67.11813354492188]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 16.0, 21.0, 38.0, 61.0, 78.0, 135.0, 227.0, 390.0, 745.0, 1439.0, 2816.0, 5960.0, 14649.0, 54867.0, 627871.0, 3331947.0, 113196.0, 23292.0, 8337.0, 3801.0, 1922.0, 1013.0, 584.0, 303.0, 191.0, 112.0, 84.0, 44.0, 38.0, 29.0, 17.0, 10.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.59881591796875, -5.3929443359375, -5.18707275390625, -4.981201171875, -4.77532958984375, -4.5694580078125, -4.36358642578125, -4.15771484375, -3.95184326171875, -3.7459716796875, -3.54010009765625, -3.334228515625, -3.12835693359375, -2.9224853515625, -2.71661376953125, -2.5107421875, -2.30487060546875, -2.0989990234375, -1.89312744140625, -1.687255859375, -1.48138427734375, -1.2755126953125, -1.06964111328125, -0.86376953125, -0.65789794921875, -0.4520263671875, -0.24615478515625, -0.040283203125, 0.16558837890625, 0.3714599609375, 0.57733154296875, 0.783203125, 0.98907470703125, 1.1949462890625, 1.40081787109375, 1.606689453125, 1.81256103515625, 2.0184326171875, 2.22430419921875, 2.43017578125, 2.63604736328125, 2.8419189453125, 3.04779052734375, 3.253662109375, 3.45953369140625, 3.6654052734375, 3.87127685546875, 4.0771484375, 4.28302001953125, 4.4888916015625, 4.69476318359375, 4.900634765625, 5.10650634765625, 5.3123779296875, 5.51824951171875, 5.72412109375, 5.92999267578125, 6.1358642578125, 6.34173583984375, 6.547607421875, 6.75347900390625, 6.9593505859375, 7.16522216796875, 7.37109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 9.0, 8.0, 15.0, 31.0, 19.0, 25.0, 38.0, 41.0, 39.0, 41.0, 35.0, 47.0, 46.0, 63.0, 50.0, 52.0, 49.0, 40.0, 49.0, 25.0, 35.0, 37.0, 46.0, 21.0, 21.0, 29.0, 13.0, 15.0, 13.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.138671875, -2.058013916015625, -1.97735595703125, -1.896697998046875, -1.8160400390625, -1.735382080078125, -1.65472412109375, -1.574066162109375, -1.493408203125, -1.412750244140625, -1.33209228515625, -1.251434326171875, -1.1707763671875, -1.090118408203125, -1.00946044921875, -0.928802490234375, -0.84814453125, -0.767486572265625, -0.68682861328125, -0.606170654296875, -0.5255126953125, -0.444854736328125, -0.36419677734375, -0.283538818359375, -0.202880859375, -0.122222900390625, -0.04156494140625, 0.039093017578125, 0.1197509765625, 0.200408935546875, 0.28106689453125, 0.361724853515625, 0.4423828125, 0.523040771484375, 0.60369873046875, 0.684356689453125, 0.7650146484375, 0.845672607421875, 0.92633056640625, 1.006988525390625, 1.087646484375, 1.168304443359375, 1.24896240234375, 1.329620361328125, 1.4102783203125, 1.490936279296875, 1.57159423828125, 1.652252197265625, 1.73291015625, 1.813568115234375, 1.89422607421875, 1.974884033203125, 2.0555419921875, 2.136199951171875, 2.21685791015625, 2.297515869140625, 2.378173828125, 2.458831787109375, 2.53948974609375, 2.620147705078125, 2.7008056640625, 2.781463623046875, 2.86212158203125, 2.942779541015625, 3.0234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 12.0, 12.0, 14.0, 30.0, 38.0, 61.0, 107.0, 207.0, 357.0, 651.0, 1182.0, 2302.0, 5193.0, 13988.0, 48637.0, 295015.0, 3328314.0, 410392.0, 60192.0, 16308.0, 5849.0, 2596.0, 1309.0, 621.0, 377.0, 219.0, 129.0, 65.0, 42.0, 22.0, 18.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.87091064453125, -3.7066650390625, -3.54241943359375, -3.378173828125, -3.21392822265625, -3.0496826171875, -2.88543701171875, -2.72119140625, -2.55694580078125, -2.3927001953125, -2.22845458984375, -2.064208984375, -1.89996337890625, -1.7357177734375, -1.57147216796875, -1.4072265625, -1.24298095703125, -1.0787353515625, -0.91448974609375, -0.750244140625, -0.58599853515625, -0.4217529296875, -0.25750732421875, -0.09326171875, 0.07098388671875, 0.2352294921875, 0.39947509765625, 0.563720703125, 0.72796630859375, 0.8922119140625, 1.05645751953125, 1.220703125, 1.38494873046875, 1.5491943359375, 1.71343994140625, 1.877685546875, 2.04193115234375, 2.2061767578125, 2.37042236328125, 2.53466796875, 2.69891357421875, 2.8631591796875, 3.02740478515625, 3.191650390625, 3.35589599609375, 3.5201416015625, 3.68438720703125, 3.8486328125, 4.01287841796875, 4.1771240234375, 4.34136962890625, 4.505615234375, 4.66986083984375, 4.8341064453125, 4.99835205078125, 5.16259765625, 5.32684326171875, 5.4910888671875, 5.65533447265625, 5.819580078125, 5.98382568359375, 6.1480712890625, 6.31231689453125, 6.4765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 13.0, 20.0, 29.0, 59.0, 82.0, 162.0, 263.0, 913.0, 1635.0, 397.0, 193.0, 97.0, 67.0, 30.0, 19.0, 17.0, 5.0, 4.0, 8.0, 5.0, 9.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.01171875, -3.891021728515625, -3.77032470703125, -3.649627685546875, -3.5289306640625, -3.408233642578125, -3.28753662109375, -3.166839599609375, -3.046142578125, -2.925445556640625, -2.80474853515625, -2.684051513671875, -2.5633544921875, -2.442657470703125, -2.32196044921875, -2.201263427734375, -2.08056640625, -1.959869384765625, -1.83917236328125, -1.718475341796875, -1.5977783203125, -1.477081298828125, -1.35638427734375, -1.235687255859375, -1.114990234375, -0.994293212890625, -0.87359619140625, -0.752899169921875, -0.6322021484375, -0.511505126953125, -0.39080810546875, -0.270111083984375, -0.1494140625, -0.028717041015625, 0.09197998046875, 0.212677001953125, 0.3333740234375, 0.454071044921875, 0.57476806640625, 0.695465087890625, 0.816162109375, 0.936859130859375, 1.05755615234375, 1.178253173828125, 1.2989501953125, 1.419647216796875, 1.54034423828125, 1.661041259765625, 1.78173828125, 1.902435302734375, 2.02313232421875, 2.143829345703125, 2.2645263671875, 2.385223388671875, 2.50592041015625, 2.626617431640625, 2.747314453125, 2.868011474609375, 2.98870849609375, 3.109405517578125, 3.2301025390625, 3.350799560546875, 3.47149658203125, 3.592193603515625, 3.712890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 31.0, 98.0, 196.0, 308.0, 232.0, 86.0, 26.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.54499053955078, -36.361656188964844, -35.178321838378906, -33.994991302490234, -32.8116569519043, -31.62832260131836, -30.444988250732422, -29.261655807495117, -28.078323364257812, -26.894989013671875, -25.71165657043457, -24.528322219848633, -23.344989776611328, -22.16165542602539, -20.978321075439453, -19.79498863220215, -18.61165428161621, -17.428319931030273, -16.24498748779297, -15.061653137207031, -13.878320693969727, -12.694986343383789, -11.511652946472168, -10.328319549560547, -9.144986152648926, -7.961652755737305, -6.778319358825684, -5.594985485076904, -4.411652088165283, -3.228318691253662, -2.044984817504883, -0.8616514205932617, 0.3216819763183594, 1.50501549243927, 2.6883490085601807, 3.871682643890381, 5.055016040802002, 6.238349437713623, 7.421683311462402, 8.605016708374023, 9.788350105285645, 10.971683502197266, 12.155016899108887, 13.338350296020508, 14.521684646606445, 15.70501708984375, 16.888351440429688, 18.071685791015625, 19.25501823425293, 20.438352584838867, 21.621685028076172, 22.80501937866211, 23.988351821899414, 25.17168617248535, 26.355018615722656, 27.538352966308594, 28.72168731689453, 29.90502166748047, 31.088354110717773, 32.27168655395508, 33.455020904541016, 34.63835525512695, 35.82168960571289, 37.00502014160156, 38.1883544921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 7.0, 5.0, 12.0, 12.0, 12.0, 20.0, 17.0, 22.0, 26.0, 44.0, 41.0, 34.0, 45.0, 34.0, 43.0, 50.0, 44.0, 54.0, 55.0, 42.0, 40.0, 49.0, 41.0, 26.0, 35.0, 40.0, 30.0, 30.0, 13.0, 17.0, 11.0, 10.0, 11.0, 11.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.848400115966797, -10.46182918548584, -10.075257301330566, -9.68868637084961, -9.302114486694336, -8.915543556213379, -8.528971672058105, -8.142400741577148, -7.755828857421875, -7.36925745010376, -6.9826860427856445, -6.596114635467529, -6.209543228149414, -5.822971820831299, -5.436400413513184, -5.049829483032227, -4.663258075714111, -4.276686668395996, -3.890115261077881, -3.5035438537597656, -3.1169724464416504, -2.730401039123535, -2.343829870223999, -1.9572584629058838, -1.5706870555877686, -1.1841156482696533, -0.7975443005561829, -0.4109729528427124, -0.024401545524597168, 0.36216986179351807, 0.7487411499023438, 1.135312557220459, 1.5218839645385742, 1.9084553718566895, 2.2950267791748047, 2.68159818649292, 3.068169593811035, 3.4547410011291504, 3.8413121700286865, 4.227883338928223, 4.614455223083496, 5.001026630401611, 5.387598037719727, 5.774169445037842, 6.160740852355957, 6.547312259674072, 6.9338836669921875, 7.3204545974731445, 7.70702600479126, 8.093597412109375, 8.480168342590332, 8.866740226745605, 9.253311157226562, 9.639883041381836, 10.026453971862793, 10.413025856018066, 10.799596786499023, 11.18616771697998, 11.572739601135254, 11.959310531616211, 12.345882415771484, 12.732453346252441, 13.119025230407715, 13.505596160888672, 13.892168045043945]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 11.0, 18.0, 24.0, 33.0, 28.0, 53.0, 83.0, 120.0, 174.0, 239.0, 449.0, 714.0, 1206.0, 2232.0, 4306.0, 8761.0, 18679.0, 41676.0, 98726.0, 220858.0, 312503.0, 188899.0, 81355.0, 35185.0, 15933.0, 7621.0, 3802.0, 1982.0, 1057.0, 641.0, 395.0, 231.0, 153.0, 130.0, 74.0, 58.0, 28.0, 26.0, 18.0, 18.0, 12.0, 12.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.7734375, -4.6304931640625, -4.487548828125, -4.3446044921875, -4.20166015625, -4.0587158203125, -3.915771484375, -3.7728271484375, -3.6298828125, -3.4869384765625, -3.343994140625, -3.2010498046875, -3.05810546875, -2.9151611328125, -2.772216796875, -2.6292724609375, -2.486328125, -2.3433837890625, -2.200439453125, -2.0574951171875, -1.91455078125, -1.7716064453125, -1.628662109375, -1.4857177734375, -1.3427734375, -1.1998291015625, -1.056884765625, -0.9139404296875, -0.77099609375, -0.6280517578125, -0.485107421875, -0.3421630859375, -0.19921875, -0.0562744140625, 0.086669921875, 0.2296142578125, 0.37255859375, 0.5155029296875, 0.658447265625, 0.8013916015625, 0.9443359375, 1.0872802734375, 1.230224609375, 1.3731689453125, 1.51611328125, 1.6590576171875, 1.802001953125, 1.9449462890625, 2.087890625, 2.2308349609375, 2.373779296875, 2.5167236328125, 2.65966796875, 2.8026123046875, 2.945556640625, 3.0885009765625, 3.2314453125, 3.3743896484375, 3.517333984375, 3.6602783203125, 3.80322265625, 3.9461669921875, 4.089111328125, 4.2320556640625, 4.375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 10.0, 9.0, 16.0, 10.0, 13.0, 24.0, 32.0, 25.0, 29.0, 38.0, 45.0, 46.0, 41.0, 42.0, 36.0, 45.0, 49.0, 38.0, 45.0, 35.0, 40.0, 40.0, 35.0, 30.0, 37.0, 32.0, 21.0, 23.0, 24.0, 9.0, 22.0, 10.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.15234375, -2.082183837890625, -2.01202392578125, -1.941864013671875, -1.8717041015625, -1.801544189453125, -1.73138427734375, -1.661224365234375, -1.591064453125, -1.520904541015625, -1.45074462890625, -1.380584716796875, -1.3104248046875, -1.240264892578125, -1.17010498046875, -1.099945068359375, -1.02978515625, -0.959625244140625, -0.88946533203125, -0.819305419921875, -0.7491455078125, -0.678985595703125, -0.60882568359375, -0.538665771484375, -0.468505859375, -0.398345947265625, -0.32818603515625, -0.258026123046875, -0.1878662109375, -0.117706298828125, -0.04754638671875, 0.022613525390625, 0.0927734375, 0.162933349609375, 0.23309326171875, 0.303253173828125, 0.3734130859375, 0.443572998046875, 0.51373291015625, 0.583892822265625, 0.654052734375, 0.724212646484375, 0.79437255859375, 0.864532470703125, 0.9346923828125, 1.004852294921875, 1.07501220703125, 1.145172119140625, 1.21533203125, 1.285491943359375, 1.35565185546875, 1.425811767578125, 1.4959716796875, 1.566131591796875, 1.63629150390625, 1.706451416015625, 1.776611328125, 1.846771240234375, 1.91693115234375, 1.987091064453125, 2.0572509765625, 2.127410888671875, 2.19757080078125, 2.267730712890625, 2.337890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 11.0, 10.0, 16.0, 20.0, 24.0, 36.0, 48.0, 79.0, 119.0, 148.0, 201.0, 301.0, 489.0, 877.0, 1952.0, 6348.0, 30797.0, 261924.0, 632940.0, 91479.0, 13940.0, 3477.0, 1389.0, 645.0, 406.0, 246.0, 184.0, 131.0, 95.0, 66.0, 33.0, 22.0, 23.0, 11.0, 6.0, 6.0, 4.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.6484375, -9.30712890625, -8.9658203125, -8.62451171875, -8.283203125, -7.94189453125, -7.6005859375, -7.25927734375, -6.91796875, -6.57666015625, -6.2353515625, -5.89404296875, -5.552734375, -5.21142578125, -4.8701171875, -4.52880859375, -4.1875, -3.84619140625, -3.5048828125, -3.16357421875, -2.822265625, -2.48095703125, -2.1396484375, -1.79833984375, -1.45703125, -1.11572265625, -0.7744140625, -0.43310546875, -0.091796875, 0.24951171875, 0.5908203125, 0.93212890625, 1.2734375, 1.61474609375, 1.9560546875, 2.29736328125, 2.638671875, 2.97998046875, 3.3212890625, 3.66259765625, 4.00390625, 4.34521484375, 4.6865234375, 5.02783203125, 5.369140625, 5.71044921875, 6.0517578125, 6.39306640625, 6.734375, 7.07568359375, 7.4169921875, 7.75830078125, 8.099609375, 8.44091796875, 8.7822265625, 9.12353515625, 9.46484375, 9.80615234375, 10.1474609375, 10.48876953125, 10.830078125, 11.17138671875, 11.5126953125, 11.85400390625, 12.1953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 10.0, 9.0, 20.0, 14.0, 14.0, 19.0, 26.0, 26.0, 25.0, 35.0, 41.0, 40.0, 63.0, 39.0, 48.0, 33.0, 45.0, 36.0, 48.0, 50.0, 51.0, 43.0, 29.0, 29.0, 24.0, 33.0, 16.0, 15.0, 20.0, 15.0, 15.0, 12.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-13.390625, -12.9970703125, -12.603515625, -12.2099609375, -11.81640625, -11.4228515625, -11.029296875, -10.6357421875, -10.2421875, -9.8486328125, -9.455078125, -9.0615234375, -8.66796875, -8.2744140625, -7.880859375, -7.4873046875, -7.09375, -6.7001953125, -6.306640625, -5.9130859375, -5.51953125, -5.1259765625, -4.732421875, -4.3388671875, -3.9453125, -3.5517578125, -3.158203125, -2.7646484375, -2.37109375, -1.9775390625, -1.583984375, -1.1904296875, -0.796875, -0.4033203125, -0.009765625, 0.3837890625, 0.77734375, 1.1708984375, 1.564453125, 1.9580078125, 2.3515625, 2.7451171875, 3.138671875, 3.5322265625, 3.92578125, 4.3193359375, 4.712890625, 5.1064453125, 5.5, 5.8935546875, 6.287109375, 6.6806640625, 7.07421875, 7.4677734375, 7.861328125, 8.2548828125, 8.6484375, 9.0419921875, 9.435546875, 9.8291015625, 10.22265625, 10.6162109375, 11.009765625, 11.4033203125, 11.796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 6.0, 10.0, 12.0, 18.0, 50.0, 110.0, 213.0, 707.0, 2347.0, 18935.0, 352149.0, 630641.0, 38185.0, 3698.0, 886.0, 332.0, 103.0, 63.0, 29.0, 14.0, 12.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.54638671875, -5.3623046875, -5.17822265625, -4.994140625, -4.81005859375, -4.6259765625, -4.44189453125, -4.2578125, -4.07373046875, -3.8896484375, -3.70556640625, -3.521484375, -3.33740234375, -3.1533203125, -2.96923828125, -2.78515625, -2.60107421875, -2.4169921875, -2.23291015625, -2.048828125, -1.86474609375, -1.6806640625, -1.49658203125, -1.3125, -1.12841796875, -0.9443359375, -0.76025390625, -0.576171875, -0.39208984375, -0.2080078125, -0.02392578125, 0.16015625, 0.34423828125, 0.5283203125, 0.71240234375, 0.896484375, 1.08056640625, 1.2646484375, 1.44873046875, 1.6328125, 1.81689453125, 2.0009765625, 2.18505859375, 2.369140625, 2.55322265625, 2.7373046875, 2.92138671875, 3.10546875, 3.28955078125, 3.4736328125, 3.65771484375, 3.841796875, 4.02587890625, 4.2099609375, 4.39404296875, 4.578125, 4.76220703125, 4.9462890625, 5.13037109375, 5.314453125, 5.49853515625, 5.6826171875, 5.86669921875, 6.05078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 11.0, 14.0, 15.0, 7.0, 18.0, 34.0, 36.0, 42.0, 36.0, 42.0, 60.0, 70.0, 82.0, 74.0, 79.0, 71.0, 48.0, 43.0, 45.0, 35.0, 31.0, 17.0, 19.0, 11.0, 8.0, 11.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0005645751953125, -0.0005494169890880585, -0.0005342587828636169, -0.0005191005766391754, -0.0005039423704147339, -0.0004887841641902924, -0.00047362595796585083, -0.0004584677517414093, -0.0004433095455169678, -0.00042815133929252625, -0.0004129931330680847, -0.0003978349268436432, -0.00038267672061920166, -0.00036751851439476013, -0.0003523603081703186, -0.0003372021019458771, -0.00032204389572143555, -0.000306885689496994, -0.0002917274832725525, -0.00027656927704811096, -0.00026141107082366943, -0.0002462528645992279, -0.00023109465837478638, -0.00021593645215034485, -0.00020077824592590332, -0.0001856200397014618, -0.00017046183347702026, -0.00015530362725257874, -0.0001401454210281372, -0.00012498721480369568, -0.00010982900857925415, -9.467080235481262e-05, -7.95125961303711e-05, -6.435438990592957e-05, -4.919618368148804e-05, -3.403797745704651e-05, -1.887977123260498e-05, -3.721565008163452e-06, 1.1436641216278076e-05, 2.6594847440719604e-05, 4.175305366516113e-05, 5.691125988960266e-05, 7.206946611404419e-05, 8.722767233848572e-05, 0.00010238587856292725, 0.00011754408478736877, 0.0001327022910118103, 0.00014786049723625183, 0.00016301870346069336, 0.0001781769096851349, 0.00019333511590957642, 0.00020849332213401794, 0.00022365152835845947, 0.000238809734582901, 0.00025396794080734253, 0.00026912614703178406, 0.0002842843532562256, 0.0002994425594806671, 0.00031460076570510864, 0.00032975897192955017, 0.0003449171781539917, 0.00036007538437843323, 0.00037523359060287476, 0.0003903917968273163, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 13.0, 12.0, 24.0, 27.0, 34.0, 34.0, 60.0, 82.0, 145.0, 238.0, 345.0, 644.0, 1241.0, 3063.0, 10488.0, 63614.0, 424401.0, 456721.0, 69674.0, 11451.0, 3197.0, 1285.0, 658.0, 369.0, 238.0, 159.0, 101.0, 50.0, 44.0, 30.0, 22.0, 17.0, 16.0, 7.0, 7.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.8515625, -3.731292724609375, -3.61102294921875, -3.490753173828125, -3.3704833984375, -3.250213623046875, -3.12994384765625, -3.009674072265625, -2.889404296875, -2.769134521484375, -2.64886474609375, -2.528594970703125, -2.4083251953125, -2.288055419921875, -2.16778564453125, -2.047515869140625, -1.92724609375, -1.806976318359375, -1.68670654296875, -1.566436767578125, -1.4461669921875, -1.325897216796875, -1.20562744140625, -1.085357666015625, -0.965087890625, -0.844818115234375, -0.72454833984375, -0.604278564453125, -0.4840087890625, -0.363739013671875, -0.24346923828125, -0.123199462890625, -0.0029296875, 0.117340087890625, 0.23760986328125, 0.357879638671875, 0.4781494140625, 0.598419189453125, 0.71868896484375, 0.838958740234375, 0.959228515625, 1.079498291015625, 1.19976806640625, 1.320037841796875, 1.4403076171875, 1.560577392578125, 1.68084716796875, 1.801116943359375, 1.92138671875, 2.041656494140625, 2.16192626953125, 2.282196044921875, 2.4024658203125, 2.522735595703125, 2.64300537109375, 2.763275146484375, 2.883544921875, 3.003814697265625, 3.12408447265625, 3.244354248046875, 3.3646240234375, 3.484893798828125, 3.60516357421875, 3.725433349609375, 3.845703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 12.0, 20.0, 18.0, 31.0, 36.0, 47.0, 48.0, 69.0, 100.0, 94.0, 102.0, 78.0, 93.0, 49.0, 45.0, 35.0, 30.0, 24.0, 10.0, 17.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.61328125, -4.485198974609375, -4.35711669921875, -4.229034423828125, -4.1009521484375, -3.972869873046875, -3.84478759765625, -3.716705322265625, -3.588623046875, -3.460540771484375, -3.33245849609375, -3.204376220703125, -3.0762939453125, -2.948211669921875, -2.82012939453125, -2.692047119140625, -2.56396484375, -2.435882568359375, -2.30780029296875, -2.179718017578125, -2.0516357421875, -1.923553466796875, -1.79547119140625, -1.667388916015625, -1.539306640625, -1.411224365234375, -1.28314208984375, -1.155059814453125, -1.0269775390625, -0.898895263671875, -0.77081298828125, -0.642730712890625, -0.5146484375, -0.386566162109375, -0.25848388671875, -0.130401611328125, -0.0023193359375, 0.125762939453125, 0.25384521484375, 0.381927490234375, 0.510009765625, 0.638092041015625, 0.76617431640625, 0.894256591796875, 1.0223388671875, 1.150421142578125, 1.27850341796875, 1.406585693359375, 1.53466796875, 1.662750244140625, 1.79083251953125, 1.918914794921875, 2.0469970703125, 2.175079345703125, 2.30316162109375, 2.431243896484375, 2.559326171875, 2.687408447265625, 2.81549072265625, 2.943572998046875, 3.0716552734375, 3.199737548828125, 3.32781982421875, 3.455902099609375, 3.583984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 11.0, 21.0, 70.0, 195.0, 292.0, 242.0, 97.0, 47.0, 15.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.32371520996094, -70.89891815185547, -67.47411346435547, -64.04931640625, -60.62451934814453, -57.1997184753418, -53.77491760253906, -50.350120544433594, -46.925323486328125, -43.50052261352539, -40.07572555541992, -36.65092468261719, -33.22612762451172, -29.801326751708984, -26.376527786254883, -22.95172882080078, -19.526927947998047, -16.102128982543945, -12.677330017089844, -9.252530097961426, -5.827731132507324, -2.4029312133789062, 1.0218677520751953, 4.446666717529297, 7.871465682983398, 11.2962646484375, 14.721063613891602, 18.145862579345703, 21.570663452148438, 24.99546241760254, 28.42026138305664, 31.845060348510742, 35.269859313964844, 38.69466018676758, 42.11945724487305, 45.54425811767578, 48.96905517578125, 52.393856048583984, 55.81865692138672, 59.24345397949219, 62.668251037597656, 66.09304809570312, 69.51785278320312, 72.9426498413086, 76.36744689941406, 79.79225158691406, 83.21704864501953, 86.641845703125, 90.066650390625, 93.49144744873047, 96.91625213623047, 100.34104919433594, 103.7658462524414, 107.19064331054688, 110.61544799804688, 114.04024505615234, 117.46504211425781, 120.88983917236328, 124.31464385986328, 127.73944091796875, 131.16424560546875, 134.5890350341797, 138.0138397216797, 141.43862915039062, 144.86343383789062]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 12.0, 8.0, 12.0, 17.0, 18.0, 20.0, 32.0, 22.0, 39.0, 48.0, 36.0, 46.0, 47.0, 50.0, 50.0, 60.0, 51.0, 66.0, 64.0, 41.0, 35.0, 40.0, 29.0, 29.0, 20.0, 21.0, 12.0, 18.0, 7.0, 10.0, 8.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.88848876953125, -64.68608093261719, -62.483673095703125, -60.28126907348633, -58.078861236572266, -55.8764533996582, -53.674049377441406, -51.471641540527344, -49.26923370361328, -47.06682586669922, -44.864418029785156, -42.66201400756836, -40.4596061706543, -38.257198333740234, -36.05479431152344, -33.852386474609375, -31.649978637695312, -29.44757080078125, -27.24516487121582, -25.04275894165039, -22.840351104736328, -20.637943267822266, -18.435537338256836, -16.233131408691406, -14.030723571777344, -11.828316688537598, -9.625909805297852, -7.4235029220581055, -5.221096038818359, -3.0186891555786133, -0.8162822723388672, 1.386124610900879, 3.5885238647460938, 5.79093074798584, 7.993337631225586, 10.195744514465332, 12.398151397705078, 14.600558280944824, 16.80296516418457, 19.00537109375, 21.207778930664062, 23.410186767578125, 25.612592697143555, 27.814998626708984, 30.017406463623047, 32.21981430053711, 34.422218322753906, 36.62462615966797, 38.82703399658203, 41.029441833496094, 43.231849670410156, 45.43425369262695, 47.636661529541016, 49.83906936645508, 52.041473388671875, 54.24388122558594, 56.4462890625, 58.64869689941406, 60.851104736328125, 63.05350875854492, 65.25592041015625, 67.45832061767578, 69.66072845458984, 71.8631362915039, 74.06554412841797]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 10.0, 13.0, 11.0, 16.0, 23.0, 26.0, 54.0, 64.0, 78.0, 173.0, 308.0, 713.0, 1880.0, 5035.0, 18715.0, 116297.0, 3901021.0, 121977.0, 19107.0, 5245.0, 1854.0, 743.0, 384.0, 189.0, 95.0, 67.0, 51.0, 29.0, 20.0, 20.0, 21.0, 8.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.84375, -4.6461181640625, -4.448486328125, -4.2508544921875, -4.05322265625, -3.8555908203125, -3.657958984375, -3.4603271484375, -3.2626953125, -3.0650634765625, -2.867431640625, -2.6697998046875, -2.47216796875, -2.2745361328125, -2.076904296875, -1.8792724609375, -1.681640625, -1.4840087890625, -1.286376953125, -1.0887451171875, -0.89111328125, -0.6934814453125, -0.495849609375, -0.2982177734375, -0.1005859375, 0.0970458984375, 0.294677734375, 0.4923095703125, 0.68994140625, 0.8875732421875, 1.085205078125, 1.2828369140625, 1.48046875, 1.6781005859375, 1.875732421875, 2.0733642578125, 2.27099609375, 2.4686279296875, 2.666259765625, 2.8638916015625, 3.0615234375, 3.2591552734375, 3.456787109375, 3.6544189453125, 3.85205078125, 4.0496826171875, 4.247314453125, 4.4449462890625, 4.642578125, 4.8402099609375, 5.037841796875, 5.2354736328125, 5.43310546875, 5.6307373046875, 5.828369140625, 6.0260009765625, 6.2236328125, 6.4212646484375, 6.618896484375, 6.8165283203125, 7.01416015625, 7.2117919921875, 7.409423828125, 7.6070556640625, 7.8046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 11.0, 15.0, 18.0, 14.0, 33.0, 30.0, 37.0, 38.0, 53.0, 55.0, 61.0, 65.0, 62.0, 64.0, 60.0, 51.0, 45.0, 47.0, 47.0, 30.0, 35.0, 27.0, 21.0, 18.0, 19.0, 9.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.837890625, -2.720489501953125, -2.60308837890625, -2.485687255859375, -2.3682861328125, -2.250885009765625, -2.13348388671875, -2.016082763671875, -1.898681640625, -1.781280517578125, -1.66387939453125, -1.546478271484375, -1.4290771484375, -1.311676025390625, -1.19427490234375, -1.076873779296875, -0.95947265625, -0.842071533203125, -0.72467041015625, -0.607269287109375, -0.4898681640625, -0.372467041015625, -0.25506591796875, -0.137664794921875, -0.020263671875, 0.097137451171875, 0.21453857421875, 0.331939697265625, 0.4493408203125, 0.566741943359375, 0.68414306640625, 0.801544189453125, 0.9189453125, 1.036346435546875, 1.15374755859375, 1.271148681640625, 1.3885498046875, 1.505950927734375, 1.62335205078125, 1.740753173828125, 1.858154296875, 1.975555419921875, 2.09295654296875, 2.210357666015625, 2.3277587890625, 2.445159912109375, 2.56256103515625, 2.679962158203125, 2.79736328125, 2.914764404296875, 3.03216552734375, 3.149566650390625, 3.2669677734375, 3.384368896484375, 3.50177001953125, 3.619171142578125, 3.736572265625, 3.853973388671875, 3.97137451171875, 4.088775634765625, 4.2061767578125, 4.323577880859375, 4.44097900390625, 4.558380126953125, 4.67578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 11.0, 13.0, 18.0, 31.0, 35.0, 69.0, 80.0, 142.0, 210.0, 361.0, 619.0, 1054.0, 1921.0, 3668.0, 7413.0, 17096.0, 48083.0, 248999.0, 3631140.0, 166354.0, 38842.0, 14420.0, 6499.0, 3226.0, 1648.0, 914.0, 525.0, 315.0, 209.0, 130.0, 83.0, 49.0, 28.0, 20.0, 16.0, 16.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.390625, -3.26690673828125, -3.1431884765625, -3.01947021484375, -2.895751953125, -2.77203369140625, -2.6483154296875, -2.52459716796875, -2.40087890625, -2.27716064453125, -2.1534423828125, -2.02972412109375, -1.906005859375, -1.78228759765625, -1.6585693359375, -1.53485107421875, -1.4111328125, -1.28741455078125, -1.1636962890625, -1.03997802734375, -0.916259765625, -0.79254150390625, -0.6688232421875, -0.54510498046875, -0.42138671875, -0.29766845703125, -0.1739501953125, -0.05023193359375, 0.073486328125, 0.19720458984375, 0.3209228515625, 0.44464111328125, 0.568359375, 0.69207763671875, 0.8157958984375, 0.93951416015625, 1.063232421875, 1.18695068359375, 1.3106689453125, 1.43438720703125, 1.55810546875, 1.68182373046875, 1.8055419921875, 1.92926025390625, 2.052978515625, 2.17669677734375, 2.3004150390625, 2.42413330078125, 2.5478515625, 2.67156982421875, 2.7952880859375, 2.91900634765625, 3.042724609375, 3.16644287109375, 3.2901611328125, 3.41387939453125, 3.53759765625, 3.66131591796875, 3.7850341796875, 3.90875244140625, 4.032470703125, 4.15618896484375, 4.2799072265625, 4.40362548828125, 4.52734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 12.0, 19.0, 21.0, 47.0, 73.0, 177.0, 2163.0, 1151.0, 183.0, 76.0, 48.0, 24.0, 14.0, 11.0, 9.0, 8.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6484375, -1.60504150390625, -1.5616455078125, -1.51824951171875, -1.474853515625, -1.43145751953125, -1.3880615234375, -1.34466552734375, -1.30126953125, -1.25787353515625, -1.2144775390625, -1.17108154296875, -1.127685546875, -1.08428955078125, -1.0408935546875, -0.99749755859375, -0.9541015625, -0.91070556640625, -0.8673095703125, -0.82391357421875, -0.780517578125, -0.73712158203125, -0.6937255859375, -0.65032958984375, -0.60693359375, -0.56353759765625, -0.5201416015625, -0.47674560546875, -0.433349609375, -0.38995361328125, -0.3465576171875, -0.30316162109375, -0.259765625, -0.21636962890625, -0.1729736328125, -0.12957763671875, -0.086181640625, -0.04278564453125, 0.0006103515625, 0.04400634765625, 0.08740234375, 0.13079833984375, 0.1741943359375, 0.21759033203125, 0.260986328125, 0.30438232421875, 0.3477783203125, 0.39117431640625, 0.4345703125, 0.47796630859375, 0.5213623046875, 0.56475830078125, 0.608154296875, 0.65155029296875, 0.6949462890625, 0.73834228515625, 0.78173828125, 0.82513427734375, 0.8685302734375, 0.91192626953125, 0.955322265625, 0.99871826171875, 1.0421142578125, 1.08551025390625, 1.12890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 12.0, 12.0, 24.0, 54.0, 96.0, 130.0, 168.0, 165.0, 153.0, 88.0, 46.0, 22.0, 14.0, 8.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.149101257324219, -6.933737754821777, -6.718374729156494, -6.503011703491211, -6.2876482009887695, -6.072284698486328, -5.856921672821045, -5.641558647155762, -5.42619514465332, -5.210831642150879, -4.995468616485596, -4.7801055908203125, -4.564742088317871, -4.34937858581543, -4.1340155601501465, -3.918652296066284, -3.703289031982422, -3.4879257678985596, -3.2725625038146973, -3.057199239730835, -2.8418359756469727, -2.6264727115631104, -2.411109447479248, -2.1957461833953857, -1.9803829193115234, -1.7650196552276611, -1.5496563911437988, -1.3342931270599365, -1.1189298629760742, -0.9035665988922119, -0.6882033348083496, -0.4728400707244873, -0.257476806640625, -0.042113542556762695, 0.1732497215270996, 0.3886129856109619, 0.6039762496948242, 0.8193395137786865, 1.0347027778625488, 1.2500660419464111, 1.4654293060302734, 1.6807925701141357, 1.896155834197998, 2.1115190982818604, 2.3268823623657227, 2.542245626449585, 2.7576088905334473, 2.9729721546173096, 3.188335418701172, 3.403698682785034, 3.6190619468688965, 3.834425210952759, 4.049788475036621, 4.2651519775390625, 4.480515003204346, 4.695878028869629, 4.91124153137207, 5.126605033874512, 5.341968059539795, 5.557331085205078, 5.7726945877075195, 5.988058090209961, 6.203421115875244, 6.418784141540527, 6.634147644042969]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 8.0, 4.0, 7.0, 7.0, 12.0, 14.0, 18.0, 7.0, 19.0, 27.0, 25.0, 27.0, 31.0, 28.0, 23.0, 32.0, 39.0, 46.0, 41.0, 59.0, 37.0, 37.0, 40.0, 42.0, 34.0, 38.0, 42.0, 30.0, 28.0, 31.0, 17.0, 24.0, 22.0, 11.0, 18.0, 12.0, 15.0, 12.0, 5.0, 4.0, 10.0, 6.0, 0.0, 4.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.094663619995117, -2.0222008228302, -1.9497382640838623, -1.8772754669189453, -1.8048127889633179, -1.7323501110076904, -1.6598873138427734, -1.587424635887146, -1.5149619579315186, -1.4424992799758911, -1.3700366020202637, -1.2975738048553467, -1.2251111268997192, -1.1526484489440918, -1.0801856517791748, -1.0077229738235474, -0.9352602958679199, -0.8627976179122925, -0.7903348803520203, -0.717872142791748, -0.6454094648361206, -0.5729467868804932, -0.500484049320221, -0.42802131175994873, -0.3555586338043213, -0.28309592604637146, -0.21063321828842163, -0.1381705105304718, -0.06570780277252197, 0.0067549049854278564, 0.07921761274337769, 0.1516803503036499, 0.22414326667785645, 0.2966059744358063, 0.3690686821937561, 0.44153138995170593, 0.5139940977096558, 0.5864567756652832, 0.6589195132255554, 0.7313822507858276, 0.8038449287414551, 0.8763076066970825, 0.9487703442573547, 1.021233081817627, 1.0936957597732544, 1.1661584377288818, 1.2386212348937988, 1.3110839128494263, 1.3835465908050537, 1.4560092687606812, 1.5284719467163086, 1.6009347438812256, 1.673397421836853, 1.7458600997924805, 1.8183228969573975, 1.890785574913025, 1.9632482528686523, 2.0357110500335693, 2.1081736087799072, 2.180636405944824, 2.253098964691162, 2.325561761856079, 2.398024559020996, 2.470487117767334, 2.542949914932251]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 11.0, 11.0, 16.0, 19.0, 30.0, 61.0, 94.0, 198.0, 419.0, 946.0, 2509.0, 7862.0, 31455.0, 166840.0, 553316.0, 227493.0, 42124.0, 9924.0, 3039.0, 1189.0, 435.0, 231.0, 103.0, 60.0, 62.0, 34.0, 18.0, 20.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.30303955078125, -6.0240478515625, -5.74505615234375, -5.466064453125, -5.18707275390625, -4.9080810546875, -4.62908935546875, -4.35009765625, -4.07110595703125, -3.7921142578125, -3.51312255859375, -3.234130859375, -2.95513916015625, -2.6761474609375, -2.39715576171875, -2.1181640625, -1.83917236328125, -1.5601806640625, -1.28118896484375, -1.002197265625, -0.72320556640625, -0.4442138671875, -0.16522216796875, 0.11376953125, 0.39276123046875, 0.6717529296875, 0.95074462890625, 1.229736328125, 1.50872802734375, 1.7877197265625, 2.06671142578125, 2.345703125, 2.62469482421875, 2.9036865234375, 3.18267822265625, 3.461669921875, 3.74066162109375, 4.0196533203125, 4.29864501953125, 4.57763671875, 4.85662841796875, 5.1356201171875, 5.41461181640625, 5.693603515625, 5.97259521484375, 6.2515869140625, 6.53057861328125, 6.8095703125, 7.08856201171875, 7.3675537109375, 7.64654541015625, 7.925537109375, 8.20452880859375, 8.4835205078125, 8.76251220703125, 9.04150390625, 9.32049560546875, 9.5994873046875, 9.87847900390625, 10.157470703125, 10.43646240234375, 10.7154541015625, 10.99444580078125, 11.2734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 14.0, 10.0, 19.0, 17.0, 25.0, 31.0, 30.0, 45.0, 56.0, 62.0, 46.0, 58.0, 63.0, 78.0, 51.0, 57.0, 50.0, 38.0, 47.0, 34.0, 37.0, 23.0, 22.0, 19.0, 21.0, 15.0, 9.0, 6.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.4056396484375, -2.287841796875, -2.1700439453125, -2.05224609375, -1.9344482421875, -1.816650390625, -1.6988525390625, -1.5810546875, -1.4632568359375, -1.345458984375, -1.2276611328125, -1.10986328125, -0.9920654296875, -0.874267578125, -0.7564697265625, -0.638671875, -0.5208740234375, -0.403076171875, -0.2852783203125, -0.16748046875, -0.0496826171875, 0.068115234375, 0.1859130859375, 0.3037109375, 0.4215087890625, 0.539306640625, 0.6571044921875, 0.77490234375, 0.8927001953125, 1.010498046875, 1.1282958984375, 1.24609375, 1.3638916015625, 1.481689453125, 1.5994873046875, 1.71728515625, 1.8350830078125, 1.952880859375, 2.0706787109375, 2.1884765625, 2.3062744140625, 2.424072265625, 2.5418701171875, 2.65966796875, 2.7774658203125, 2.895263671875, 3.0130615234375, 3.130859375, 3.2486572265625, 3.366455078125, 3.4842529296875, 3.60205078125, 3.7198486328125, 3.837646484375, 3.9554443359375, 4.0732421875, 4.1910400390625, 4.308837890625, 4.4266357421875, 4.54443359375, 4.6622314453125, 4.780029296875, 4.8978271484375, 5.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 1.0, 5.0, 10.0, 12.0, 10.0, 19.0, 27.0, 25.0, 45.0, 54.0, 80.0, 161.0, 242.0, 419.0, 840.0, 2183.0, 8282.0, 64262.0, 759571.0, 189793.0, 16586.0, 3407.0, 1127.0, 497.0, 306.0, 197.0, 125.0, 87.0, 56.0, 31.0, 22.0, 18.0, 13.0, 8.0, 10.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.1246337890625, -13.678955078125, -13.2332763671875, -12.78759765625, -12.3419189453125, -11.896240234375, -11.4505615234375, -11.0048828125, -10.5592041015625, -10.113525390625, -9.6678466796875, -9.22216796875, -8.7764892578125, -8.330810546875, -7.8851318359375, -7.439453125, -6.9937744140625, -6.548095703125, -6.1024169921875, -5.65673828125, -5.2110595703125, -4.765380859375, -4.3197021484375, -3.8740234375, -3.4283447265625, -2.982666015625, -2.5369873046875, -2.09130859375, -1.6456298828125, -1.199951171875, -0.7542724609375, -0.30859375, 0.1370849609375, 0.582763671875, 1.0284423828125, 1.47412109375, 1.9197998046875, 2.365478515625, 2.8111572265625, 3.2568359375, 3.7025146484375, 4.148193359375, 4.5938720703125, 5.03955078125, 5.4852294921875, 5.930908203125, 6.3765869140625, 6.822265625, 7.2679443359375, 7.713623046875, 8.1593017578125, 8.60498046875, 9.0506591796875, 9.496337890625, 9.9420166015625, 10.3876953125, 10.8333740234375, 11.279052734375, 11.7247314453125, 12.17041015625, 12.6160888671875, 13.061767578125, 13.5074462890625, 13.953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 4.0, 9.0, 15.0, 18.0, 19.0, 21.0, 17.0, 32.0, 28.0, 20.0, 36.0, 33.0, 37.0, 51.0, 50.0, 56.0, 52.0, 51.0, 53.0, 48.0, 47.0, 36.0, 41.0, 25.0, 24.0, 26.0, 28.0, 14.0, 20.0, 9.0, 13.0, 4.0, 11.0, 3.0, 7.0, 10.0, 4.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.78125, -16.249267578125, -15.71728515625, -15.185302734375, -14.6533203125, -14.121337890625, -13.58935546875, -13.057373046875, -12.525390625, -11.993408203125, -11.46142578125, -10.929443359375, -10.3974609375, -9.865478515625, -9.33349609375, -8.801513671875, -8.26953125, -7.737548828125, -7.20556640625, -6.673583984375, -6.1416015625, -5.609619140625, -5.07763671875, -4.545654296875, -4.013671875, -3.481689453125, -2.94970703125, -2.417724609375, -1.8857421875, -1.353759765625, -0.82177734375, -0.289794921875, 0.2421875, 0.774169921875, 1.30615234375, 1.838134765625, 2.3701171875, 2.902099609375, 3.43408203125, 3.966064453125, 4.498046875, 5.030029296875, 5.56201171875, 6.093994140625, 6.6259765625, 7.157958984375, 7.68994140625, 8.221923828125, 8.75390625, 9.285888671875, 9.81787109375, 10.349853515625, 10.8818359375, 11.413818359375, 11.94580078125, 12.477783203125, 13.009765625, 13.541748046875, 14.07373046875, 14.605712890625, 15.1376953125, 15.669677734375, 16.20166015625, 16.733642578125, 17.265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 3.0, 11.0, 9.0, 8.0, 16.0, 31.0, 38.0, 64.0, 141.0, 303.0, 687.0, 2215.0, 14950.0, 386824.0, 615854.0, 23023.0, 2854.0, 836.0, 330.0, 148.0, 93.0, 38.0, 23.0, 15.0, 13.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.44293212890625, -4.2725830078125, -4.10223388671875, -3.931884765625, -3.76153564453125, -3.5911865234375, -3.42083740234375, -3.25048828125, -3.08013916015625, -2.9097900390625, -2.73944091796875, -2.569091796875, -2.39874267578125, -2.2283935546875, -2.05804443359375, -1.8876953125, -1.71734619140625, -1.5469970703125, -1.37664794921875, -1.206298828125, -1.03594970703125, -0.8656005859375, -0.69525146484375, -0.52490234375, -0.35455322265625, -0.1842041015625, -0.01385498046875, 0.156494140625, 0.32684326171875, 0.4971923828125, 0.66754150390625, 0.837890625, 1.00823974609375, 1.1785888671875, 1.34893798828125, 1.519287109375, 1.68963623046875, 1.8599853515625, 2.03033447265625, 2.20068359375, 2.37103271484375, 2.5413818359375, 2.71173095703125, 2.882080078125, 3.05242919921875, 3.2227783203125, 3.39312744140625, 3.5634765625, 3.73382568359375, 3.9041748046875, 4.07452392578125, 4.244873046875, 4.41522216796875, 4.5855712890625, 4.75592041015625, 4.92626953125, 5.09661865234375, 5.2669677734375, 5.43731689453125, 5.607666015625, 5.77801513671875, 5.9483642578125, 6.11871337890625, 6.2890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 11.0, 10.0, 11.0, 12.0, 23.0, 15.0, 30.0, 46.0, 54.0, 90.0, 90.0, 125.0, 106.0, 92.0, 71.0, 58.0, 39.0, 27.0, 25.0, 20.0, 13.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007715225219726562, -0.0007534585893154144, -0.0007353946566581726, -0.0007173307240009308, -0.000699266791343689, -0.0006812028586864471, -0.0006631389260292053, -0.0006450749933719635, -0.0006270110607147217, -0.0006089471280574799, -0.000590883195400238, -0.0005728192627429962, -0.0005547553300857544, -0.0005366913974285126, -0.0005186274647712708, -0.0005005635321140289, -0.0004824995994567871, -0.0004644356667995453, -0.00044637173414230347, -0.00042830780148506165, -0.0004102438688278198, -0.000392179936170578, -0.0003741160035133362, -0.00035605207085609436, -0.00033798813819885254, -0.0003199242055416107, -0.0003018602728843689, -0.0002837963402271271, -0.00026573240756988525, -0.00024766847491264343, -0.0002296045422554016, -0.0002115406095981598, -0.00019347667694091797, -0.00017541274428367615, -0.00015734881162643433, -0.0001392848789691925, -0.00012122094631195068, -0.00010315701365470886, -8.509308099746704e-05, -6.702914834022522e-05, -4.89652156829834e-05, -3.090128302574158e-05, -1.2837350368499756e-05, 5.2265822887420654e-06, 2.3290514945983887e-05, 4.135444760322571e-05, 5.941838026046753e-05, 7.748231291770935e-05, 9.554624557495117e-05, 0.00011361017823219299, 0.00013167411088943481, 0.00014973804354667664, 0.00016780197620391846, 0.00018586590886116028, 0.0002039298415184021, 0.00022199377417564392, 0.00024005770683288574, 0.00025812163949012756, 0.0002761855721473694, 0.0002942495048046112, 0.00031231343746185303, 0.00033037737011909485, 0.00034844130277633667, 0.0003665052354335785, 0.0003845691680908203]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 11.0, 13.0, 26.0, 30.0, 36.0, 55.0, 75.0, 149.0, 260.0, 547.0, 1226.0, 3954.0, 23196.0, 422914.0, 558599.0, 30202.0, 4506.0, 1402.0, 571.0, 285.0, 181.0, 83.0, 62.0, 43.0, 35.0, 23.0, 10.0, 9.0, 7.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.96124267578125, -3.8092041015625, -3.65716552734375, -3.505126953125, -3.35308837890625, -3.2010498046875, -3.04901123046875, -2.89697265625, -2.74493408203125, -2.5928955078125, -2.44085693359375, -2.288818359375, -2.13677978515625, -1.9847412109375, -1.83270263671875, -1.6806640625, -1.52862548828125, -1.3765869140625, -1.22454833984375, -1.072509765625, -0.92047119140625, -0.7684326171875, -0.61639404296875, -0.46435546875, -0.31231689453125, -0.1602783203125, -0.00823974609375, 0.143798828125, 0.29583740234375, 0.4478759765625, 0.59991455078125, 0.751953125, 0.90399169921875, 1.0560302734375, 1.20806884765625, 1.360107421875, 1.51214599609375, 1.6641845703125, 1.81622314453125, 1.96826171875, 2.12030029296875, 2.2723388671875, 2.42437744140625, 2.576416015625, 2.72845458984375, 2.8804931640625, 3.03253173828125, 3.1845703125, 3.33660888671875, 3.4886474609375, 3.64068603515625, 3.792724609375, 3.94476318359375, 4.0968017578125, 4.24884033203125, 4.40087890625, 4.55291748046875, 4.7049560546875, 4.85699462890625, 5.009033203125, 5.16107177734375, 5.3131103515625, 5.46514892578125, 5.6171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 19.0, 40.0, 33.0, 45.0, 72.0, 71.0, 94.0, 119.0, 116.0, 96.0, 68.0, 51.0, 29.0, 33.0, 26.0, 17.0, 11.0, 9.0, 9.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.499053955078125, -3.35162353515625, -3.204193115234375, -3.0567626953125, -2.909332275390625, -2.76190185546875, -2.614471435546875, -2.467041015625, -2.319610595703125, -2.17218017578125, -2.024749755859375, -1.8773193359375, -1.729888916015625, -1.58245849609375, -1.435028076171875, -1.28759765625, -1.140167236328125, -0.99273681640625, -0.845306396484375, -0.6978759765625, -0.550445556640625, -0.40301513671875, -0.255584716796875, -0.108154296875, 0.039276123046875, 0.18670654296875, 0.334136962890625, 0.4815673828125, 0.628997802734375, 0.77642822265625, 0.923858642578125, 1.0712890625, 1.218719482421875, 1.36614990234375, 1.513580322265625, 1.6610107421875, 1.808441162109375, 1.95587158203125, 2.103302001953125, 2.250732421875, 2.398162841796875, 2.54559326171875, 2.693023681640625, 2.8404541015625, 2.987884521484375, 3.13531494140625, 3.282745361328125, 3.43017578125, 3.577606201171875, 3.72503662109375, 3.872467041015625, 4.0198974609375, 4.167327880859375, 4.31475830078125, 4.462188720703125, 4.609619140625, 4.757049560546875, 4.90447998046875, 5.051910400390625, 5.1993408203125, 5.346771240234375, 5.49420166015625, 5.641632080078125, 5.7890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 53.0, 130.0, 362.0, 311.0, 103.0, 27.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.0185546875, -132.55633544921875, -128.0941162109375, -123.63188934326172, -119.16966247558594, -114.70744323730469, -110.24522399902344, -105.78300476074219, -101.3207778930664, -96.85855865478516, -92.39633178710938, -87.93411254882812, -83.47189331054688, -79.0096664428711, -74.54744720458984, -70.08522033691406, -65.62300109863281, -61.1607780456543, -56.69855499267578, -52.23633575439453, -47.774112701416016, -43.3118896484375, -38.84967041015625, -34.387447357177734, -29.92522430419922, -25.463001251220703, -21.00078010559082, -16.538558959960938, -12.076335906982422, -7.614112854003906, -3.1518917083740234, 1.3103294372558594, 5.7725677490234375, 10.234789848327637, 14.697011947631836, 19.15923309326172, 23.621456146240234, 28.08367919921875, 32.5458984375, 37.008121490478516, 41.47034454345703, 45.93256759643555, 50.39479064941406, 54.85700988769531, 59.31923294067383, 63.781455993652344, 68.2436752319336, 72.70590209960938, 77.16812133789062, 81.63034057617188, 86.09256744384766, 90.5547866821289, 95.01701354980469, 99.47923278808594, 103.94145202636719, 108.40367126464844, 112.86589813232422, 117.32811737060547, 121.79034423828125, 126.2525634765625, 130.71478271484375, 135.177001953125, 139.6392364501953, 144.10145568847656, 148.5636749267578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 5.0, 9.0, 7.0, 22.0, 19.0, 19.0, 25.0, 38.0, 37.0, 31.0, 39.0, 42.0, 48.0, 55.0, 50.0, 42.0, 71.0, 48.0, 45.0, 30.0, 39.0, 42.0, 48.0, 34.0, 27.0, 24.0, 17.0, 15.0, 10.0, 11.0, 10.0, 7.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.19019317626953, -73.91445922851562, -71.63872528076172, -69.36299133300781, -67.0872573852539, -64.8115234375, -62.53578567504883, -60.26005172729492, -57.984317779541016, -55.70858383178711, -53.4328498840332, -51.1571159362793, -48.881378173828125, -46.60564422607422, -44.32991027832031, -42.054176330566406, -39.7784423828125, -37.502708435058594, -35.22697448730469, -32.95124053955078, -30.675504684448242, -28.399770736694336, -26.124034881591797, -23.84830093383789, -21.572566986083984, -19.296833038330078, -17.021099090576172, -14.745363235473633, -12.469629287719727, -10.19389533996582, -7.918160438537598, -5.642425537109375, -3.3666839599609375, -1.090949535369873, 1.1847848892211914, 3.460519313812256, 5.73625373840332, 8.011987686157227, 10.28772258758545, 12.563457489013672, 14.839191436767578, 17.114925384521484, 19.39065933227539, 21.66639518737793, 23.942129135131836, 26.217863082885742, 28.49359893798828, 30.769332885742188, 33.045066833496094, 35.32080078125, 37.596534729003906, 39.87226867675781, 42.14800262451172, 44.423736572265625, 46.6994743347168, 48.9752082824707, 51.25094223022461, 53.526676177978516, 55.80241012573242, 58.07814407348633, 60.3538818359375, 62.629615783691406, 64.90534973144531, 67.18108367919922, 69.45681762695312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 10.0, 9.0, 12.0, 12.0, 22.0, 40.0, 59.0, 98.0, 175.0, 289.0, 509.0, 862.0, 1675.0, 3721.0, 8979.0, 26656.0, 118455.0, 3732405.0, 238306.0, 39994.0, 12294.0, 4768.0, 2264.0, 1147.0, 622.0, 327.0, 200.0, 125.0, 79.0, 45.0, 37.0, 31.0, 13.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.689453125, -3.569122314453125, -3.44879150390625, -3.328460693359375, -3.2081298828125, -3.087799072265625, -2.96746826171875, -2.847137451171875, -2.726806640625, -2.606475830078125, -2.48614501953125, -2.365814208984375, -2.2454833984375, -2.125152587890625, -2.00482177734375, -1.884490966796875, -1.76416015625, -1.643829345703125, -1.52349853515625, -1.403167724609375, -1.2828369140625, -1.162506103515625, -1.04217529296875, -0.921844482421875, -0.801513671875, -0.681182861328125, -0.56085205078125, -0.440521240234375, -0.3201904296875, -0.199859619140625, -0.07952880859375, 0.040802001953125, 0.1611328125, 0.281463623046875, 0.40179443359375, 0.522125244140625, 0.6424560546875, 0.762786865234375, 0.88311767578125, 1.003448486328125, 1.123779296875, 1.244110107421875, 1.36444091796875, 1.484771728515625, 1.6051025390625, 1.725433349609375, 1.84576416015625, 1.966094970703125, 2.08642578125, 2.206756591796875, 2.32708740234375, 2.447418212890625, 2.5677490234375, 2.688079833984375, 2.80841064453125, 2.928741455078125, 3.049072265625, 3.169403076171875, 3.28973388671875, 3.410064697265625, 3.5303955078125, 3.650726318359375, 3.77105712890625, 3.891387939453125, 4.01171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 10.0, 7.0, 12.0, 3.0, 16.0, 13.0, 20.0, 24.0, 27.0, 24.0, 33.0, 31.0, 29.0, 34.0, 44.0, 36.0, 48.0, 32.0, 37.0, 49.0, 54.0, 35.0, 32.0, 36.0, 30.0, 29.0, 32.0, 30.0, 21.0, 27.0, 19.0, 19.0, 14.0, 17.0, 15.0, 12.0, 12.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.484375, -2.401214599609375, -2.31805419921875, -2.234893798828125, -2.1517333984375, -2.068572998046875, -1.98541259765625, -1.902252197265625, -1.819091796875, -1.735931396484375, -1.65277099609375, -1.569610595703125, -1.4864501953125, -1.403289794921875, -1.32012939453125, -1.236968994140625, -1.15380859375, -1.070648193359375, -0.98748779296875, -0.904327392578125, -0.8211669921875, -0.738006591796875, -0.65484619140625, -0.571685791015625, -0.488525390625, -0.405364990234375, -0.32220458984375, -0.239044189453125, -0.1558837890625, -0.072723388671875, 0.01043701171875, 0.093597412109375, 0.1767578125, 0.259918212890625, 0.34307861328125, 0.426239013671875, 0.5093994140625, 0.592559814453125, 0.67572021484375, 0.758880615234375, 0.842041015625, 0.925201416015625, 1.00836181640625, 1.091522216796875, 1.1746826171875, 1.257843017578125, 1.34100341796875, 1.424163818359375, 1.50732421875, 1.590484619140625, 1.67364501953125, 1.756805419921875, 1.8399658203125, 1.923126220703125, 2.00628662109375, 2.089447021484375, 2.172607421875, 2.255767822265625, 2.33892822265625, 2.422088623046875, 2.5052490234375, 2.588409423828125, 2.67156982421875, 2.754730224609375, 2.837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 10.0, 9.0, 12.0, 13.0, 18.0, 22.0, 34.0, 41.0, 76.0, 89.0, 132.0, 181.0, 315.0, 465.0, 783.0, 1398.0, 2442.0, 4476.0, 8882.0, 20049.0, 54710.0, 258783.0, 3544083.0, 211785.0, 49222.0, 18240.0, 8134.0, 4110.0, 2272.0, 1321.0, 773.0, 474.0, 274.0, 214.0, 129.0, 94.0, 61.0, 47.0, 33.0, 25.0, 14.0, 15.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.162109375, -3.064666748046875, -2.96722412109375, -2.869781494140625, -2.7723388671875, -2.674896240234375, -2.57745361328125, -2.480010986328125, -2.382568359375, -2.285125732421875, -2.18768310546875, -2.090240478515625, -1.9927978515625, -1.895355224609375, -1.79791259765625, -1.700469970703125, -1.60302734375, -1.505584716796875, -1.40814208984375, -1.310699462890625, -1.2132568359375, -1.115814208984375, -1.01837158203125, -0.920928955078125, -0.823486328125, -0.726043701171875, -0.62860107421875, -0.531158447265625, -0.4337158203125, -0.336273193359375, -0.23883056640625, -0.141387939453125, -0.0439453125, 0.053497314453125, 0.15093994140625, 0.248382568359375, 0.3458251953125, 0.443267822265625, 0.54071044921875, 0.638153076171875, 0.735595703125, 0.833038330078125, 0.93048095703125, 1.027923583984375, 1.1253662109375, 1.222808837890625, 1.32025146484375, 1.417694091796875, 1.51513671875, 1.612579345703125, 1.71002197265625, 1.807464599609375, 1.9049072265625, 2.002349853515625, 2.09979248046875, 2.197235107421875, 2.294677734375, 2.392120361328125, 2.48956298828125, 2.587005615234375, 2.6844482421875, 2.781890869140625, 2.87933349609375, 2.976776123046875, 3.07421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 12.0, 15.0, 19.0, 30.0, 40.0, 73.0, 183.0, 703.0, 2512.0, 228.0, 111.0, 41.0, 33.0, 17.0, 10.0, 15.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.911651611328125, -1.86627197265625, -1.820892333984375, -1.7755126953125, -1.730133056640625, -1.68475341796875, -1.639373779296875, -1.593994140625, -1.548614501953125, -1.50323486328125, -1.457855224609375, -1.4124755859375, -1.367095947265625, -1.32171630859375, -1.276336669921875, -1.23095703125, -1.185577392578125, -1.14019775390625, -1.094818115234375, -1.0494384765625, -1.004058837890625, -0.95867919921875, -0.913299560546875, -0.867919921875, -0.822540283203125, -0.77716064453125, -0.731781005859375, -0.6864013671875, -0.641021728515625, -0.59564208984375, -0.550262451171875, -0.5048828125, -0.459503173828125, -0.41412353515625, -0.368743896484375, -0.3233642578125, -0.277984619140625, -0.23260498046875, -0.187225341796875, -0.141845703125, -0.096466064453125, -0.05108642578125, -0.005706787109375, 0.0396728515625, 0.085052490234375, 0.13043212890625, 0.175811767578125, 0.22119140625, 0.266571044921875, 0.31195068359375, 0.357330322265625, 0.4027099609375, 0.448089599609375, 0.49346923828125, 0.538848876953125, 0.584228515625, 0.629608154296875, 0.67498779296875, 0.720367431640625, 0.7657470703125, 0.811126708984375, 0.85650634765625, 0.901885986328125, 0.947265625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 10.0, 7.0, 13.0, 34.0, 51.0, 57.0, 95.0, 122.0, 163.0, 141.0, 128.0, 75.0, 56.0, 28.0, 7.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.655675888061523, -7.4546966552734375, -7.253717422485352, -7.052738189697266, -6.851759433746338, -6.650780200958252, -6.449800968170166, -6.24882173538208, -6.047842502593994, -5.846863269805908, -5.645884037017822, -5.4449052810668945, -5.243926048278809, -5.042946815490723, -4.841967582702637, -4.640988349914551, -4.440009117126465, -4.239029884338379, -4.038050651550293, -3.837071657180786, -3.6360924243927, -3.4351134300231934, -3.2341341972351074, -3.0331549644470215, -2.8321762084960938, -2.631196975708008, -2.430217981338501, -2.229238748550415, -2.028259515762329, -1.8272804021835327, -1.6263012886047363, -1.4253220558166504, -1.2243428230285645, -1.023363709449768, -0.8223844766616821, -0.6214053630828857, -0.4204261898994446, -0.21944701671600342, -0.01846790313720703, 0.1825113296508789, 0.3834904432296753, 0.5844696164131165, 0.7854487895965576, 0.986427903175354, 1.1874070167541504, 1.3883862495422363, 1.5893653631210327, 1.7903445959091187, 1.991323709487915, 2.192302942276001, 2.393281936645508, 2.5942611694335938, 2.7952404022216797, 2.9962196350097656, 3.1971986293792725, 3.3981778621673584, 3.5991568565368652, 3.800136089324951, 4.001115322113037, 4.202094078063965, 4.403073310852051, 4.604052543640137, 4.805031776428223, 5.006011009216309, 5.2069902420043945]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 13.0, 26.0, 27.0, 22.0, 34.0, 46.0, 44.0, 59.0, 54.0, 53.0, 62.0, 63.0, 53.0, 73.0, 68.0, 71.0, 38.0, 40.0, 28.0, 30.0, 25.0, 16.0, 10.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.664700984954834, -5.522928237915039, -5.381155967712402, -5.239383220672607, -5.097610950469971, -4.955838203430176, -4.814065933227539, -4.672293186187744, -4.530520439147949, -4.388747692108154, -4.246975421905518, -4.105202674865723, -3.963430166244507, -3.821657657623291, -3.679885149002075, -3.5381126403808594, -3.3963401317596436, -3.2545676231384277, -3.112795114517212, -2.971022605895996, -2.829249858856201, -2.6874773502349854, -2.5457048416137695, -2.4039323329925537, -2.262159824371338, -2.120387315750122, -1.9786146879196167, -1.8368421792984009, -1.6950695514678955, -1.5532970428466797, -1.4115245342254639, -1.269752025604248, -1.1279792785644531, -0.9862067103385925, -0.8444341421127319, -0.7026616334915161, -0.5608890652656555, -0.4191164970397949, -0.2773439884185791, -0.1355714201927185, 0.00620114803314209, 0.1479737013578415, 0.2897462546825409, 0.4315187931060791, 0.5732913613319397, 0.7150639295578003, 0.8568364381790161, 0.9986090064048767, 1.1403815746307373, 1.2821540832519531, 1.4239267110824585, 1.5656992197036743, 1.7074718475341797, 1.8492443561553955, 1.9910168647766113, 2.132789373397827, 2.274561882019043, 2.416334390640259, 2.5581068992614746, 2.6998796463012695, 2.8416521549224854, 2.983424663543701, 3.125197172164917, 3.266969680786133, 3.4087424278259277]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 8.0, 11.0, 16.0, 15.0, 25.0, 33.0, 85.0, 86.0, 158.0, 282.0, 499.0, 1034.0, 2209.0, 5433.0, 14886.0, 44695.0, 143671.0, 356295.0, 311995.0, 112119.0, 34800.0, 11818.0, 4486.0, 1953.0, 865.0, 441.0, 225.0, 148.0, 74.0, 51.0, 44.0, 36.0, 16.0, 7.0, 11.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.11328125, -4.96673583984375, -4.8201904296875, -4.67364501953125, -4.527099609375, -4.38055419921875, -4.2340087890625, -4.08746337890625, -3.94091796875, -3.79437255859375, -3.6478271484375, -3.50128173828125, -3.354736328125, -3.20819091796875, -3.0616455078125, -2.91510009765625, -2.7685546875, -2.62200927734375, -2.4754638671875, -2.32891845703125, -2.182373046875, -2.03582763671875, -1.8892822265625, -1.74273681640625, -1.59619140625, -1.44964599609375, -1.3031005859375, -1.15655517578125, -1.010009765625, -0.86346435546875, -0.7169189453125, -0.57037353515625, -0.423828125, -0.27728271484375, -0.1307373046875, 0.01580810546875, 0.162353515625, 0.30889892578125, 0.4554443359375, 0.60198974609375, 0.74853515625, 0.89508056640625, 1.0416259765625, 1.18817138671875, 1.334716796875, 1.48126220703125, 1.6278076171875, 1.77435302734375, 1.9208984375, 2.06744384765625, 2.2139892578125, 2.36053466796875, 2.507080078125, 2.65362548828125, 2.8001708984375, 2.94671630859375, 3.09326171875, 3.23980712890625, 3.3863525390625, 3.53289794921875, 3.679443359375, 3.82598876953125, 3.9725341796875, 4.11907958984375, 4.265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 6.0, 7.0, 10.0, 15.0, 13.0, 19.0, 23.0, 26.0, 23.0, 33.0, 48.0, 33.0, 36.0, 49.0, 49.0, 49.0, 46.0, 40.0, 43.0, 40.0, 45.0, 39.0, 33.0, 36.0, 31.0, 37.0, 18.0, 23.0, 15.0, 16.0, 20.0, 17.0, 13.0, 10.0, 6.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.48687744140625, -2.3956298828125, -2.30438232421875, -2.213134765625, -2.12188720703125, -2.0306396484375, -1.93939208984375, -1.84814453125, -1.75689697265625, -1.6656494140625, -1.57440185546875, -1.483154296875, -1.39190673828125, -1.3006591796875, -1.20941162109375, -1.1181640625, -1.02691650390625, -0.9356689453125, -0.84442138671875, -0.753173828125, -0.66192626953125, -0.5706787109375, -0.47943115234375, -0.38818359375, -0.29693603515625, -0.2056884765625, -0.11444091796875, -0.023193359375, 0.06805419921875, 0.1593017578125, 0.25054931640625, 0.341796875, 0.43304443359375, 0.5242919921875, 0.61553955078125, 0.706787109375, 0.79803466796875, 0.8892822265625, 0.98052978515625, 1.07177734375, 1.16302490234375, 1.2542724609375, 1.34552001953125, 1.436767578125, 1.52801513671875, 1.6192626953125, 1.71051025390625, 1.8017578125, 1.89300537109375, 1.9842529296875, 2.07550048828125, 2.166748046875, 2.25799560546875, 2.3492431640625, 2.44049072265625, 2.53173828125, 2.62298583984375, 2.7142333984375, 2.80548095703125, 2.896728515625, 2.98797607421875, 3.0792236328125, 3.17047119140625, 3.26171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 13.0, 13.0, 17.0, 26.0, 31.0, 69.0, 74.0, 130.0, 163.0, 328.0, 579.0, 1241.0, 3257.0, 16100.0, 224133.0, 738858.0, 52694.0, 6901.0, 1885.0, 861.0, 424.0, 244.0, 157.0, 97.0, 66.0, 47.0, 36.0, 23.0, 18.0, 16.0, 9.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.17919921875, -9.8427734375, -9.50634765625, -9.169921875, -8.83349609375, -8.4970703125, -8.16064453125, -7.82421875, -7.48779296875, -7.1513671875, -6.81494140625, -6.478515625, -6.14208984375, -5.8056640625, -5.46923828125, -5.1328125, -4.79638671875, -4.4599609375, -4.12353515625, -3.787109375, -3.45068359375, -3.1142578125, -2.77783203125, -2.44140625, -2.10498046875, -1.7685546875, -1.43212890625, -1.095703125, -0.75927734375, -0.4228515625, -0.08642578125, 0.25, 0.58642578125, 0.9228515625, 1.25927734375, 1.595703125, 1.93212890625, 2.2685546875, 2.60498046875, 2.94140625, 3.27783203125, 3.6142578125, 3.95068359375, 4.287109375, 4.62353515625, 4.9599609375, 5.29638671875, 5.6328125, 5.96923828125, 6.3056640625, 6.64208984375, 6.978515625, 7.31494140625, 7.6513671875, 7.98779296875, 8.32421875, 8.66064453125, 8.9970703125, 9.33349609375, 9.669921875, 10.00634765625, 10.3427734375, 10.67919921875, 11.015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 10.0, 15.0, 15.0, 18.0, 16.0, 19.0, 28.0, 40.0, 33.0, 46.0, 43.0, 48.0, 57.0, 65.0, 52.0, 64.0, 56.0, 45.0, 36.0, 44.0, 28.0, 37.0, 33.0, 25.0, 22.0, 18.0, 9.0, 12.0, 9.0, 9.0, 5.0, 3.0, 6.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-17.203125, -16.72119140625, -16.2392578125, -15.75732421875, -15.275390625, -14.79345703125, -14.3115234375, -13.82958984375, -13.34765625, -12.86572265625, -12.3837890625, -11.90185546875, -11.419921875, -10.93798828125, -10.4560546875, -9.97412109375, -9.4921875, -9.01025390625, -8.5283203125, -8.04638671875, -7.564453125, -7.08251953125, -6.6005859375, -6.11865234375, -5.63671875, -5.15478515625, -4.6728515625, -4.19091796875, -3.708984375, -3.22705078125, -2.7451171875, -2.26318359375, -1.78125, -1.29931640625, -0.8173828125, -0.33544921875, 0.146484375, 0.62841796875, 1.1103515625, 1.59228515625, 2.07421875, 2.55615234375, 3.0380859375, 3.52001953125, 4.001953125, 4.48388671875, 4.9658203125, 5.44775390625, 5.9296875, 6.41162109375, 6.8935546875, 7.37548828125, 7.857421875, 8.33935546875, 8.8212890625, 9.30322265625, 9.78515625, 10.26708984375, 10.7490234375, 11.23095703125, 11.712890625, 12.19482421875, 12.6767578125, 13.15869140625, 13.640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 11.0, 6.0, 12.0, 23.0, 28.0, 38.0, 72.0, 106.0, 206.0, 372.0, 800.0, 2967.0, 28099.0, 799720.0, 204808.0, 8530.0, 1546.0, 566.0, 244.0, 161.0, 84.0, 57.0, 40.0, 18.0, 19.0, 11.0, 9.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.90655517578125, -3.7271728515625, -3.54779052734375, -3.368408203125, -3.18902587890625, -3.0096435546875, -2.83026123046875, -2.65087890625, -2.47149658203125, -2.2921142578125, -2.11273193359375, -1.933349609375, -1.75396728515625, -1.5745849609375, -1.39520263671875, -1.2158203125, -1.03643798828125, -0.8570556640625, -0.67767333984375, -0.498291015625, -0.31890869140625, -0.1395263671875, 0.03985595703125, 0.21923828125, 0.39862060546875, 0.5780029296875, 0.75738525390625, 0.936767578125, 1.11614990234375, 1.2955322265625, 1.47491455078125, 1.654296875, 1.83367919921875, 2.0130615234375, 2.19244384765625, 2.371826171875, 2.55120849609375, 2.7305908203125, 2.90997314453125, 3.08935546875, 3.26873779296875, 3.4481201171875, 3.62750244140625, 3.806884765625, 3.98626708984375, 4.1656494140625, 4.34503173828125, 4.5244140625, 4.70379638671875, 4.8831787109375, 5.06256103515625, 5.241943359375, 5.42132568359375, 5.6007080078125, 5.78009033203125, 5.95947265625, 6.13885498046875, 6.3182373046875, 6.49761962890625, 6.677001953125, 6.85638427734375, 7.0357666015625, 7.21514892578125, 7.39453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 6.0, 6.0, 12.0, 12.0, 28.0, 25.0, 31.0, 29.0, 53.0, 62.0, 63.0, 77.0, 84.0, 71.0, 61.0, 54.0, 63.0, 35.0, 34.0, 34.0, 19.0, 25.0, 25.0, 15.0, 2.0, 7.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00036525726318359375, -0.0003535449504852295, -0.00034183263778686523, -0.000330120325088501, -0.0003184080123901367, -0.00030669569969177246, -0.0002949833869934082, -0.00028327107429504395, -0.0002715587615966797, -0.00025984644889831543, -0.00024813413619995117, -0.00023642182350158691, -0.00022470951080322266, -0.0002129971981048584, -0.00020128488540649414, -0.00018957257270812988, -0.00017786026000976562, -0.00016614794731140137, -0.0001544356346130371, -0.00014272332191467285, -0.0001310110092163086, -0.00011929869651794434, -0.00010758638381958008, -9.587407112121582e-05, -8.416175842285156e-05, -7.24494457244873e-05, -6.073713302612305e-05, -4.902482032775879e-05, -3.731250762939453e-05, -2.5600194931030273e-05, -1.3887882232666016e-05, -2.175569534301758e-06, 9.5367431640625e-06, 2.1249055862426758e-05, 3.2961368560791016e-05, 4.4673681259155273e-05, 5.638599395751953e-05, 6.809830665588379e-05, 7.981061935424805e-05, 9.15229320526123e-05, 0.00010323524475097656, 0.00011494755744934082, 0.00012665987014770508, 0.00013837218284606934, 0.0001500844955444336, 0.00016179680824279785, 0.0001735091209411621, 0.00018522143363952637, 0.00019693374633789062, 0.00020864605903625488, 0.00022035837173461914, 0.0002320706844329834, 0.00024378299713134766, 0.0002554953098297119, 0.00026720762252807617, 0.00027891993522644043, 0.0002906322479248047, 0.00030234456062316895, 0.0003140568733215332, 0.00032576918601989746, 0.0003374814987182617, 0.000349193811416626, 0.00036090612411499023, 0.0003726184368133545, 0.00038433074951171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 6.0, 10.0, 19.0, 29.0, 42.0, 89.0, 164.0, 370.0, 1112.0, 5360.0, 124879.0, 892163.0, 20690.0, 2468.0, 617.0, 265.0, 114.0, 62.0, 38.0, 18.0, 18.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65234375, -6.41705322265625, -6.1817626953125, -5.94647216796875, -5.711181640625, -5.47589111328125, -5.2406005859375, -5.00531005859375, -4.77001953125, -4.53472900390625, -4.2994384765625, -4.06414794921875, -3.828857421875, -3.59356689453125, -3.3582763671875, -3.12298583984375, -2.8876953125, -2.65240478515625, -2.4171142578125, -2.18182373046875, -1.946533203125, -1.71124267578125, -1.4759521484375, -1.24066162109375, -1.00537109375, -0.77008056640625, -0.5347900390625, -0.29949951171875, -0.064208984375, 0.17108154296875, 0.4063720703125, 0.64166259765625, 0.876953125, 1.11224365234375, 1.3475341796875, 1.58282470703125, 1.818115234375, 2.05340576171875, 2.2886962890625, 2.52398681640625, 2.75927734375, 2.99456787109375, 3.2298583984375, 3.46514892578125, 3.700439453125, 3.93572998046875, 4.1710205078125, 4.40631103515625, 4.6416015625, 4.87689208984375, 5.1121826171875, 5.34747314453125, 5.582763671875, 5.81805419921875, 6.0533447265625, 6.28863525390625, 6.52392578125, 6.75921630859375, 6.9945068359375, 7.22979736328125, 7.465087890625, 7.70037841796875, 7.9356689453125, 8.17095947265625, 8.40625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 10.0, 11.0, 16.0, 36.0, 94.0, 156.0, 209.0, 223.0, 129.0, 55.0, 30.0, 18.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.91302490234375, -10.6463623046875, -10.37969970703125, -10.113037109375, -9.84637451171875, -9.5797119140625, -9.31304931640625, -9.04638671875, -8.77972412109375, -8.5130615234375, -8.24639892578125, -7.979736328125, -7.71307373046875, -7.4464111328125, -7.17974853515625, -6.9130859375, -6.64642333984375, -6.3797607421875, -6.11309814453125, -5.846435546875, -5.57977294921875, -5.3131103515625, -5.04644775390625, -4.77978515625, -4.51312255859375, -4.2464599609375, -3.97979736328125, -3.713134765625, -3.44647216796875, -3.1798095703125, -2.91314697265625, -2.646484375, -2.37982177734375, -2.1131591796875, -1.84649658203125, -1.579833984375, -1.31317138671875, -1.0465087890625, -0.77984619140625, -0.51318359375, -0.24652099609375, 0.0201416015625, 0.28680419921875, 0.553466796875, 0.82012939453125, 1.0867919921875, 1.35345458984375, 1.6201171875, 1.88677978515625, 2.1534423828125, 2.42010498046875, 2.686767578125, 2.95343017578125, 3.2200927734375, 3.48675537109375, 3.75341796875, 4.02008056640625, 4.2867431640625, 4.55340576171875, 4.820068359375, 5.08673095703125, 5.3533935546875, 5.62005615234375, 5.88671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 9.0, 24.0, 50.0, 219.0, 439.0, 206.0, 40.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.6992950439453, -156.8820343017578, -152.06478881835938, -147.24752807617188, -142.43026733398438, -137.61302185058594, -132.79576110839844, -127.97850799560547, -123.1612548828125, -118.34400177001953, -113.52674865722656, -108.70948791503906, -103.8922348022461, -99.07498168945312, -94.25772094726562, -89.44046783447266, -84.62321472167969, -79.80596160888672, -74.98870849609375, -70.17144775390625, -65.35419464111328, -60.53694152832031, -55.71968460083008, -50.902427673339844, -46.085174560546875, -41.267921447753906, -36.45066452026367, -31.63340950012207, -26.81615447998047, -21.998899459838867, -17.181644439697266, -12.364387512207031, -7.547149658203125, -2.7298946380615234, 2.087360382080078, 6.90461540222168, 11.721870422363281, 16.539125442504883, 21.356380462646484, 26.17363739013672, 30.990890502929688, 35.808143615722656, 40.62540054321289, 45.442657470703125, 50.259910583496094, 55.07716369628906, 59.8944206237793, 64.71167755126953, 69.5289306640625, 74.34618377685547, 79.16343688964844, 83.98069763183594, 88.7979507446289, 93.61520385742188, 98.43246459960938, 103.24971771240234, 108.06697082519531, 112.88422393798828, 117.70147705078125, 122.51873779296875, 127.33599090576172, 132.1532440185547, 136.9705047607422, 141.78775024414062, 146.60501098632812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 8.0, 10.0, 8.0, 16.0, 10.0, 8.0, 18.0, 20.0, 35.0, 32.0, 35.0, 32.0, 46.0, 54.0, 44.0, 59.0, 56.0, 46.0, 47.0, 49.0, 44.0, 43.0, 42.0, 34.0, 32.0, 28.0, 30.0, 21.0, 14.0, 18.0, 10.0, 9.0, 5.0, 9.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.63883209228516, -62.67627716064453, -60.71372604370117, -58.75117111206055, -56.78861999511719, -54.82606506347656, -52.8635139465332, -50.90095901489258, -48.93840789794922, -46.975852966308594, -45.013301849365234, -43.05074691772461, -41.08819580078125, -39.125640869140625, -37.163089752197266, -35.20053482055664, -33.23798370361328, -31.27543067932129, -29.312877655029297, -27.350324630737305, -25.387771606445312, -23.425216674804688, -21.462665557861328, -19.500110626220703, -17.537555694580078, -15.575002670288086, -13.612449645996094, -11.649896621704102, -9.68734359741211, -7.724789619445801, -5.762236595153809, -3.7996835708618164, -1.8371315002441406, 0.1254216432571411, 2.087974786758423, 4.050528049468994, 6.013081073760986, 7.975634574890137, 9.938187599182129, 11.900740623474121, 13.863293647766113, 15.825846672058105, 17.788400650024414, 19.750953674316406, 21.7135066986084, 23.67605972290039, 25.638612747192383, 27.601165771484375, 29.563718795776367, 31.52627182006836, 33.488826751708984, 35.451377868652344, 37.41393280029297, 39.37648391723633, 41.33903884887695, 43.30158996582031, 45.26414489746094, 47.22669982910156, 49.18925094604492, 51.15180587768555, 53.114356994628906, 55.07691192626953, 57.03946304321289, 59.002017974853516, 60.964569091796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 13.0, 23.0, 27.0, 32.0, 69.0, 138.0, 194.0, 396.0, 737.0, 1492.0, 3486.0, 9320.0, 33457.0, 258557.0, 3806590.0, 57198.0, 13662.0, 4792.0, 1990.0, 889.0, 546.0, 231.0, 161.0, 93.0, 61.0, 33.0, 22.0, 23.0, 13.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.650390625, -3.510894775390625, -3.37139892578125, -3.231903076171875, -3.0924072265625, -2.952911376953125, -2.81341552734375, -2.673919677734375, -2.534423828125, -2.394927978515625, -2.25543212890625, -2.115936279296875, -1.9764404296875, -1.836944580078125, -1.69744873046875, -1.557952880859375, -1.41845703125, -1.278961181640625, -1.13946533203125, -0.999969482421875, -0.8604736328125, -0.720977783203125, -0.58148193359375, -0.441986083984375, -0.302490234375, -0.162994384765625, -0.02349853515625, 0.115997314453125, 0.2554931640625, 0.394989013671875, 0.53448486328125, 0.673980712890625, 0.8134765625, 0.952972412109375, 1.09246826171875, 1.231964111328125, 1.3714599609375, 1.510955810546875, 1.65045166015625, 1.789947509765625, 1.929443359375, 2.068939208984375, 2.20843505859375, 2.347930908203125, 2.4874267578125, 2.626922607421875, 2.76641845703125, 2.905914306640625, 3.04541015625, 3.184906005859375, 3.32440185546875, 3.463897705078125, 3.6033935546875, 3.742889404296875, 3.88238525390625, 4.021881103515625, 4.161376953125, 4.300872802734375, 4.44036865234375, 4.579864501953125, 4.7193603515625, 4.858856201171875, 4.99835205078125, 5.137847900390625, 5.27734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 8.0, 7.0, 15.0, 18.0, 16.0, 17.0, 25.0, 25.0, 24.0, 40.0, 38.0, 44.0, 48.0, 49.0, 51.0, 56.0, 55.0, 41.0, 51.0, 31.0, 46.0, 36.0, 30.0, 39.0, 17.0, 29.0, 28.0, 10.0, 14.0, 19.0, 13.0, 10.0, 10.0, 6.0, 3.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.77935791015625, -2.6837158203125, -2.58807373046875, -2.492431640625, -2.39678955078125, -2.3011474609375, -2.20550537109375, -2.10986328125, -2.01422119140625, -1.9185791015625, -1.82293701171875, -1.727294921875, -1.63165283203125, -1.5360107421875, -1.44036865234375, -1.3447265625, -1.24908447265625, -1.1534423828125, -1.05780029296875, -0.962158203125, -0.86651611328125, -0.7708740234375, -0.67523193359375, -0.57958984375, -0.48394775390625, -0.3883056640625, -0.29266357421875, -0.197021484375, -0.10137939453125, -0.0057373046875, 0.08990478515625, 0.185546875, 0.28118896484375, 0.3768310546875, 0.47247314453125, 0.568115234375, 0.66375732421875, 0.7593994140625, 0.85504150390625, 0.95068359375, 1.04632568359375, 1.1419677734375, 1.23760986328125, 1.333251953125, 1.42889404296875, 1.5245361328125, 1.62017822265625, 1.7158203125, 1.81146240234375, 1.9071044921875, 2.00274658203125, 2.098388671875, 2.19403076171875, 2.2896728515625, 2.38531494140625, 2.48095703125, 2.57659912109375, 2.6722412109375, 2.76788330078125, 2.863525390625, 2.95916748046875, 3.0548095703125, 3.15045166015625, 3.24609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 14.0, 13.0, 12.0, 19.0, 31.0, 48.0, 87.0, 130.0, 226.0, 364.0, 538.0, 883.0, 1656.0, 3331.0, 7141.0, 17625.0, 62910.0, 3071050.0, 936630.0, 60195.0, 17364.0, 6891.0, 3223.0, 1660.0, 882.0, 522.0, 317.0, 211.0, 121.0, 64.0, 39.0, 35.0, 12.0, 14.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.93798828125, -2.8330078125, -2.72802734375, -2.623046875, -2.51806640625, -2.4130859375, -2.30810546875, -2.203125, -2.09814453125, -1.9931640625, -1.88818359375, -1.783203125, -1.67822265625, -1.5732421875, -1.46826171875, -1.36328125, -1.25830078125, -1.1533203125, -1.04833984375, -0.943359375, -0.83837890625, -0.7333984375, -0.62841796875, -0.5234375, -0.41845703125, -0.3134765625, -0.20849609375, -0.103515625, 0.00146484375, 0.1064453125, 0.21142578125, 0.31640625, 0.42138671875, 0.5263671875, 0.63134765625, 0.736328125, 0.84130859375, 0.9462890625, 1.05126953125, 1.15625, 1.26123046875, 1.3662109375, 1.47119140625, 1.576171875, 1.68115234375, 1.7861328125, 1.89111328125, 1.99609375, 2.10107421875, 2.2060546875, 2.31103515625, 2.416015625, 2.52099609375, 2.6259765625, 2.73095703125, 2.8359375, 2.94091796875, 3.0458984375, 3.15087890625, 3.255859375, 3.36083984375, 3.4658203125, 3.57080078125, 3.67578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 16.0, 6.0, 21.0, 38.0, 73.0, 109.0, 293.0, 2961.0, 266.0, 101.0, 47.0, 27.0, 35.0, 17.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1552734375, -1.1235809326171875, -1.091888427734375, -1.0601959228515625, -1.02850341796875, -0.9968109130859375, -0.965118408203125, -0.9334259033203125, -0.9017333984375, -0.8700408935546875, -0.838348388671875, -0.8066558837890625, -0.77496337890625, -0.7432708740234375, -0.711578369140625, -0.6798858642578125, -0.648193359375, -0.6165008544921875, -0.584808349609375, -0.5531158447265625, -0.52142333984375, -0.4897308349609375, -0.458038330078125, -0.4263458251953125, -0.3946533203125, -0.3629608154296875, -0.331268310546875, -0.2995758056640625, -0.26788330078125, -0.2361907958984375, -0.204498291015625, -0.1728057861328125, -0.14111328125, -0.1094207763671875, -0.077728271484375, -0.0460357666015625, -0.01434326171875, 0.0173492431640625, 0.049041748046875, 0.0807342529296875, 0.1124267578125, 0.1441192626953125, 0.175811767578125, 0.2075042724609375, 0.23919677734375, 0.2708892822265625, 0.302581787109375, 0.3342742919921875, 0.365966796875, 0.3976593017578125, 0.429351806640625, 0.4610443115234375, 0.49273681640625, 0.5244293212890625, 0.556121826171875, 0.5878143310546875, 0.6195068359375, 0.6511993408203125, 0.682891845703125, 0.7145843505859375, 0.74627685546875, 0.7779693603515625, 0.809661865234375, 0.8413543701171875, 0.873046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 13.0, 9.0, 16.0, 34.0, 65.0, 102.0, 152.0, 137.0, 158.0, 129.0, 84.0, 41.0, 26.0, 15.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.194028377532959, -4.024294853210449, -3.8545613288879395, -3.684828042984009, -3.515094518661499, -3.3453609943389893, -3.1756277084350586, -3.005894184112549, -2.836160659790039, -2.6664271354675293, -2.4966936111450195, -2.326960325241089, -2.157226800918579, -1.9874932765960693, -1.8177598714828491, -1.648026466369629, -1.4782929420471191, -1.3085594177246094, -1.1388260126113892, -0.9690925478935242, -0.7993590831756592, -0.6296256184577942, -0.4598921537399292, -0.290158748626709, -0.12042522430419922, 0.04930824041366577, 0.21904170513153076, 0.38877516984939575, 0.5585086345672607, 0.7282420992851257, 0.8979755640029907, 1.067708969116211, 1.2374420166015625, 1.4071755409240723, 1.5769089460372925, 1.7466423511505127, 1.9163758754730225, 2.0861093997955322, 2.255842685699463, 2.4255762100219727, 2.5953097343444824, 2.765043258666992, 2.934776782989502, 3.1045100688934326, 3.2742435932159424, 3.443977117538452, 3.613710403442383, 3.7834439277648926, 3.9531774520874023, 4.122910976409912, 4.292644500732422, 4.462378025054932, 4.632111549377441, 4.801844596862793, 4.971578121185303, 5.1413116455078125, 5.311045169830322, 5.480778694152832, 5.650512218475342, 5.820245742797852, 5.989978790283203, 6.159712314605713, 6.329445838928223, 6.499179363250732, 6.668912887573242]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 11.0, 11.0, 7.0, 12.0, 18.0, 20.0, 21.0, 28.0, 31.0, 33.0, 34.0, 41.0, 47.0, 58.0, 35.0, 60.0, 42.0, 58.0, 43.0, 39.0, 46.0, 44.0, 29.0, 37.0, 30.0, 22.0, 21.0, 20.0, 18.0, 13.0, 11.0, 9.0, 12.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.207690715789795, -2.136155366897583, -2.064620018005371, -1.9930845499038696, -1.9215492010116577, -1.8500138521194458, -1.7784783840179443, -1.7069430351257324, -1.6354076862335205, -1.5638723373413086, -1.4923369884490967, -1.4208015203475952, -1.3492661714553833, -1.2777308225631714, -1.20619535446167, -1.134660005569458, -1.063124656677246, -0.9915893077850342, -0.9200538992881775, -0.8485184907913208, -0.7769831418991089, -0.705447793006897, -0.6339123845100403, -0.5623769760131836, -0.4908416271209717, -0.4193062484264374, -0.3477708697319031, -0.2762354910373688, -0.20470011234283447, -0.13316473364830017, -0.06162935495376587, 0.00990605354309082, 0.08144140243530273, 0.15297678112983704, 0.22451215982437134, 0.29604753851890564, 0.36758291721343994, 0.43911829590797424, 0.5106536746025085, 0.5821890830993652, 0.6537244319915771, 0.7252597808837891, 0.7967951893806458, 0.8683305978775024, 0.9398659467697144, 1.0114012956619263, 1.0829367637634277, 1.1544721126556396, 1.2260074615478516, 1.2975428104400635, 1.3690781593322754, 1.4406136274337769, 1.5121489763259888, 1.5836843252182007, 1.6552197933197021, 1.726755142211914, 1.798290491104126, 1.869825839996338, 1.9413611888885498, 2.0128965377807617, 2.0844321250915527, 2.1559674739837646, 2.2275028228759766, 2.2990381717681885, 2.3705735206604004]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 11.0, 15.0, 33.0, 46.0, 99.0, 131.0, 292.0, 576.0, 1311.0, 3297.0, 10180.0, 37211.0, 153493.0, 461280.0, 282718.0, 70781.0, 18052.0, 5447.0, 1899.0, 813.0, 369.0, 220.0, 104.0, 58.0, 38.0, 33.0, 17.0, 10.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.19921875, -6.043182373046875, -5.88714599609375, -5.731109619140625, -5.5750732421875, -5.419036865234375, -5.26300048828125, -5.106964111328125, -4.950927734375, -4.794891357421875, -4.63885498046875, -4.482818603515625, -4.3267822265625, -4.170745849609375, -4.01470947265625, -3.858673095703125, -3.70263671875, -3.546600341796875, -3.39056396484375, -3.234527587890625, -3.0784912109375, -2.922454833984375, -2.76641845703125, -2.610382080078125, -2.454345703125, -2.298309326171875, -2.14227294921875, -1.986236572265625, -1.8302001953125, -1.674163818359375, -1.51812744140625, -1.362091064453125, -1.2060546875, -1.050018310546875, -0.89398193359375, -0.737945556640625, -0.5819091796875, -0.425872802734375, -0.26983642578125, -0.113800048828125, 0.042236328125, 0.198272705078125, 0.35430908203125, 0.510345458984375, 0.6663818359375, 0.822418212890625, 0.97845458984375, 1.134490966796875, 1.29052734375, 1.446563720703125, 1.60260009765625, 1.758636474609375, 1.9146728515625, 2.070709228515625, 2.22674560546875, 2.382781982421875, 2.538818359375, 2.694854736328125, 2.85089111328125, 3.006927490234375, 3.1629638671875, 3.319000244140625, 3.47503662109375, 3.631072998046875, 3.787109375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 8.0, 1.0, 5.0, 8.0, 8.0, 10.0, 7.0, 22.0, 17.0, 22.0, 26.0, 28.0, 28.0, 33.0, 48.0, 47.0, 52.0, 51.0, 53.0, 51.0, 43.0, 51.0, 42.0, 34.0, 41.0, 43.0, 34.0, 32.0, 25.0, 18.0, 26.0, 16.0, 11.0, 22.0, 14.0, 9.0, 2.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.517578125, -2.420074462890625, -2.32257080078125, -2.225067138671875, -2.1275634765625, -2.030059814453125, -1.93255615234375, -1.835052490234375, -1.737548828125, -1.640045166015625, -1.54254150390625, -1.445037841796875, -1.3475341796875, -1.250030517578125, -1.15252685546875, -1.055023193359375, -0.95751953125, -0.860015869140625, -0.76251220703125, -0.665008544921875, -0.5675048828125, -0.470001220703125, -0.37249755859375, -0.274993896484375, -0.177490234375, -0.079986572265625, 0.01751708984375, 0.115020751953125, 0.2125244140625, 0.310028076171875, 0.40753173828125, 0.505035400390625, 0.6025390625, 0.700042724609375, 0.79754638671875, 0.895050048828125, 0.9925537109375, 1.090057373046875, 1.18756103515625, 1.285064697265625, 1.382568359375, 1.480072021484375, 1.57757568359375, 1.675079345703125, 1.7725830078125, 1.870086669921875, 1.96759033203125, 2.065093994140625, 2.16259765625, 2.260101318359375, 2.35760498046875, 2.455108642578125, 2.5526123046875, 2.650115966796875, 2.74761962890625, 2.845123291015625, 2.942626953125, 3.040130615234375, 3.13763427734375, 3.235137939453125, 3.3326416015625, 3.430145263671875, 3.52764892578125, 3.625152587890625, 3.72265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 7.0, 11.0, 26.0, 36.0, 55.0, 142.0, 384.0, 1093.0, 4969.0, 288717.0, 743487.0, 7449.0, 1394.0, 407.0, 178.0, 84.0, 41.0, 19.0, 14.0, 9.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.234375, -20.55126953125, -19.8681640625, -19.18505859375, -18.501953125, -17.81884765625, -17.1357421875, -16.45263671875, -15.76953125, -15.08642578125, -14.4033203125, -13.72021484375, -13.037109375, -12.35400390625, -11.6708984375, -10.98779296875, -10.3046875, -9.62158203125, -8.9384765625, -8.25537109375, -7.572265625, -6.88916015625, -6.2060546875, -5.52294921875, -4.83984375, -4.15673828125, -3.4736328125, -2.79052734375, -2.107421875, -1.42431640625, -0.7412109375, -0.05810546875, 0.625, 1.30810546875, 1.9912109375, 2.67431640625, 3.357421875, 4.04052734375, 4.7236328125, 5.40673828125, 6.08984375, 6.77294921875, 7.4560546875, 8.13916015625, 8.822265625, 9.50537109375, 10.1884765625, 10.87158203125, 11.5546875, 12.23779296875, 12.9208984375, 13.60400390625, 14.287109375, 14.97021484375, 15.6533203125, 16.33642578125, 17.01953125, 17.70263671875, 18.3857421875, 19.06884765625, 19.751953125, 20.43505859375, 21.1181640625, 21.80126953125, 22.484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 8.0, 18.0, 31.0, 26.0, 35.0, 33.0, 48.0, 58.0, 76.0, 68.0, 79.0, 71.0, 74.0, 64.0, 58.0, 41.0, 39.0, 32.0, 23.0, 25.0, 20.0, 19.0, 15.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.09375, -15.389892578125, -14.68603515625, -13.982177734375, -13.2783203125, -12.574462890625, -11.87060546875, -11.166748046875, -10.462890625, -9.759033203125, -9.05517578125, -8.351318359375, -7.6474609375, -6.943603515625, -6.23974609375, -5.535888671875, -4.83203125, -4.128173828125, -3.42431640625, -2.720458984375, -2.0166015625, -1.312744140625, -0.60888671875, 0.094970703125, 0.798828125, 1.502685546875, 2.20654296875, 2.910400390625, 3.6142578125, 4.318115234375, 5.02197265625, 5.725830078125, 6.4296875, 7.133544921875, 7.83740234375, 8.541259765625, 9.2451171875, 9.948974609375, 10.65283203125, 11.356689453125, 12.060546875, 12.764404296875, 13.46826171875, 14.172119140625, 14.8759765625, 15.579833984375, 16.28369140625, 16.987548828125, 17.69140625, 18.395263671875, 19.09912109375, 19.802978515625, 20.5068359375, 21.210693359375, 21.91455078125, 22.618408203125, 23.322265625, 24.026123046875, 24.72998046875, 25.433837890625, 26.1376953125, 26.841552734375, 27.54541015625, 28.249267578125, 28.953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 9.0, 7.0, 5.0, 13.0, 25.0, 25.0, 35.0, 41.0, 75.0, 118.0, 235.0, 494.0, 2379.0, 335588.0, 705426.0, 2834.0, 560.0, 270.0, 123.0, 78.0, 53.0, 35.0, 29.0, 24.0, 15.0, 11.0, 5.0, 8.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.9296875, -10.5533447265625, -10.177001953125, -9.8006591796875, -9.42431640625, -9.0479736328125, -8.671630859375, -8.2952880859375, -7.9189453125, -7.5426025390625, -7.166259765625, -6.7899169921875, -6.41357421875, -6.0372314453125, -5.660888671875, -5.2845458984375, -4.908203125, -4.5318603515625, -4.155517578125, -3.7791748046875, -3.40283203125, -3.0264892578125, -2.650146484375, -2.2738037109375, -1.8974609375, -1.5211181640625, -1.144775390625, -0.7684326171875, -0.39208984375, -0.0157470703125, 0.360595703125, 0.7369384765625, 1.11328125, 1.4896240234375, 1.865966796875, 2.2423095703125, 2.61865234375, 2.9949951171875, 3.371337890625, 3.7476806640625, 4.1240234375, 4.5003662109375, 4.876708984375, 5.2530517578125, 5.62939453125, 6.0057373046875, 6.382080078125, 6.7584228515625, 7.134765625, 7.5111083984375, 7.887451171875, 8.2637939453125, 8.64013671875, 9.0164794921875, 9.392822265625, 9.7691650390625, 10.1455078125, 10.5218505859375, 10.898193359375, 11.2745361328125, 11.65087890625, 12.0272216796875, 12.403564453125, 12.7799072265625, 13.15625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 10.0, 12.0, 16.0, 11.0, 21.0, 34.0, 32.0, 43.0, 41.0, 82.0, 103.0, 110.0, 121.0, 67.0, 63.0, 28.0, 39.0, 28.0, 29.0, 20.0, 14.0, 16.0, 8.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004839897155761719, -0.00046999379992485046, -0.00045599788427352905, -0.00044200196862220764, -0.00042800605297088623, -0.0004140101373195648, -0.0004000142216682434, -0.000386018306016922, -0.0003720223903656006, -0.0003580264747142792, -0.00034403055906295776, -0.00033003464341163635, -0.00031603872776031494, -0.00030204281210899353, -0.0002880468964576721, -0.0002740509808063507, -0.0002600550651550293, -0.0002460591495037079, -0.00023206323385238647, -0.00021806731820106506, -0.00020407140254974365, -0.00019007548689842224, -0.00017607957124710083, -0.00016208365559577942, -0.000148087739944458, -0.0001340918242931366, -0.00012009590864181519, -0.00010609999299049377, -9.210407733917236e-05, -7.810816168785095e-05, -6.411224603652954e-05, -5.011633038520813e-05, -3.612041473388672e-05, -2.2124499082565308e-05, -8.128583431243896e-06, 5.867332220077515e-06, 1.9863247871398926e-05, 3.385916352272034e-05, 4.785507917404175e-05, 6.185099482536316e-05, 7.584691047668457e-05, 8.984282612800598e-05, 0.00010383874177932739, 0.0001178346574306488, 0.00013183057308197021, 0.00014582648873329163, 0.00015982240438461304, 0.00017381832003593445, 0.00018781423568725586, 0.00020181015133857727, 0.00021580606698989868, 0.0002298019826412201, 0.0002437978982925415, 0.0002577938139438629, 0.0002717897295951843, 0.00028578564524650574, 0.00029978156089782715, 0.00031377747654914856, 0.00032777339220046997, 0.0003417693078517914, 0.0003557652235031128, 0.0003697611391544342, 0.0003837570548057556, 0.000397752970457077, 0.00041174888610839844]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 6.0, 14.0, 20.0, 32.0, 48.0, 54.0, 112.0, 189.0, 361.0, 989.0, 4379.0, 65114.0, 945989.0, 26804.0, 2905.0, 799.0, 306.0, 157.0, 89.0, 46.0, 40.0, 22.0, 22.0, 14.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8125, -8.56341552734375, -8.3143310546875, -8.06524658203125, -7.816162109375, -7.56707763671875, -7.3179931640625, -7.06890869140625, -6.81982421875, -6.57073974609375, -6.3216552734375, -6.07257080078125, -5.823486328125, -5.57440185546875, -5.3253173828125, -5.07623291015625, -4.8271484375, -4.57806396484375, -4.3289794921875, -4.07989501953125, -3.830810546875, -3.58172607421875, -3.3326416015625, -3.08355712890625, -2.83447265625, -2.58538818359375, -2.3363037109375, -2.08721923828125, -1.838134765625, -1.58905029296875, -1.3399658203125, -1.09088134765625, -0.841796875, -0.59271240234375, -0.3436279296875, -0.09454345703125, 0.154541015625, 0.40362548828125, 0.6527099609375, 0.90179443359375, 1.15087890625, 1.39996337890625, 1.6490478515625, 1.89813232421875, 2.147216796875, 2.39630126953125, 2.6453857421875, 2.89447021484375, 3.1435546875, 3.39263916015625, 3.6417236328125, 3.89080810546875, 4.139892578125, 4.38897705078125, 4.6380615234375, 4.88714599609375, 5.13623046875, 5.38531494140625, 5.6343994140625, 5.88348388671875, 6.132568359375, 6.38165283203125, 6.6307373046875, 6.87982177734375, 7.12890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 11.0, 17.0, 13.0, 36.0, 67.0, 104.0, 167.0, 179.0, 124.0, 95.0, 45.0, 35.0, 15.0, 14.0, 12.0, 7.0, 5.0, 2.0, 5.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.97265625, -6.76947021484375, -6.5662841796875, -6.36309814453125, -6.159912109375, -5.95672607421875, -5.7535400390625, -5.55035400390625, -5.34716796875, -5.14398193359375, -4.9407958984375, -4.73760986328125, -4.534423828125, -4.33123779296875, -4.1280517578125, -3.92486572265625, -3.7216796875, -3.51849365234375, -3.3153076171875, -3.11212158203125, -2.908935546875, -2.70574951171875, -2.5025634765625, -2.29937744140625, -2.09619140625, -1.89300537109375, -1.6898193359375, -1.48663330078125, -1.283447265625, -1.08026123046875, -0.8770751953125, -0.67388916015625, -0.470703125, -0.26751708984375, -0.0643310546875, 0.13885498046875, 0.342041015625, 0.54522705078125, 0.7484130859375, 0.95159912109375, 1.15478515625, 1.35797119140625, 1.5611572265625, 1.76434326171875, 1.967529296875, 2.17071533203125, 2.3739013671875, 2.57708740234375, 2.7802734375, 2.98345947265625, 3.1866455078125, 3.38983154296875, 3.593017578125, 3.79620361328125, 3.9993896484375, 4.20257568359375, 4.40576171875, 4.60894775390625, 4.8121337890625, 5.01531982421875, 5.218505859375, 5.42169189453125, 5.6248779296875, 5.82806396484375, 6.03125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 12.0, 42.0, 351.0, 538.0, 49.0, 12.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-336.7786865234375, -329.4750671386719, -322.17144775390625, -314.8677978515625, -307.5641784667969, -300.26055908203125, -292.9569396972656, -285.6533203125, -278.34967041015625, -271.0460510253906, -263.742431640625, -256.43878173828125, -249.13516235351562, -241.83154296875, -234.52792358398438, -227.2242889404297, -219.92066955566406, -212.61705017089844, -205.31341552734375, -198.00979614257812, -190.70616149902344, -183.4025421142578, -176.09890747070312, -168.7952880859375, -161.49166870117188, -154.18804931640625, -146.88441467285156, -139.58079528808594, -132.27716064453125, -124.97354125976562, -117.66991424560547, -110.36628723144531, -103.06263732910156, -95.7590103149414, -88.45538330078125, -81.15176391601562, -73.84812927246094, -66.54450988769531, -59.240882873535156, -51.937255859375, -44.633628845214844, -37.33000183105469, -30.026376724243164, -22.72275161743164, -15.419124603271484, -8.115497589111328, -0.8118743896484375, 6.491752624511719, 13.795379638671875, 21.09900665283203, 28.402631759643555, 35.70625686645508, 43.009883880615234, 50.31351089477539, 57.61713409423828, 64.92076110839844, 72.2243881225586, 79.52801513671875, 86.8316421508789, 94.13526916503906, 101.43888854980469, 108.74252319335938, 116.046142578125, 123.34976959228516, 130.6533966064453]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 6.0, 10.0, 9.0, 15.0, 20.0, 18.0, 21.0, 32.0, 26.0, 19.0, 45.0, 36.0, 33.0, 48.0, 46.0, 47.0, 48.0, 62.0, 62.0, 26.0, 52.0, 31.0, 32.0, 34.0, 25.0, 22.0, 30.0, 28.0, 18.0, 15.0, 15.0, 15.0, 12.0, 6.0, 5.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.04741668701172, -56.154151916503906, -54.26089096069336, -52.36762619018555, -50.474365234375, -48.58110046386719, -46.687835693359375, -44.79457473754883, -42.90131378173828, -41.00804901123047, -39.11478805541992, -37.22152328491211, -35.32826232910156, -33.43499755859375, -31.54173469543457, -29.64847183227539, -27.755207061767578, -25.8619441986084, -23.96868133544922, -22.075416564941406, -20.18215560913086, -18.288890838623047, -16.395627975463867, -14.502365112304688, -12.609102249145508, -10.715839385986328, -8.822576522827148, -6.929312705993652, -5.036049842834473, -3.142786979675293, -1.2495231628417969, 0.6437397003173828, 2.536998748779297, 4.430261611938477, 6.3235249519348145, 8.216788291931152, 10.110051155090332, 12.003314018249512, 13.896577835083008, 15.789840698242188, 17.683103561401367, 19.576366424560547, 21.469629287719727, 23.362892150878906, 25.25615692138672, 27.149417877197266, 29.042682647705078, 30.935945510864258, 32.82920837402344, 34.72247314453125, 36.6157341003418, 38.50899887084961, 40.402259826660156, 42.29552459716797, 44.18878936767578, 46.08205032348633, 47.975311279296875, 49.86857604980469, 51.761837005615234, 53.65510177612305, 55.548362731933594, 57.441627502441406, 59.33489227294922, 61.228153228759766, 63.12141799926758]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 9.0, 4.0, 6.0, 5.0, 17.0, 17.0, 17.0, 48.0, 41.0, 80.0, 188.0, 272.0, 578.0, 1186.0, 2746.0, 6852.0, 21093.0, 96035.0, 3632132.0, 367191.0, 45004.0, 12432.0, 4467.0, 1859.0, 886.0, 452.0, 257.0, 140.0, 75.0, 64.0, 34.0, 23.0, 13.0, 19.0, 9.0, 11.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.10546875, -2.9849853515625, -2.864501953125, -2.7440185546875, -2.62353515625, -2.5030517578125, -2.382568359375, -2.2620849609375, -2.1416015625, -2.0211181640625, -1.900634765625, -1.7801513671875, -1.65966796875, -1.5391845703125, -1.418701171875, -1.2982177734375, -1.177734375, -1.0572509765625, -0.936767578125, -0.8162841796875, -0.69580078125, -0.5753173828125, -0.454833984375, -0.3343505859375, -0.2138671875, -0.0933837890625, 0.027099609375, 0.1475830078125, 0.26806640625, 0.3885498046875, 0.509033203125, 0.6295166015625, 0.75, 0.8704833984375, 0.990966796875, 1.1114501953125, 1.23193359375, 1.3524169921875, 1.472900390625, 1.5933837890625, 1.7138671875, 1.8343505859375, 1.954833984375, 2.0753173828125, 2.19580078125, 2.3162841796875, 2.436767578125, 2.5572509765625, 2.677734375, 2.7982177734375, 2.918701171875, 3.0391845703125, 3.15966796875, 3.2801513671875, 3.400634765625, 3.5211181640625, 3.6416015625, 3.7620849609375, 3.882568359375, 4.0030517578125, 4.12353515625, 4.2440185546875, 4.364501953125, 4.4849853515625, 4.60546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 14.0, 7.0, 18.0, 18.0, 39.0, 44.0, 44.0, 67.0, 59.0, 70.0, 63.0, 65.0, 68.0, 66.0, 57.0, 60.0, 49.0, 44.0, 30.0, 25.0, 27.0, 12.0, 10.0, 8.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3203125, -4.17578125, -4.03125, -3.88671875, -3.7421875, -3.59765625, -3.453125, -3.30859375, -3.1640625, -3.01953125, -2.875, -2.73046875, -2.5859375, -2.44140625, -2.296875, -2.15234375, -2.0078125, -1.86328125, -1.71875, -1.57421875, -1.4296875, -1.28515625, -1.140625, -0.99609375, -0.8515625, -0.70703125, -0.5625, -0.41796875, -0.2734375, -0.12890625, 0.015625, 0.16015625, 0.3046875, 0.44921875, 0.59375, 0.73828125, 0.8828125, 1.02734375, 1.171875, 1.31640625, 1.4609375, 1.60546875, 1.75, 1.89453125, 2.0390625, 2.18359375, 2.328125, 2.47265625, 2.6171875, 2.76171875, 2.90625, 3.05078125, 3.1953125, 3.33984375, 3.484375, 3.62890625, 3.7734375, 3.91796875, 4.0625, 4.20703125, 4.3515625, 4.49609375, 4.640625, 4.78515625, 4.9296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 19.0, 28.0, 23.0, 34.0, 51.0, 50.0, 60.0, 76.0, 94.0, 127.0, 112.0, 169.0, 226.0, 389.0, 756.0, 2405.0, 12149.0, 136682.0, 3955288.0, 73483.0, 8319.0, 1828.0, 588.0, 307.0, 197.0, 155.0, 123.0, 107.0, 83.0, 60.0, 58.0, 46.0, 46.0, 32.0, 15.0, 16.0, 16.0, 11.0, 8.0, 4.0, 6.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.19140625, -6.97607421875, -6.7607421875, -6.54541015625, -6.330078125, -6.11474609375, -5.8994140625, -5.68408203125, -5.46875, -5.25341796875, -5.0380859375, -4.82275390625, -4.607421875, -4.39208984375, -4.1767578125, -3.96142578125, -3.74609375, -3.53076171875, -3.3154296875, -3.10009765625, -2.884765625, -2.66943359375, -2.4541015625, -2.23876953125, -2.0234375, -1.80810546875, -1.5927734375, -1.37744140625, -1.162109375, -0.94677734375, -0.7314453125, -0.51611328125, -0.30078125, -0.08544921875, 0.1298828125, 0.34521484375, 0.560546875, 0.77587890625, 0.9912109375, 1.20654296875, 1.421875, 1.63720703125, 1.8525390625, 2.06787109375, 2.283203125, 2.49853515625, 2.7138671875, 2.92919921875, 3.14453125, 3.35986328125, 3.5751953125, 3.79052734375, 4.005859375, 4.22119140625, 4.4365234375, 4.65185546875, 4.8671875, 5.08251953125, 5.2978515625, 5.51318359375, 5.728515625, 5.94384765625, 6.1591796875, 6.37451171875, 6.58984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 13.0, 14.0, 58.0, 196.0, 3010.0, 600.0, 100.0, 40.0, 25.0, 9.0, 5.0, 3.0, 4.0], "bins": [-8.4296875, -8.278366088867188, -8.127044677734375, -7.9757232666015625, -7.82440185546875, -7.6730804443359375, -7.521759033203125, -7.3704376220703125, -7.2191162109375, -7.0677947998046875, -6.916473388671875, -6.7651519775390625, -6.61383056640625, -6.4625091552734375, -6.311187744140625, -6.1598663330078125, -6.008544921875, -5.8572235107421875, -5.705902099609375, -5.5545806884765625, -5.40325927734375, -5.2519378662109375, -5.100616455078125, -4.9492950439453125, -4.7979736328125, -4.6466522216796875, -4.495330810546875, -4.3440093994140625, -4.19268798828125, -4.0413665771484375, -3.890045166015625, -3.7387237548828125, -3.58740234375, -3.4360809326171875, -3.284759521484375, -3.1334381103515625, -2.98211669921875, -2.8307952880859375, -2.679473876953125, -2.5281524658203125, -2.3768310546875, -2.2255096435546875, -2.074188232421875, -1.9228668212890625, -1.77154541015625, -1.6202239990234375, -1.468902587890625, -1.3175811767578125, -1.166259765625, -1.0149383544921875, -0.863616943359375, -0.7122955322265625, -0.56097412109375, -0.4096527099609375, -0.258331298828125, -0.1070098876953125, 0.0443115234375, 0.1956329345703125, 0.346954345703125, 0.4982757568359375, 0.64959716796875, 0.8009185791015625, 0.952239990234375, 1.1035614013671875, 1.2548828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 35.0, 151.0, 356.0, 282.0, 100.0, 41.0, 9.0, 6.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.27711486816406, -32.434696197509766, -31.592275619506836, -30.74985694885254, -29.907438278198242, -29.065017700195312, -28.222599029541016, -27.38018035888672, -26.53775978088379, -25.695341110229492, -24.852920532226562, -24.010501861572266, -23.16808319091797, -22.32566261291504, -21.483243942260742, -20.640823364257812, -19.798404693603516, -18.95598602294922, -18.11356544494629, -17.271146774291992, -16.428728103637695, -15.586307525634766, -14.743888854980469, -13.901469230651855, -13.059051513671875, -12.216631889343262, -11.374213218688965, -10.531793594360352, -9.689373970031738, -8.846954345703125, -8.004535675048828, -7.162116050720215, -6.319696426391602, -5.4772772789001465, -4.634857654571533, -3.792438507080078, -2.950019121170044, -2.1075997352600098, -1.2651805877685547, -0.4227609634399414, 0.41965818405151367, 1.2620775699615479, 2.104496955871582, 2.946916103363037, 3.7893354892730713, 4.6317548751831055, 5.4741740226745605, 6.316593647003174, 7.159012794494629, 8.001432418823242, 8.843851089477539, 9.686270713806152, 10.528690338134766, 11.371109008789062, 12.213528633117676, 13.055948257446289, 13.898366928100586, 14.7407865524292, 15.583205223083496, 16.42562484741211, 17.268043518066406, 18.110464096069336, 18.952882766723633, 19.795303344726562, 20.63772201538086]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 4.0, 10.0, 14.0, 14.0, 19.0, 23.0, 28.0, 32.0, 51.0, 61.0, 68.0, 69.0, 59.0, 70.0, 68.0, 74.0, 53.0, 47.0, 51.0, 40.0, 34.0, 24.0, 29.0, 16.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.29165267944336, -12.886375427246094, -12.481098175048828, -12.075819969177246, -11.67054271697998, -11.265265464782715, -10.859987258911133, -10.454710006713867, -10.049432754516602, -9.644155502319336, -9.23887825012207, -8.833600044250488, -8.428322792053223, -8.023045539855957, -7.617767810821533, -7.212490081787109, -6.807212829589844, -6.401935577392578, -5.996657848358154, -5.5913801193237305, -5.186102867126465, -4.780825614929199, -4.375547885894775, -3.9702703952789307, -3.564992904663086, -3.159715414047241, -2.7544379234313965, -2.3491604328155518, -1.943882942199707, -1.5386054515838623, -1.1333279609680176, -0.7280504703521729, -0.3227729797363281, 0.0825045108795166, 0.48778200149536133, 0.893059492111206, 1.2983369827270508, 1.7036144733428955, 2.1088919639587402, 2.514169454574585, 2.9194469451904297, 3.3247244358062744, 3.730001926422119, 4.135279655456543, 4.540556907653809, 4.945834159851074, 5.351111888885498, 5.756389617919922, 6.1616668701171875, 6.566944122314453, 6.972221851348877, 7.377499580383301, 7.782776832580566, 8.188054084777832, 8.593332290649414, 8.99860954284668, 9.403886795043945, 9.809164047241211, 10.214441299438477, 10.619719505310059, 11.024996757507324, 11.43027400970459, 11.835552215576172, 12.240829467773438, 12.646106719970703]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 6.0, 10.0, 22.0, 44.0, 79.0, 132.0, 255.0, 638.0, 1670.0, 5781.0, 28602.0, 221196.0, 640391.0, 125864.0, 17661.0, 4038.0, 1232.0, 447.0, 221.0, 111.0, 64.0, 28.0, 12.0, 22.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.32818603515625, -5.0899658203125, -4.85174560546875, -4.613525390625, -4.37530517578125, -4.1370849609375, -3.89886474609375, -3.66064453125, -3.42242431640625, -3.1842041015625, -2.94598388671875, -2.707763671875, -2.46954345703125, -2.2313232421875, -1.99310302734375, -1.7548828125, -1.51666259765625, -1.2784423828125, -1.04022216796875, -0.802001953125, -0.56378173828125, -0.3255615234375, -0.08734130859375, 0.15087890625, 0.38909912109375, 0.6273193359375, 0.86553955078125, 1.103759765625, 1.34197998046875, 1.5802001953125, 1.81842041015625, 2.056640625, 2.29486083984375, 2.5330810546875, 2.77130126953125, 3.009521484375, 3.24774169921875, 3.4859619140625, 3.72418212890625, 3.96240234375, 4.20062255859375, 4.4388427734375, 4.67706298828125, 4.915283203125, 5.15350341796875, 5.3917236328125, 5.62994384765625, 5.8681640625, 6.10638427734375, 6.3446044921875, 6.58282470703125, 6.821044921875, 7.05926513671875, 7.2974853515625, 7.53570556640625, 7.77392578125, 8.01214599609375, 8.2503662109375, 8.48858642578125, 8.726806640625, 8.96502685546875, 9.2032470703125, 9.44146728515625, 9.6796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 9.0, 19.0, 17.0, 15.0, 41.0, 26.0, 48.0, 54.0, 67.0, 60.0, 63.0, 55.0, 61.0, 44.0, 53.0, 51.0, 53.0, 53.0, 37.0, 36.0, 25.0, 17.0, 20.0, 12.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5078125, -3.38433837890625, -3.2608642578125, -3.13739013671875, -3.013916015625, -2.89044189453125, -2.7669677734375, -2.64349365234375, -2.52001953125, -2.39654541015625, -2.2730712890625, -2.14959716796875, -2.026123046875, -1.90264892578125, -1.7791748046875, -1.65570068359375, -1.5322265625, -1.40875244140625, -1.2852783203125, -1.16180419921875, -1.038330078125, -0.91485595703125, -0.7913818359375, -0.66790771484375, -0.54443359375, -0.42095947265625, -0.2974853515625, -0.17401123046875, -0.050537109375, 0.07293701171875, 0.1964111328125, 0.31988525390625, 0.443359375, 0.56683349609375, 0.6903076171875, 0.81378173828125, 0.937255859375, 1.06072998046875, 1.1842041015625, 1.30767822265625, 1.43115234375, 1.55462646484375, 1.6781005859375, 1.80157470703125, 1.925048828125, 2.04852294921875, 2.1719970703125, 2.29547119140625, 2.4189453125, 2.54241943359375, 2.6658935546875, 2.78936767578125, 2.912841796875, 3.03631591796875, 3.1597900390625, 3.28326416015625, 3.40673828125, 3.53021240234375, 3.6536865234375, 3.77716064453125, 3.900634765625, 4.02410888671875, 4.1475830078125, 4.27105712890625, 4.39453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 11.0, 6.0, 13.0, 20.0, 26.0, 31.0, 49.0, 69.0, 131.0, 192.0, 328.0, 717.0, 2201.0, 15409.0, 854441.0, 166320.0, 6031.0, 1326.0, 528.0, 249.0, 151.0, 102.0, 60.0, 41.0, 33.0, 15.0, 12.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.234375, -16.6748046875, -16.115234375, -15.5556640625, -14.99609375, -14.4365234375, -13.876953125, -13.3173828125, -12.7578125, -12.1982421875, -11.638671875, -11.0791015625, -10.51953125, -9.9599609375, -9.400390625, -8.8408203125, -8.28125, -7.7216796875, -7.162109375, -6.6025390625, -6.04296875, -5.4833984375, -4.923828125, -4.3642578125, -3.8046875, -3.2451171875, -2.685546875, -2.1259765625, -1.56640625, -1.0068359375, -0.447265625, 0.1123046875, 0.671875, 1.2314453125, 1.791015625, 2.3505859375, 2.91015625, 3.4697265625, 4.029296875, 4.5888671875, 5.1484375, 5.7080078125, 6.267578125, 6.8271484375, 7.38671875, 7.9462890625, 8.505859375, 9.0654296875, 9.625, 10.1845703125, 10.744140625, 11.3037109375, 11.86328125, 12.4228515625, 12.982421875, 13.5419921875, 14.1015625, 14.6611328125, 15.220703125, 15.7802734375, 16.33984375, 16.8994140625, 17.458984375, 18.0185546875, 18.578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 14.0, 19.0, 39.0, 39.0, 50.0, 57.0, 72.0, 84.0, 79.0, 77.0, 93.0, 87.0, 67.0, 63.0, 34.0, 21.0, 22.0, 18.0, 10.0, 11.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.19970703125, -23.4931640625, -22.78662109375, -22.080078125, -21.37353515625, -20.6669921875, -19.96044921875, -19.25390625, -18.54736328125, -17.8408203125, -17.13427734375, -16.427734375, -15.72119140625, -15.0146484375, -14.30810546875, -13.6015625, -12.89501953125, -12.1884765625, -11.48193359375, -10.775390625, -10.06884765625, -9.3623046875, -8.65576171875, -7.94921875, -7.24267578125, -6.5361328125, -5.82958984375, -5.123046875, -4.41650390625, -3.7099609375, -3.00341796875, -2.296875, -1.59033203125, -0.8837890625, -0.17724609375, 0.529296875, 1.23583984375, 1.9423828125, 2.64892578125, 3.35546875, 4.06201171875, 4.7685546875, 5.47509765625, 6.181640625, 6.88818359375, 7.5947265625, 8.30126953125, 9.0078125, 9.71435546875, 10.4208984375, 11.12744140625, 11.833984375, 12.54052734375, 13.2470703125, 13.95361328125, 14.66015625, 15.36669921875, 16.0732421875, 16.77978515625, 17.486328125, 18.19287109375, 18.8994140625, 19.60595703125, 20.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 9.0, 11.0, 25.0, 15.0, 26.0, 28.0, 40.0, 47.0, 77.0, 89.0, 172.0, 261.0, 568.0, 1587.0, 8960.0, 239315.0, 776572.0, 16839.0, 2346.0, 672.0, 303.0, 172.0, 129.0, 76.0, 55.0, 38.0, 35.0, 12.0, 11.0, 12.0, 8.0, 14.0, 3.0, 2.0, 5.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.765625, -6.58819580078125, -6.4107666015625, -6.23333740234375, -6.055908203125, -5.87847900390625, -5.7010498046875, -5.52362060546875, -5.34619140625, -5.16876220703125, -4.9913330078125, -4.81390380859375, -4.636474609375, -4.45904541015625, -4.2816162109375, -4.10418701171875, -3.9267578125, -3.74932861328125, -3.5718994140625, -3.39447021484375, -3.217041015625, -3.03961181640625, -2.8621826171875, -2.68475341796875, -2.50732421875, -2.32989501953125, -2.1524658203125, -1.97503662109375, -1.797607421875, -1.62017822265625, -1.4427490234375, -1.26531982421875, -1.087890625, -0.91046142578125, -0.7330322265625, -0.55560302734375, -0.378173828125, -0.20074462890625, -0.0233154296875, 0.15411376953125, 0.33154296875, 0.50897216796875, 0.6864013671875, 0.86383056640625, 1.041259765625, 1.21868896484375, 1.3961181640625, 1.57354736328125, 1.7509765625, 1.92840576171875, 2.1058349609375, 2.28326416015625, 2.460693359375, 2.63812255859375, 2.8155517578125, 2.99298095703125, 3.17041015625, 3.34783935546875, 3.5252685546875, 3.70269775390625, 3.880126953125, 4.05755615234375, 4.2349853515625, 4.41241455078125, 4.58984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 5.0, 8.0, 10.0, 22.0, 26.0, 24.0, 34.0, 38.0, 47.0, 82.0, 101.0, 167.0, 107.0, 80.0, 48.0, 39.0, 26.0, 33.0, 20.0, 18.0, 8.0, 6.0, 10.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005340576171875, -0.0005159154534339905, -0.000497773289680481, -0.00047963112592697144, -0.0004614889621734619, -0.0004433467984199524, -0.00042520463466644287, -0.00040706247091293335, -0.00038892030715942383, -0.0003707781434059143, -0.0003526359796524048, -0.00033449381589889526, -0.00031635165214538574, -0.0002982094883918762, -0.0002800673246383667, -0.0002619251608848572, -0.00024378299713134766, -0.00022564083337783813, -0.0002074986696243286, -0.0001893565058708191, -0.00017121434211730957, -0.00015307217836380005, -0.00013493001461029053, -0.000116787850856781, -9.864568710327148e-05, -8.050352334976196e-05, -6.236135959625244e-05, -4.421919584274292e-05, -2.60770320892334e-05, -7.934868335723877e-06, 1.0207295417785645e-05, 2.8349459171295166e-05, 4.649162292480469e-05, 6.463378667831421e-05, 8.277595043182373e-05, 0.00010091811418533325, 0.00011906027793884277, 0.0001372024416923523, 0.00015534460544586182, 0.00017348676919937134, 0.00019162893295288086, 0.00020977109670639038, 0.0002279132604598999, 0.0002460554242134094, 0.00026419758796691895, 0.00028233975172042847, 0.000300481915473938, 0.0003186240792274475, 0.00033676624298095703, 0.00035490840673446655, 0.0003730505704879761, 0.0003911927342414856, 0.0004093348979949951, 0.00042747706174850464, 0.00044561922550201416, 0.0004637613892555237, 0.0004819035530090332, 0.0005000457167625427, 0.0005181878805160522, 0.0005363300442695618, 0.0005544722080230713, 0.0005726143717765808, 0.0005907565355300903, 0.0006088986992835999, 0.0006270408630371094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 10.0, 13.0, 15.0, 14.0, 27.0, 32.0, 42.0, 43.0, 75.0, 98.0, 139.0, 243.0, 476.0, 988.0, 2484.0, 7345.0, 34846.0, 809628.0, 169347.0, 15101.0, 4250.0, 1639.0, 690.0, 332.0, 192.0, 116.0, 68.0, 68.0, 51.0, 28.0, 27.0, 32.0, 17.0, 21.0, 10.0, 6.0, 8.0, 8.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.15625, -5.0035400390625, -4.850830078125, -4.6981201171875, -4.54541015625, -4.3927001953125, -4.239990234375, -4.0872802734375, -3.9345703125, -3.7818603515625, -3.629150390625, -3.4764404296875, -3.32373046875, -3.1710205078125, -3.018310546875, -2.8656005859375, -2.712890625, -2.5601806640625, -2.407470703125, -2.2547607421875, -2.10205078125, -1.9493408203125, -1.796630859375, -1.6439208984375, -1.4912109375, -1.3385009765625, -1.185791015625, -1.0330810546875, -0.88037109375, -0.7276611328125, -0.574951171875, -0.4222412109375, -0.26953125, -0.1168212890625, 0.035888671875, 0.1885986328125, 0.34130859375, 0.4940185546875, 0.646728515625, 0.7994384765625, 0.9521484375, 1.1048583984375, 1.257568359375, 1.4102783203125, 1.56298828125, 1.7156982421875, 1.868408203125, 2.0211181640625, 2.173828125, 2.3265380859375, 2.479248046875, 2.6319580078125, 2.78466796875, 2.9373779296875, 3.090087890625, 3.2427978515625, 3.3955078125, 3.5482177734375, 3.700927734375, 3.8536376953125, 4.00634765625, 4.1590576171875, 4.311767578125, 4.4644775390625, 4.6171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 8.0, 8.0, 6.0, 17.0, 20.0, 31.0, 52.0, 119.0, 227.0, 214.0, 137.0, 63.0, 34.0, 24.0, 8.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.77044677734375, -4.5721435546875, -4.37384033203125, -4.175537109375, -3.97723388671875, -3.7789306640625, -3.58062744140625, -3.38232421875, -3.18402099609375, -2.9857177734375, -2.78741455078125, -2.589111328125, -2.39080810546875, -2.1925048828125, -1.99420166015625, -1.7958984375, -1.59759521484375, -1.3992919921875, -1.20098876953125, -1.002685546875, -0.80438232421875, -0.6060791015625, -0.40777587890625, -0.20947265625, -0.01116943359375, 0.1871337890625, 0.38543701171875, 0.583740234375, 0.78204345703125, 0.9803466796875, 1.17864990234375, 1.376953125, 1.57525634765625, 1.7735595703125, 1.97186279296875, 2.170166015625, 2.36846923828125, 2.5667724609375, 2.76507568359375, 2.96337890625, 3.16168212890625, 3.3599853515625, 3.55828857421875, 3.756591796875, 3.95489501953125, 4.1531982421875, 4.35150146484375, 4.5498046875, 4.74810791015625, 4.9464111328125, 5.14471435546875, 5.343017578125, 5.54132080078125, 5.7396240234375, 5.93792724609375, 6.13623046875, 6.33453369140625, 6.5328369140625, 6.73114013671875, 6.929443359375, 7.12774658203125, 7.3260498046875, 7.52435302734375, 7.72265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 13.0, 18.0, 121.0, 395.0, 349.0, 81.0, 14.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.31387329101562, -161.40142822265625, -156.48898315429688, -151.5765380859375, -146.66409301757812, -141.75164794921875, -136.83920288085938, -131.9267578125, -127.01431274414062, -122.10186767578125, -117.18942260742188, -112.2769775390625, -107.36453247070312, -102.45208740234375, -97.53964233398438, -92.627197265625, -87.71475219726562, -82.80230712890625, -77.88986206054688, -72.9774169921875, -68.06497192382812, -63.15252685546875, -58.240081787109375, -53.32763671875, -48.415191650390625, -43.50274658203125, -38.590301513671875, -33.6778564453125, -28.765411376953125, -23.85296630859375, -18.940521240234375, -14.028076171875, -9.115615844726562, -4.2031707763671875, 0.7092742919921875, 5.6217193603515625, 10.534164428710938, 15.446609497070312, 20.359054565429688, 25.271499633789062, 30.183944702148438, 35.09638977050781, 40.00883483886719, 44.92127990722656, 49.83372497558594, 54.74617004394531, 59.65861511230469, 64.57106018066406, 69.48350524902344, 74.39595031738281, 79.30839538574219, 84.22084045410156, 89.13328552246094, 94.04573059082031, 98.95817565917969, 103.87062072753906, 108.78306579589844, 113.69551086425781, 118.60795593261719, 123.52040100097656, 128.43284606933594, 133.3452911376953, 138.2577362060547, 143.17018127441406, 148.08262634277344]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 4.0, 7.0, 5.0, 8.0, 8.0, 10.0, 9.0, 14.0, 12.0, 21.0, 22.0, 19.0, 32.0, 25.0, 34.0, 22.0, 37.0, 37.0, 31.0, 45.0, 49.0, 50.0, 40.0, 42.0, 49.0, 37.0, 40.0, 45.0, 33.0, 28.0, 22.0, 29.0, 25.0, 23.0, 12.0, 7.0, 9.0, 8.0, 9.0, 6.0, 10.0, 6.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.15082931518555, -49.483055114746094, -47.815284729003906, -46.14751052856445, -44.479736328125, -42.81196594238281, -41.14419174194336, -39.476417541503906, -37.80864715576172, -36.140872955322266, -34.47310256958008, -32.805328369140625, -31.137554168701172, -29.46978187561035, -27.80200958251953, -26.134235382080078, -24.466461181640625, -22.798688888549805, -21.13091468811035, -19.46314239501953, -17.795368194580078, -16.127595901489258, -14.459823608398438, -12.7920503616333, -11.124277114868164, -9.456503868103027, -7.788731098175049, -6.12095832824707, -4.453185081481934, -2.785411834716797, -1.1176395416259766, 0.5501337051391602, 2.2179107666015625, 3.88568377494812, 5.553456783294678, 7.221229553222656, 8.889002799987793, 10.55677604675293, 12.22454833984375, 13.892321586608887, 15.560094833374023, 17.227867126464844, 18.895641326904297, 20.563413619995117, 22.231185913085938, 23.89896011352539, 25.56673240661621, 27.23450469970703, 28.902278900146484, 30.570051193237305, 32.237823486328125, 33.90559768676758, 35.57337188720703, 37.24114227294922, 38.90891647338867, 40.576690673828125, 42.24446105957031, 43.912235260009766, 45.58000564575195, 47.247779846191406, 48.91555404663086, 50.58332824707031, 52.2510986328125, 53.91887283325195, 55.586647033691406]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 4.0, 8.0, 14.0, 18.0, 25.0, 49.0, 71.0, 133.0, 237.0, 496.0, 1063.0, 2673.0, 8291.0, 42011.0, 868562.0, 3140789.0, 108037.0, 14431.0, 4143.0, 1527.0, 740.0, 391.0, 225.0, 128.0, 74.0, 44.0, 27.0, 23.0, 17.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.2071533203125, -5.054931640625, -4.9027099609375, -4.75048828125, -4.5982666015625, -4.446044921875, -4.2938232421875, -4.1416015625, -3.9893798828125, -3.837158203125, -3.6849365234375, -3.53271484375, -3.3804931640625, -3.228271484375, -3.0760498046875, -2.923828125, -2.7716064453125, -2.619384765625, -2.4671630859375, -2.31494140625, -2.1627197265625, -2.010498046875, -1.8582763671875, -1.7060546875, -1.5538330078125, -1.401611328125, -1.2493896484375, -1.09716796875, -0.9449462890625, -0.792724609375, -0.6405029296875, -0.48828125, -0.3360595703125, -0.183837890625, -0.0316162109375, 0.12060546875, 0.2728271484375, 0.425048828125, 0.5772705078125, 0.7294921875, 0.8817138671875, 1.033935546875, 1.1861572265625, 1.33837890625, 1.4906005859375, 1.642822265625, 1.7950439453125, 1.947265625, 2.0994873046875, 2.251708984375, 2.4039306640625, 2.55615234375, 2.7083740234375, 2.860595703125, 3.0128173828125, 3.1650390625, 3.3172607421875, 3.469482421875, 3.6217041015625, 3.77392578125, 3.9261474609375, 4.078369140625, 4.2305908203125, 4.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 16.0, 14.0, 19.0, 28.0, 25.0, 34.0, 50.0, 50.0, 52.0, 59.0, 69.0, 57.0, 56.0, 47.0, 57.0, 44.0, 45.0, 38.0, 46.0, 35.0, 25.0, 21.0, 25.0, 15.0, 10.0, 8.0, 7.0, 2.0, 11.0, 3.0, 1.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.69921875, -3.591796875, -3.484375, -3.376953125, -3.26953125, -3.162109375, -3.0546875, -2.947265625, -2.83984375, -2.732421875, -2.625, -2.517578125, -2.41015625, -2.302734375, -2.1953125, -2.087890625, -1.98046875, -1.873046875, -1.765625, -1.658203125, -1.55078125, -1.443359375, -1.3359375, -1.228515625, -1.12109375, -1.013671875, -0.90625, -0.798828125, -0.69140625, -0.583984375, -0.4765625, -0.369140625, -0.26171875, -0.154296875, -0.046875, 0.060546875, 0.16796875, 0.275390625, 0.3828125, 0.490234375, 0.59765625, 0.705078125, 0.8125, 0.919921875, 1.02734375, 1.134765625, 1.2421875, 1.349609375, 1.45703125, 1.564453125, 1.671875, 1.779296875, 1.88671875, 1.994140625, 2.1015625, 2.208984375, 2.31640625, 2.423828125, 2.53125, 2.638671875, 2.74609375, 2.853515625, 2.9609375, 3.068359375, 3.17578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 11.0, 21.0, 24.0, 44.0, 88.0, 183.0, 466.0, 1466.0, 6024.0, 42030.0, 3175328.0, 938423.0, 24117.0, 4076.0, 1216.0, 386.0, 164.0, 73.0, 39.0, 19.0, 18.0, 12.0, 6.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9990234375, -7.755859375, -7.5126953125, -7.26953125, -7.0263671875, -6.783203125, -6.5400390625, -6.296875, -6.0537109375, -5.810546875, -5.5673828125, -5.32421875, -5.0810546875, -4.837890625, -4.5947265625, -4.3515625, -4.1083984375, -3.865234375, -3.6220703125, -3.37890625, -3.1357421875, -2.892578125, -2.6494140625, -2.40625, -2.1630859375, -1.919921875, -1.6767578125, -1.43359375, -1.1904296875, -0.947265625, -0.7041015625, -0.4609375, -0.2177734375, 0.025390625, 0.2685546875, 0.51171875, 0.7548828125, 0.998046875, 1.2412109375, 1.484375, 1.7275390625, 1.970703125, 2.2138671875, 2.45703125, 2.7001953125, 2.943359375, 3.1865234375, 3.4296875, 3.6728515625, 3.916015625, 4.1591796875, 4.40234375, 4.6455078125, 4.888671875, 5.1318359375, 5.375, 5.6181640625, 5.861328125, 6.1044921875, 6.34765625, 6.5908203125, 6.833984375, 7.0771484375, 7.3203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 12.0, 22.0, 29.0, 43.0, 65.0, 132.0, 274.0, 855.0, 1409.0, 718.0, 277.0, 88.0, 41.0, 24.0, 19.0, 14.0, 9.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.953125, -5.72802734375, -5.5029296875, -5.27783203125, -5.052734375, -4.82763671875, -4.6025390625, -4.37744140625, -4.15234375, -3.92724609375, -3.7021484375, -3.47705078125, -3.251953125, -3.02685546875, -2.8017578125, -2.57666015625, -2.3515625, -2.12646484375, -1.9013671875, -1.67626953125, -1.451171875, -1.22607421875, -1.0009765625, -0.77587890625, -0.55078125, -0.32568359375, -0.1005859375, 0.12451171875, 0.349609375, 0.57470703125, 0.7998046875, 1.02490234375, 1.25, 1.47509765625, 1.7001953125, 1.92529296875, 2.150390625, 2.37548828125, 2.6005859375, 2.82568359375, 3.05078125, 3.27587890625, 3.5009765625, 3.72607421875, 3.951171875, 4.17626953125, 4.4013671875, 4.62646484375, 4.8515625, 5.07666015625, 5.3017578125, 5.52685546875, 5.751953125, 5.97705078125, 6.2021484375, 6.42724609375, 6.65234375, 6.87744140625, 7.1025390625, 7.32763671875, 7.552734375, 7.77783203125, 8.0029296875, 8.22802734375, 8.453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 8.0, 15.0, 43.0, 160.0, 317.0, 250.0, 118.0, 49.0, 17.0, 10.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.55470657348633, -52.43673324584961, -50.31875991821289, -48.20078659057617, -46.08281326293945, -43.964839935302734, -41.84687042236328, -39.72889709472656, -37.610923767089844, -35.492950439453125, -33.374977111816406, -31.257003784179688, -29.13903045654297, -27.02105712890625, -24.903085708618164, -22.785112380981445, -20.667137145996094, -18.549163818359375, -16.431190490722656, -14.313218116760254, -12.195244789123535, -10.077271461486816, -7.959299087524414, -5.841325759887695, -3.7233524322509766, -1.605379343032837, 0.5125937461853027, 2.6305665969848633, 4.748539924621582, 6.866513252258301, 8.984485626220703, 11.102458953857422, 13.220436096191406, 15.338409423828125, 17.456382751464844, 19.574356079101562, 21.69232940673828, 23.810302734375, 25.928274154663086, 28.046247482299805, 30.164220809936523, 32.28219223022461, 34.40016555786133, 36.51813888549805, 38.636112213134766, 40.754085540771484, 42.8720588684082, 44.99003219604492, 47.10800552368164, 49.22597885131836, 51.34395217895508, 53.4619255065918, 55.579898834228516, 57.697872161865234, 59.81584167480469, 61.933815002441406, 64.05178833007812, 66.16976165771484, 68.28773498535156, 70.40570831298828, 72.523681640625, 74.64165496826172, 76.75962829589844, 78.87760162353516, 80.99557495117188]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 13.0, 10.0, 18.0, 21.0, 17.0, 21.0, 22.0, 30.0, 41.0, 40.0, 47.0, 43.0, 49.0, 44.0, 51.0, 58.0, 66.0, 49.0, 48.0, 47.0, 37.0, 40.0, 32.0, 31.0, 29.0, 19.0, 16.0, 18.0, 15.0, 11.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.581113815307617, -24.68790054321289, -23.79468536376953, -22.901472091674805, -22.008258819580078, -21.11504554748535, -20.221832275390625, -19.328617095947266, -18.43540382385254, -17.542190551757812, -16.648975372314453, -15.755762100219727, -14.862548828125, -13.969335556030273, -13.07612133026123, -12.182907104492188, -11.289693832397461, -10.396480560302734, -9.503266334533691, -8.610052108764648, -7.716838836669922, -6.823625087738037, -5.930411338806152, -5.037197589874268, -4.143983840942383, -3.250770092010498, -2.3575563430786133, -1.4643425941467285, -0.5711288452148438, 0.322084903717041, 1.2152986526489258, 2.1085124015808105, 3.001728057861328, 3.894941806793213, 4.788155555725098, 5.681369304656982, 6.574583053588867, 7.467796802520752, 8.361010551452637, 9.25422477722168, 10.147438049316406, 11.040651321411133, 11.933865547180176, 12.827079772949219, 13.720293045043945, 14.613506317138672, 15.506720542907715, 16.399934768676758, 17.293148040771484, 18.18636131286621, 19.079574584960938, 19.972789764404297, 20.866003036499023, 21.75921630859375, 22.65243148803711, 23.545644760131836, 24.438858032226562, 25.33207130432129, 26.225284576416016, 27.118499755859375, 28.0117130279541, 28.904926300048828, 29.798141479492188, 30.691354751586914, 31.58456802368164]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 7.0, 12.0, 20.0, 19.0, 37.0, 43.0, 75.0, 126.0, 214.0, 379.0, 738.0, 1551.0, 3632.0, 9530.0, 30398.0, 114486.0, 466842.0, 314834.0, 73254.0, 20464.0, 6644.0, 2671.0, 1142.0, 596.0, 310.0, 178.0, 101.0, 60.0, 41.0, 33.0, 25.0, 25.0, 12.0, 14.0, 10.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.52734375, -5.37310791015625, -5.2188720703125, -5.06463623046875, -4.910400390625, -4.75616455078125, -4.6019287109375, -4.44769287109375, -4.29345703125, -4.13922119140625, -3.9849853515625, -3.83074951171875, -3.676513671875, -3.52227783203125, -3.3680419921875, -3.21380615234375, -3.0595703125, -2.90533447265625, -2.7510986328125, -2.59686279296875, -2.442626953125, -2.28839111328125, -2.1341552734375, -1.97991943359375, -1.82568359375, -1.67144775390625, -1.5172119140625, -1.36297607421875, -1.208740234375, -1.05450439453125, -0.9002685546875, -0.74603271484375, -0.591796875, -0.43756103515625, -0.2833251953125, -0.12908935546875, 0.025146484375, 0.17938232421875, 0.3336181640625, 0.48785400390625, 0.64208984375, 0.79632568359375, 0.9505615234375, 1.10479736328125, 1.259033203125, 1.41326904296875, 1.5675048828125, 1.72174072265625, 1.8759765625, 2.03021240234375, 2.1844482421875, 2.33868408203125, 2.492919921875, 2.64715576171875, 2.8013916015625, 2.95562744140625, 3.10986328125, 3.26409912109375, 3.4183349609375, 3.57257080078125, 3.726806640625, 3.88104248046875, 4.0352783203125, 4.18951416015625, 4.34375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 6.0, 13.0, 17.0, 24.0, 24.0, 29.0, 46.0, 64.0, 58.0, 64.0, 53.0, 64.0, 78.0, 47.0, 67.0, 62.0, 37.0, 38.0, 42.0, 32.0, 29.0, 26.0, 18.0, 13.0, 14.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.5853271484375, -3.471435546875, -3.3575439453125, -3.24365234375, -3.1297607421875, -3.015869140625, -2.9019775390625, -2.7880859375, -2.6741943359375, -2.560302734375, -2.4464111328125, -2.33251953125, -2.2186279296875, -2.104736328125, -1.9908447265625, -1.876953125, -1.7630615234375, -1.649169921875, -1.5352783203125, -1.42138671875, -1.3074951171875, -1.193603515625, -1.0797119140625, -0.9658203125, -0.8519287109375, -0.738037109375, -0.6241455078125, -0.51025390625, -0.3963623046875, -0.282470703125, -0.1685791015625, -0.0546875, 0.0592041015625, 0.173095703125, 0.2869873046875, 0.40087890625, 0.5147705078125, 0.628662109375, 0.7425537109375, 0.8564453125, 0.9703369140625, 1.084228515625, 1.1981201171875, 1.31201171875, 1.4259033203125, 1.539794921875, 1.6536865234375, 1.767578125, 1.8814697265625, 1.995361328125, 2.1092529296875, 2.22314453125, 2.3370361328125, 2.450927734375, 2.5648193359375, 2.6787109375, 2.7926025390625, 2.906494140625, 3.0203857421875, 3.13427734375, 3.2481689453125, 3.362060546875, 3.4759521484375, 3.58984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 7.0, 6.0, 8.0, 14.0, 19.0, 17.0, 24.0, 25.0, 55.0, 80.0, 135.0, 178.0, 352.0, 762.0, 2160.0, 9820.0, 236570.0, 776824.0, 16625.0, 2834.0, 944.0, 439.0, 235.0, 135.0, 83.0, 55.0, 32.0, 27.0, 19.0, 18.0, 9.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.5625, -18.0185546875, -17.474609375, -16.9306640625, -16.38671875, -15.8427734375, -15.298828125, -14.7548828125, -14.2109375, -13.6669921875, -13.123046875, -12.5791015625, -12.03515625, -11.4912109375, -10.947265625, -10.4033203125, -9.859375, -9.3154296875, -8.771484375, -8.2275390625, -7.68359375, -7.1396484375, -6.595703125, -6.0517578125, -5.5078125, -4.9638671875, -4.419921875, -3.8759765625, -3.33203125, -2.7880859375, -2.244140625, -1.7001953125, -1.15625, -0.6123046875, -0.068359375, 0.4755859375, 1.01953125, 1.5634765625, 2.107421875, 2.6513671875, 3.1953125, 3.7392578125, 4.283203125, 4.8271484375, 5.37109375, 5.9150390625, 6.458984375, 7.0029296875, 7.546875, 8.0908203125, 8.634765625, 9.1787109375, 9.72265625, 10.2666015625, 10.810546875, 11.3544921875, 11.8984375, 12.4423828125, 12.986328125, 13.5302734375, 14.07421875, 14.6181640625, 15.162109375, 15.7060546875, 16.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 2.0, 9.0, 11.0, 11.0, 10.0, 22.0, 43.0, 45.0, 57.0, 59.0, 81.0, 85.0, 88.0, 91.0, 75.0, 66.0, 69.0, 43.0, 30.0, 26.0, 16.0, 14.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.5625, -21.92529296875, -21.2880859375, -20.65087890625, -20.013671875, -19.37646484375, -18.7392578125, -18.10205078125, -17.46484375, -16.82763671875, -16.1904296875, -15.55322265625, -14.916015625, -14.27880859375, -13.6416015625, -13.00439453125, -12.3671875, -11.72998046875, -11.0927734375, -10.45556640625, -9.818359375, -9.18115234375, -8.5439453125, -7.90673828125, -7.26953125, -6.63232421875, -5.9951171875, -5.35791015625, -4.720703125, -4.08349609375, -3.4462890625, -2.80908203125, -2.171875, -1.53466796875, -0.8974609375, -0.26025390625, 0.376953125, 1.01416015625, 1.6513671875, 2.28857421875, 2.92578125, 3.56298828125, 4.2001953125, 4.83740234375, 5.474609375, 6.11181640625, 6.7490234375, 7.38623046875, 8.0234375, 8.66064453125, 9.2978515625, 9.93505859375, 10.572265625, 11.20947265625, 11.8466796875, 12.48388671875, 13.12109375, 13.75830078125, 14.3955078125, 15.03271484375, 15.669921875, 16.30712890625, 16.9443359375, 17.58154296875, 18.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 6.0, 13.0, 9.0, 8.0, 27.0, 38.0, 50.0, 80.0, 114.0, 212.0, 403.0, 945.0, 5486.0, 214177.0, 815651.0, 9044.0, 1237.0, 435.0, 220.0, 125.0, 78.0, 60.0, 42.0, 30.0, 19.0, 10.0, 7.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.328125, -9.0374755859375, -8.746826171875, -8.4561767578125, -8.16552734375, -7.8748779296875, -7.584228515625, -7.2935791015625, -7.0029296875, -6.7122802734375, -6.421630859375, -6.1309814453125, -5.84033203125, -5.5496826171875, -5.259033203125, -4.9683837890625, -4.677734375, -4.3870849609375, -4.096435546875, -3.8057861328125, -3.51513671875, -3.2244873046875, -2.933837890625, -2.6431884765625, -2.3525390625, -2.0618896484375, -1.771240234375, -1.4805908203125, -1.18994140625, -0.8992919921875, -0.608642578125, -0.3179931640625, -0.02734375, 0.2633056640625, 0.553955078125, 0.8446044921875, 1.13525390625, 1.4259033203125, 1.716552734375, 2.0072021484375, 2.2978515625, 2.5885009765625, 2.879150390625, 3.1697998046875, 3.46044921875, 3.7510986328125, 4.041748046875, 4.3323974609375, 4.623046875, 4.9136962890625, 5.204345703125, 5.4949951171875, 5.78564453125, 6.0762939453125, 6.366943359375, 6.6575927734375, 6.9482421875, 7.2388916015625, 7.529541015625, 7.8201904296875, 8.11083984375, 8.4014892578125, 8.692138671875, 8.9827880859375, 9.2734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 15.0, 6.0, 3.0, 5.0, 12.0, 11.0, 13.0, 11.0, 16.0, 26.0, 29.0, 49.0, 96.0, 191.0, 183.0, 109.0, 46.0, 37.0, 27.0, 23.0, 17.0, 14.0, 12.0, 7.0, 3.0, 5.0, 3.0, 4.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008878707885742188, -0.000863291323184967, -0.0008387118577957153, -0.0008141323924064636, -0.0007895529270172119, -0.0007649734616279602, -0.0007403939962387085, -0.0007158145308494568, -0.0006912350654602051, -0.0006666556000709534, -0.0006420761346817017, -0.00061749666929245, -0.0005929172039031982, -0.0005683377385139465, -0.0005437582731246948, -0.0005191788077354431, -0.0004945993423461914, -0.0004700198769569397, -0.000445440411567688, -0.0004208609461784363, -0.00039628148078918457, -0.00037170201539993286, -0.00034712255001068115, -0.00032254308462142944, -0.00029796361923217773, -0.000273384153842926, -0.0002488046884536743, -0.0002242252230644226, -0.0001996457576751709, -0.0001750662922859192, -0.00015048682689666748, -0.00012590736150741577, -0.00010132789611816406, -7.674843072891235e-05, -5.2168965339660645e-05, -2.7589499950408936e-05, -3.0100345611572266e-06, 2.1569430828094482e-05, 4.614889621734619e-05, 7.07283616065979e-05, 9.530782699584961e-05, 0.00011988729238510132, 0.00014446675777435303, 0.00016904622316360474, 0.00019362568855285645, 0.00021820515394210815, 0.00024278461933135986, 0.00026736408472061157, 0.0002919435501098633, 0.000316523015499115, 0.0003411024808883667, 0.0003656819462776184, 0.0003902614116668701, 0.0004148408770561218, 0.00043942034244537354, 0.00046399980783462524, 0.000488579273223877, 0.0005131587386131287, 0.0005377382040023804, 0.0005623176693916321, 0.0005868971347808838, 0.0006114766001701355, 0.0006360560655593872, 0.0006606355309486389, 0.0006852149963378906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 1.0, 7.0, 11.0, 13.0, 12.0, 16.0, 28.0, 39.0, 39.0, 54.0, 68.0, 113.0, 163.0, 241.0, 458.0, 862.0, 1989.0, 5162.0, 16303.0, 119629.0, 851283.0, 36480.0, 9290.0, 3243.0, 1356.0, 632.0, 356.0, 203.0, 134.0, 88.0, 74.0, 45.0, 44.0, 47.0, 17.0, 8.0, 13.0, 11.0, 8.0, 3.0, 7.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6015625, -6.39697265625, -6.1923828125, -5.98779296875, -5.783203125, -5.57861328125, -5.3740234375, -5.16943359375, -4.96484375, -4.76025390625, -4.5556640625, -4.35107421875, -4.146484375, -3.94189453125, -3.7373046875, -3.53271484375, -3.328125, -3.12353515625, -2.9189453125, -2.71435546875, -2.509765625, -2.30517578125, -2.1005859375, -1.89599609375, -1.69140625, -1.48681640625, -1.2822265625, -1.07763671875, -0.873046875, -0.66845703125, -0.4638671875, -0.25927734375, -0.0546875, 0.14990234375, 0.3544921875, 0.55908203125, 0.763671875, 0.96826171875, 1.1728515625, 1.37744140625, 1.58203125, 1.78662109375, 1.9912109375, 2.19580078125, 2.400390625, 2.60498046875, 2.8095703125, 3.01416015625, 3.21875, 3.42333984375, 3.6279296875, 3.83251953125, 4.037109375, 4.24169921875, 4.4462890625, 4.65087890625, 4.85546875, 5.06005859375, 5.2646484375, 5.46923828125, 5.673828125, 5.87841796875, 6.0830078125, 6.28759765625, 6.4921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 10.0, 9.0, 18.0, 19.0, 48.0, 100.0, 260.0, 244.0, 121.0, 49.0, 25.0, 21.0, 7.0, 14.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6171875, -8.34033203125, -8.0634765625, -7.78662109375, -7.509765625, -7.23291015625, -6.9560546875, -6.67919921875, -6.40234375, -6.12548828125, -5.8486328125, -5.57177734375, -5.294921875, -5.01806640625, -4.7412109375, -4.46435546875, -4.1875, -3.91064453125, -3.6337890625, -3.35693359375, -3.080078125, -2.80322265625, -2.5263671875, -2.24951171875, -1.97265625, -1.69580078125, -1.4189453125, -1.14208984375, -0.865234375, -0.58837890625, -0.3115234375, -0.03466796875, 0.2421875, 0.51904296875, 0.7958984375, 1.07275390625, 1.349609375, 1.62646484375, 1.9033203125, 2.18017578125, 2.45703125, 2.73388671875, 3.0107421875, 3.28759765625, 3.564453125, 3.84130859375, 4.1181640625, 4.39501953125, 4.671875, 4.94873046875, 5.2255859375, 5.50244140625, 5.779296875, 6.05615234375, 6.3330078125, 6.60986328125, 6.88671875, 7.16357421875, 7.4404296875, 7.71728515625, 7.994140625, 8.27099609375, 8.5478515625, 8.82470703125, 9.1015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 30.0, 86.0, 329.0, 350.0, 143.0, 29.0, 9.0, 3.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-170.97976684570312, -166.71546936035156, -162.45115661621094, -158.18685913085938, -153.92254638671875, -149.6582489013672, -145.39393615722656, -141.129638671875, -136.86532592773438, -132.6010284423828, -128.3367156982422, -124.0724105834961, -119.80810546875, -115.54380798339844, -111.27950286865234, -107.01519775390625, -102.75090026855469, -98.4865951538086, -94.2222900390625, -89.9579849243164, -85.69367980957031, -81.42938232421875, -77.16507720947266, -72.90077209472656, -68.63646697998047, -64.37216186523438, -60.10785675048828, -55.84355545043945, -51.57925033569336, -47.314945220947266, -43.05064392089844, -38.786338806152344, -34.52204132080078, -30.257736206054688, -25.993432998657227, -21.729129791259766, -17.464824676513672, -13.200519561767578, -8.936216354370117, -4.671913146972656, -0.4076080322265625, 3.856696128845215, 8.121000289916992, 12.38530445098877, 16.649608612060547, 20.91391372680664, 25.1782169342041, 29.442520141601562, 33.706825256347656, 37.97113037109375, 42.235435485839844, 46.49973678588867, 50.764041900634766, 55.02834701538086, 59.29264831542969, 63.55695343017578, 67.82125854492188, 72.08556365966797, 76.34986877441406, 80.61417388916016, 84.87847900390625, 89.14277648925781, 93.4070816040039, 97.67138671875, 101.9356918334961]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 2.0, 5.0, 13.0, 8.0, 9.0, 13.0, 13.0, 16.0, 22.0, 21.0, 17.0, 34.0, 28.0, 39.0, 41.0, 39.0, 37.0, 54.0, 51.0, 49.0, 61.0, 37.0, 39.0, 36.0, 41.0, 34.0, 35.0, 33.0, 27.0, 27.0, 19.0, 13.0, 19.0, 13.0, 12.0, 4.0, 11.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.449851989746094, -43.055641174316406, -41.66143035888672, -40.267215728759766, -38.87300491333008, -37.47879409790039, -36.08457946777344, -34.69036865234375, -33.29615783691406, -31.901947021484375, -30.507734298706055, -29.113521575927734, -27.719310760498047, -26.32509994506836, -24.93088722229004, -23.53667449951172, -22.14246368408203, -20.748252868652344, -19.354040145874023, -17.959827423095703, -16.565616607666016, -15.171404838562012, -13.777193069458008, -12.382981300354004, -10.98876953125, -9.594557762145996, -8.200345993041992, -6.806134223937988, -5.411922454833984, -4.0177106857299805, -2.6234989166259766, -1.2292871475219727, 0.16492462158203125, 1.5591363906860352, 2.953348159790039, 4.347559928894043, 5.741771697998047, 7.135983467102051, 8.530195236206055, 9.924407005310059, 11.318618774414062, 12.712830543518066, 14.10704231262207, 15.501254081726074, 16.895465850830078, 18.289676666259766, 19.683889389038086, 21.078102111816406, 22.472312927246094, 23.86652374267578, 25.2607364654541, 26.654949188232422, 28.04916000366211, 29.443370819091797, 30.837583541870117, 32.23179626464844, 33.626007080078125, 35.02021789550781, 36.4144287109375, 37.80864334106445, 39.20285415649414, 40.59706497192383, 41.99127960205078, 43.38549041748047, 44.779701232910156]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 1.0, 8.0, 11.0, 23.0, 70.0, 91.0, 190.0, 481.0, 2986.0, 4136321.0, 52721.0, 820.0, 246.0, 129.0, 67.0, 44.0, 22.0, 11.0, 11.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.71875, -23.915283203125, -23.11181640625, -22.308349609375, -21.5048828125, -20.701416015625, -19.89794921875, -19.094482421875, -18.291015625, -17.487548828125, -16.68408203125, -15.880615234375, -15.0771484375, -14.273681640625, -13.47021484375, -12.666748046875, -11.86328125, -11.059814453125, -10.25634765625, -9.452880859375, -8.6494140625, -7.845947265625, -7.04248046875, -6.239013671875, -5.435546875, -4.632080078125, -3.82861328125, -3.025146484375, -2.2216796875, -1.418212890625, -0.61474609375, 0.188720703125, 0.9921875, 1.795654296875, 2.59912109375, 3.402587890625, 4.2060546875, 5.009521484375, 5.81298828125, 6.616455078125, 7.419921875, 8.223388671875, 9.02685546875, 9.830322265625, 10.6337890625, 11.437255859375, 12.24072265625, 13.044189453125, 13.84765625, 14.651123046875, 15.45458984375, 16.258056640625, 17.0615234375, 17.864990234375, 18.66845703125, 19.471923828125, 20.275390625, 21.078857421875, 21.88232421875, 22.685791015625, 23.4892578125, 24.292724609375, 25.09619140625, 25.899658203125, 26.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 1.0, 7.0, 5.0, 18.0, 17.0, 24.0, 16.0, 28.0, 34.0, 32.0, 43.0, 53.0, 55.0, 75.0, 55.0, 57.0, 63.0, 53.0, 44.0, 46.0, 46.0, 44.0, 49.0, 24.0, 21.0, 16.0, 16.0, 17.0, 15.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.13671875, -4.034423828125, -3.93212890625, -3.829833984375, -3.7275390625, -3.625244140625, -3.52294921875, -3.420654296875, -3.318359375, -3.216064453125, -3.11376953125, -3.011474609375, -2.9091796875, -2.806884765625, -2.70458984375, -2.602294921875, -2.5, -2.397705078125, -2.29541015625, -2.193115234375, -2.0908203125, -1.988525390625, -1.88623046875, -1.783935546875, -1.681640625, -1.579345703125, -1.47705078125, -1.374755859375, -1.2724609375, -1.170166015625, -1.06787109375, -0.965576171875, -0.86328125, -0.760986328125, -0.65869140625, -0.556396484375, -0.4541015625, -0.351806640625, -0.24951171875, -0.147216796875, -0.044921875, 0.057373046875, 0.15966796875, 0.261962890625, 0.3642578125, 0.466552734375, 0.56884765625, 0.671142578125, 0.7734375, 0.875732421875, 0.97802734375, 1.080322265625, 1.1826171875, 1.284912109375, 1.38720703125, 1.489501953125, 1.591796875, 1.694091796875, 1.79638671875, 1.898681640625, 2.0009765625, 2.103271484375, 2.20556640625, 2.307861328125, 2.41015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 5.0, 16.0, 15.0, 26.0, 39.0, 47.0, 78.0, 93.0, 137.0, 254.0, 343.0, 686.0, 1517.0, 3959.0, 14197.0, 78743.0, 1734244.0, 2246940.0, 90862.0, 15328.0, 4070.0, 1368.0, 563.0, 290.0, 159.0, 90.0, 66.0, 42.0, 29.0, 14.0, 11.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.1015625, -5.941162109375, -5.78076171875, -5.620361328125, -5.4599609375, -5.299560546875, -5.13916015625, -4.978759765625, -4.818359375, -4.657958984375, -4.49755859375, -4.337158203125, -4.1767578125, -4.016357421875, -3.85595703125, -3.695556640625, -3.53515625, -3.374755859375, -3.21435546875, -3.053955078125, -2.8935546875, -2.733154296875, -2.57275390625, -2.412353515625, -2.251953125, -2.091552734375, -1.93115234375, -1.770751953125, -1.6103515625, -1.449951171875, -1.28955078125, -1.129150390625, -0.96875, -0.808349609375, -0.64794921875, -0.487548828125, -0.3271484375, -0.166748046875, -0.00634765625, 0.154052734375, 0.314453125, 0.474853515625, 0.63525390625, 0.795654296875, 0.9560546875, 1.116455078125, 1.27685546875, 1.437255859375, 1.59765625, 1.758056640625, 1.91845703125, 2.078857421875, 2.2392578125, 2.399658203125, 2.56005859375, 2.720458984375, 2.880859375, 3.041259765625, 3.20166015625, 3.362060546875, 3.5224609375, 3.682861328125, 3.84326171875, 4.003662109375, 4.1640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 8.0, 6.0, 13.0, 22.0, 26.0, 48.0, 65.0, 136.0, 257.0, 564.0, 1036.0, 950.0, 473.0, 220.0, 90.0, 63.0, 30.0, 24.0, 14.0, 14.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.21197509765625, -7.0216064453125, -6.83123779296875, -6.640869140625, -6.45050048828125, -6.2601318359375, -6.06976318359375, -5.87939453125, -5.68902587890625, -5.4986572265625, -5.30828857421875, -5.117919921875, -4.92755126953125, -4.7371826171875, -4.54681396484375, -4.3564453125, -4.16607666015625, -3.9757080078125, -3.78533935546875, -3.594970703125, -3.40460205078125, -3.2142333984375, -3.02386474609375, -2.83349609375, -2.64312744140625, -2.4527587890625, -2.26239013671875, -2.072021484375, -1.88165283203125, -1.6912841796875, -1.50091552734375, -1.310546875, -1.12017822265625, -0.9298095703125, -0.73944091796875, -0.549072265625, -0.35870361328125, -0.1683349609375, 0.02203369140625, 0.21240234375, 0.40277099609375, 0.5931396484375, 0.78350830078125, 0.973876953125, 1.16424560546875, 1.3546142578125, 1.54498291015625, 1.7353515625, 1.92572021484375, 2.1160888671875, 2.30645751953125, 2.496826171875, 2.68719482421875, 2.8775634765625, 3.06793212890625, 3.25830078125, 3.44866943359375, 3.6390380859375, 3.82940673828125, 4.019775390625, 4.21014404296875, 4.4005126953125, 4.59088134765625, 4.78125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 15.0, 23.0, 101.0, 305.0, 360.0, 150.0, 33.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0438461303711, -78.52041625976562, -75.99697875976562, -73.47354888916016, -70.95011901855469, -68.42668151855469, -65.90325164794922, -63.379817962646484, -60.85638427734375, -58.332950592041016, -55.80951690673828, -53.28608703613281, -50.76265335083008, -48.239219665527344, -45.715789794921875, -43.19235610961914, -40.668922424316406, -38.14548873901367, -35.62205505371094, -33.09862518310547, -30.575191497802734, -28.0517578125, -25.5283260345459, -23.004894256591797, -20.481460571289062, -17.958026885986328, -15.434595108032227, -12.911162376403809, -10.38772964477539, -7.864296913146973, -5.340864181518555, -2.817432403564453, -0.2939910888671875, 2.2294416427612305, 4.752874374389648, 7.276307106018066, 9.799739837646484, 12.323172569274902, 14.84660530090332, 17.370037078857422, 19.893470764160156, 22.41690444946289, 24.940336227416992, 27.463768005371094, 29.987201690673828, 32.51063537597656, 35.03406524658203, 37.557498931884766, 40.0809326171875, 42.604366302490234, 45.12779998779297, 47.65122985839844, 50.17466354370117, 52.698097229003906, 55.221527099609375, 57.74496078491211, 60.268394470214844, 62.79182815551758, 65.31526184082031, 67.83869171142578, 70.36212158203125, 72.88555908203125, 75.40898895263672, 77.93241882324219, 80.45585632324219]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 1.0, 5.0, 9.0, 12.0, 13.0, 9.0, 9.0, 17.0, 22.0, 32.0, 26.0, 33.0, 36.0, 37.0, 48.0, 63.0, 50.0, 68.0, 60.0, 56.0, 63.0, 57.0, 53.0, 36.0, 37.0, 34.0, 20.0, 19.0, 14.0, 8.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.202231407165527, -14.542743682861328, -13.883256912231445, -13.223769187927246, -12.564281463623047, -11.904794692993164, -11.245306968688965, -10.585819244384766, -9.926332473754883, -9.266844749450684, -8.6073579788208, -7.947870254516602, -7.2883830070495605, -6.6288957595825195, -5.96940803527832, -5.309920787811279, -4.650433540344238, -3.9909462928771973, -3.331458806991577, -2.671971321105957, -2.012484073638916, -1.352996826171875, -0.6935093402862549, -0.034021854400634766, 0.6254653930664062, 1.2849527597427368, 1.9444401264190674, 2.6039276123046875, 3.2634148597717285, 3.9229021072387695, 4.582389831542969, 5.24187707901001, 5.901363372802734, 6.560850620269775, 7.220337867736816, 7.879825592041016, 8.539312362670898, 9.198800086975098, 9.858287811279297, 10.51777458190918, 11.177262306213379, 11.836750030517578, 12.496236801147461, 13.15572452545166, 13.81521224975586, 14.474699020385742, 15.134186744689941, 15.79367446899414, 16.453161239624023, 17.112648010253906, 17.772136688232422, 18.431623458862305, 19.091110229492188, 19.750598907470703, 20.410085678100586, 21.06957244873047, 21.729061126708984, 22.388547897338867, 23.048036575317383, 23.707523345947266, 24.36701011657715, 25.02649688720703, 25.685985565185547, 26.34547233581543, 27.004959106445312]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 17.0, 24.0, 38.0, 43.0, 73.0, 91.0, 153.0, 222.0, 343.0, 585.0, 1136.0, 2495.0, 6410.0, 19891.0, 75483.0, 354301.0, 448619.0, 99117.0, 25752.0, 8024.0, 2848.0, 1249.0, 609.0, 364.0, 216.0, 121.0, 89.0, 68.0, 37.0, 28.0, 27.0, 22.0, 8.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.82421875, -4.6690673828125, -4.513916015625, -4.3587646484375, -4.20361328125, -4.0484619140625, -3.893310546875, -3.7381591796875, -3.5830078125, -3.4278564453125, -3.272705078125, -3.1175537109375, -2.96240234375, -2.8072509765625, -2.652099609375, -2.4969482421875, -2.341796875, -2.1866455078125, -2.031494140625, -1.8763427734375, -1.72119140625, -1.5660400390625, -1.410888671875, -1.2557373046875, -1.1005859375, -0.9454345703125, -0.790283203125, -0.6351318359375, -0.47998046875, -0.3248291015625, -0.169677734375, -0.0145263671875, 0.140625, 0.2957763671875, 0.450927734375, 0.6060791015625, 0.76123046875, 0.9163818359375, 1.071533203125, 1.2266845703125, 1.3818359375, 1.5369873046875, 1.692138671875, 1.8472900390625, 2.00244140625, 2.1575927734375, 2.312744140625, 2.4678955078125, 2.623046875, 2.7781982421875, 2.933349609375, 3.0885009765625, 3.24365234375, 3.3988037109375, 3.553955078125, 3.7091064453125, 3.8642578125, 4.0194091796875, 4.174560546875, 4.3297119140625, 4.48486328125, 4.6400146484375, 4.795166015625, 4.9503173828125, 5.10546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 8.0, 7.0, 10.0, 21.0, 25.0, 21.0, 27.0, 30.0, 33.0, 39.0, 44.0, 50.0, 46.0, 69.0, 58.0, 53.0, 53.0, 53.0, 50.0, 47.0, 37.0, 31.0, 45.0, 38.0, 12.0, 18.0, 16.0, 10.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-3.8515625, -3.757171630859375, -3.66278076171875, -3.568389892578125, -3.4739990234375, -3.379608154296875, -3.28521728515625, -3.190826416015625, -3.096435546875, -3.002044677734375, -2.90765380859375, -2.813262939453125, -2.7188720703125, -2.624481201171875, -2.53009033203125, -2.435699462890625, -2.34130859375, -2.246917724609375, -2.15252685546875, -2.058135986328125, -1.9637451171875, -1.869354248046875, -1.77496337890625, -1.680572509765625, -1.586181640625, -1.491790771484375, -1.39739990234375, -1.303009033203125, -1.2086181640625, -1.114227294921875, -1.01983642578125, -0.925445556640625, -0.8310546875, -0.736663818359375, -0.64227294921875, -0.547882080078125, -0.4534912109375, -0.359100341796875, -0.26470947265625, -0.170318603515625, -0.075927734375, 0.018463134765625, 0.11285400390625, 0.207244873046875, 0.3016357421875, 0.396026611328125, 0.49041748046875, 0.584808349609375, 0.67919921875, 0.773590087890625, 0.86798095703125, 0.962371826171875, 1.0567626953125, 1.151153564453125, 1.24554443359375, 1.339935302734375, 1.434326171875, 1.528717041015625, 1.62310791015625, 1.717498779296875, 1.8118896484375, 1.906280517578125, 2.00067138671875, 2.095062255859375, 2.189453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 3.0, 4.0, 9.0, 15.0, 21.0, 29.0, 31.0, 52.0, 94.0, 130.0, 218.0, 382.0, 859.0, 2224.0, 8064.0, 55148.0, 750541.0, 204871.0, 18996.0, 4125.0, 1379.0, 577.0, 292.0, 155.0, 105.0, 62.0, 53.0, 26.0, 14.0, 15.0, 11.0, 9.0, 7.0, 5.0, 2.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.0078125, -10.681640625, -10.35546875, -10.029296875, -9.703125, -9.376953125, -9.05078125, -8.724609375, -8.3984375, -8.072265625, -7.74609375, -7.419921875, -7.09375, -6.767578125, -6.44140625, -6.115234375, -5.7890625, -5.462890625, -5.13671875, -4.810546875, -4.484375, -4.158203125, -3.83203125, -3.505859375, -3.1796875, -2.853515625, -2.52734375, -2.201171875, -1.875, -1.548828125, -1.22265625, -0.896484375, -0.5703125, -0.244140625, 0.08203125, 0.408203125, 0.734375, 1.060546875, 1.38671875, 1.712890625, 2.0390625, 2.365234375, 2.69140625, 3.017578125, 3.34375, 3.669921875, 3.99609375, 4.322265625, 4.6484375, 4.974609375, 5.30078125, 5.626953125, 5.953125, 6.279296875, 6.60546875, 6.931640625, 7.2578125, 7.583984375, 7.91015625, 8.236328125, 8.5625, 8.888671875, 9.21484375, 9.541015625, 9.8671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 5.0, 7.0, 8.0, 15.0, 20.0, 20.0, 14.0, 33.0, 39.0, 50.0, 56.0, 47.0, 63.0, 80.0, 48.0, 57.0, 52.0, 48.0, 51.0, 59.0, 42.0, 37.0, 32.0, 23.0, 24.0, 13.0, 13.0, 13.0, 7.0, 4.0, 3.0, 2.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6484375, -13.218505859375, -12.78857421875, -12.358642578125, -11.9287109375, -11.498779296875, -11.06884765625, -10.638916015625, -10.208984375, -9.779052734375, -9.34912109375, -8.919189453125, -8.4892578125, -8.059326171875, -7.62939453125, -7.199462890625, -6.76953125, -6.339599609375, -5.90966796875, -5.479736328125, -5.0498046875, -4.619873046875, -4.18994140625, -3.760009765625, -3.330078125, -2.900146484375, -2.47021484375, -2.040283203125, -1.6103515625, -1.180419921875, -0.75048828125, -0.320556640625, 0.109375, 0.539306640625, 0.96923828125, 1.399169921875, 1.8291015625, 2.259033203125, 2.68896484375, 3.118896484375, 3.548828125, 3.978759765625, 4.40869140625, 4.838623046875, 5.2685546875, 5.698486328125, 6.12841796875, 6.558349609375, 6.98828125, 7.418212890625, 7.84814453125, 8.278076171875, 8.7080078125, 9.137939453125, 9.56787109375, 9.997802734375, 10.427734375, 10.857666015625, 11.28759765625, 11.717529296875, 12.1474609375, 12.577392578125, 13.00732421875, 13.437255859375, 13.8671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 15.0, 16.0, 39.0, 93.0, 166.0, 504.0, 2771.0, 59367.0, 974474.0, 9421.0, 1113.0, 289.0, 124.0, 59.0, 34.0, 15.0, 15.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.307861328125, -13.85009765625, -13.392333984375, -12.9345703125, -12.476806640625, -12.01904296875, -11.561279296875, -11.103515625, -10.645751953125, -10.18798828125, -9.730224609375, -9.2724609375, -8.814697265625, -8.35693359375, -7.899169921875, -7.44140625, -6.983642578125, -6.52587890625, -6.068115234375, -5.6103515625, -5.152587890625, -4.69482421875, -4.237060546875, -3.779296875, -3.321533203125, -2.86376953125, -2.406005859375, -1.9482421875, -1.490478515625, -1.03271484375, -0.574951171875, -0.1171875, 0.340576171875, 0.79833984375, 1.256103515625, 1.7138671875, 2.171630859375, 2.62939453125, 3.087158203125, 3.544921875, 4.002685546875, 4.46044921875, 4.918212890625, 5.3759765625, 5.833740234375, 6.29150390625, 6.749267578125, 7.20703125, 7.664794921875, 8.12255859375, 8.580322265625, 9.0380859375, 9.495849609375, 9.95361328125, 10.411376953125, 10.869140625, 11.326904296875, 11.78466796875, 12.242431640625, 12.7001953125, 13.157958984375, 13.61572265625, 14.073486328125, 14.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 1.0, 6.0, 10.0, 8.0, 14.0, 27.0, 39.0, 60.0, 110.0, 239.0, 213.0, 107.0, 46.0, 31.0, 21.0, 20.0, 11.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009636878967285156, -0.0009264424443244934, -0.0008891969919204712, -0.000851951539516449, -0.0008147060871124268, -0.0007774606347084045, -0.0007402151823043823, -0.0007029697299003601, -0.0006657242774963379, -0.0006284788250923157, -0.0005912333726882935, -0.0005539879202842712, -0.000516742467880249, -0.0004794970154762268, -0.0004422515630722046, -0.0004050061106681824, -0.00036776065826416016, -0.00033051520586013794, -0.0002932697534561157, -0.0002560243010520935, -0.0002187788486480713, -0.00018153339624404907, -0.00014428794384002686, -0.00010704249143600464, -6.979703903198242e-05, -3.2551586627960205e-05, 4.693865776062012e-06, 4.193931818008423e-05, 7.918477058410645e-05, 0.00011643022298812866, 0.00015367567539215088, 0.0001909211277961731, 0.0002281665802001953, 0.00026541203260421753, 0.00030265748500823975, 0.00033990293741226196, 0.0003771483898162842, 0.0004143938422203064, 0.0004516392946243286, 0.0004888847470283508, 0.000526130199432373, 0.0005633756518363953, 0.0006006211042404175, 0.0006378665566444397, 0.0006751120090484619, 0.0007123574614524841, 0.0007496029138565063, 0.0007868483662605286, 0.0008240938186645508, 0.000861339271068573, 0.0008985847234725952, 0.0009358301758766174, 0.0009730756282806396, 0.0010103210806846619, 0.001047566533088684, 0.0010848119854927063, 0.0011220574378967285, 0.0011593028903007507, 0.001196548342704773, 0.0012337937951087952, 0.0012710392475128174, 0.0013082846999168396, 0.0013455301523208618, 0.001382775604724884, 0.0014200210571289062]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 7.0, 8.0, 16.0, 27.0, 35.0, 70.0, 134.0, 213.0, 422.0, 962.0, 2868.0, 11107.0, 82360.0, 883394.0, 53664.0, 9165.0, 2402.0, 822.0, 363.0, 214.0, 133.0, 52.0, 40.0, 21.0, 18.0, 12.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.190673828125, -6.99853515625, -6.806396484375, -6.6142578125, -6.422119140625, -6.22998046875, -6.037841796875, -5.845703125, -5.653564453125, -5.46142578125, -5.269287109375, -5.0771484375, -4.885009765625, -4.69287109375, -4.500732421875, -4.30859375, -4.116455078125, -3.92431640625, -3.732177734375, -3.5400390625, -3.347900390625, -3.15576171875, -2.963623046875, -2.771484375, -2.579345703125, -2.38720703125, -2.195068359375, -2.0029296875, -1.810791015625, -1.61865234375, -1.426513671875, -1.234375, -1.042236328125, -0.85009765625, -0.657958984375, -0.4658203125, -0.273681640625, -0.08154296875, 0.110595703125, 0.302734375, 0.494873046875, 0.68701171875, 0.879150390625, 1.0712890625, 1.263427734375, 1.45556640625, 1.647705078125, 1.83984375, 2.031982421875, 2.22412109375, 2.416259765625, 2.6083984375, 2.800537109375, 2.99267578125, 3.184814453125, 3.376953125, 3.569091796875, 3.76123046875, 3.953369140625, 4.1455078125, 4.337646484375, 4.52978515625, 4.721923828125, 4.9140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 9.0, 11.0, 10.0, 14.0, 22.0, 39.0, 36.0, 61.0, 83.0, 110.0, 136.0, 112.0, 85.0, 68.0, 47.0, 34.0, 22.0, 17.0, 12.0, 6.0, 8.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.149566650390625, -3.03936767578125, -2.929168701171875, -2.8189697265625, -2.708770751953125, -2.59857177734375, -2.488372802734375, -2.378173828125, -2.267974853515625, -2.15777587890625, -2.047576904296875, -1.9373779296875, -1.827178955078125, -1.71697998046875, -1.606781005859375, -1.49658203125, -1.386383056640625, -1.27618408203125, -1.165985107421875, -1.0557861328125, -0.945587158203125, -0.83538818359375, -0.725189208984375, -0.614990234375, -0.504791259765625, -0.39459228515625, -0.284393310546875, -0.1741943359375, -0.063995361328125, 0.04620361328125, 0.156402587890625, 0.2666015625, 0.376800537109375, 0.48699951171875, 0.597198486328125, 0.7073974609375, 0.817596435546875, 0.92779541015625, 1.037994384765625, 1.148193359375, 1.258392333984375, 1.36859130859375, 1.478790283203125, 1.5889892578125, 1.699188232421875, 1.80938720703125, 1.919586181640625, 2.02978515625, 2.139984130859375, 2.25018310546875, 2.360382080078125, 2.4705810546875, 2.580780029296875, 2.69097900390625, 2.801177978515625, 2.911376953125, 3.021575927734375, 3.13177490234375, 3.241973876953125, 3.3521728515625, 3.462371826171875, 3.57257080078125, 3.682769775390625, 3.79296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 33.0, 159.0, 460.0, 252.0, 45.0, 19.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.2841796875, -152.60556030273438, -147.92694091796875, -143.24830627441406, -138.56968688964844, -133.8910675048828, -129.21243286132812, -124.5338134765625, -119.85519409179688, -115.17657470703125, -110.4979476928711, -105.81932067871094, -101.14070129394531, -96.46208190917969, -91.78345489501953, -87.10482788085938, -82.42620849609375, -77.74758911132812, -73.06896209716797, -68.39033508300781, -63.71171569824219, -59.0330924987793, -54.354469299316406, -49.675846099853516, -44.997222900390625, -40.318599700927734, -35.639976501464844, -30.961353302001953, -26.282730102539062, -21.604106903076172, -16.92548370361328, -12.24686050415039, -7.5682373046875, -2.8896141052246094, 1.7890090942382812, 6.467632293701172, 11.146255493164062, 15.824878692626953, 20.503501892089844, 25.182125091552734, 29.860748291015625, 34.539371490478516, 39.217994689941406, 43.8966178894043, 48.57524108886719, 53.25386428833008, 57.93248748779297, 62.61111068725586, 67.28973388671875, 71.96835327148438, 76.64698028564453, 81.32560729980469, 86.00422668457031, 90.68284606933594, 95.3614730834961, 100.04010009765625, 104.71871948242188, 109.3973388671875, 114.07596588134766, 118.75459289550781, 123.43321228027344, 128.11183166503906, 132.79046630859375, 137.46908569335938, 142.147705078125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 13.0, 12.0, 27.0, 28.0, 35.0, 46.0, 47.0, 53.0, 60.0, 67.0, 92.0, 84.0, 72.0, 66.0, 49.0, 32.0, 40.0, 46.0, 20.0, 23.0, 25.0, 15.0, 9.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.068634033203125, -53.983089447021484, -51.89754867553711, -49.81200408935547, -47.726463317871094, -45.64091873168945, -43.55537414550781, -41.46983337402344, -39.38429260253906, -37.29874801635742, -35.21320724487305, -33.127662658691406, -31.04212188720703, -28.95657730102539, -26.871034622192383, -24.785491943359375, -22.699947357177734, -20.614404678344727, -18.52886199951172, -16.443317413330078, -14.357775688171387, -12.272233009338379, -10.186689376831055, -8.101146697998047, -6.015604019165039, -3.930061101913452, -1.8445181846618652, 0.24102497100830078, 2.3265676498413086, 4.412110328674316, 6.497653961181641, 8.583196640014648, 10.668739318847656, 12.754281997680664, 14.839824676513672, 16.925369262695312, 19.010910034179688, 21.096454620361328, 23.181997299194336, 25.267539978027344, 27.35308265686035, 29.43862533569336, 31.524168014526367, 33.609710693359375, 35.695255279541016, 37.78079605102539, 39.86634063720703, 41.951881408691406, 44.03742599487305, 46.12297058105469, 48.20851135253906, 50.2940559387207, 52.37959671020508, 54.46514129638672, 56.550682067871094, 58.636226654052734, 60.721771240234375, 62.807315826416016, 64.89286041259766, 66.97840118408203, 69.0639419555664, 71.14948272705078, 73.23503112792969, 75.32057189941406, 77.40611267089844]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 9.0, 26.0, 18.0, 45.0, 88.0, 110.0, 181.0, 294.0, 574.0, 1282.0, 3274.0, 11758.0, 77509.0, 1629968.0, 2327380.0, 119063.0, 15714.0, 4016.0, 1422.0, 642.0, 356.0, 197.0, 111.0, 82.0, 45.0, 31.0, 20.0, 17.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.5, -6.34552001953125, -6.1910400390625, -6.03656005859375, -5.882080078125, -5.72760009765625, -5.5731201171875, -5.41864013671875, -5.26416015625, -5.10968017578125, -4.9552001953125, -4.80072021484375, -4.646240234375, -4.49176025390625, -4.3372802734375, -4.18280029296875, -4.0283203125, -3.87384033203125, -3.7193603515625, -3.56488037109375, -3.410400390625, -3.25592041015625, -3.1014404296875, -2.94696044921875, -2.79248046875, -2.63800048828125, -2.4835205078125, -2.32904052734375, -2.174560546875, -2.02008056640625, -1.8656005859375, -1.71112060546875, -1.556640625, -1.40216064453125, -1.2476806640625, -1.09320068359375, -0.938720703125, -0.78424072265625, -0.6297607421875, -0.47528076171875, -0.32080078125, -0.16632080078125, -0.0118408203125, 0.14263916015625, 0.297119140625, 0.45159912109375, 0.6060791015625, 0.76055908203125, 0.9150390625, 1.06951904296875, 1.2239990234375, 1.37847900390625, 1.532958984375, 1.68743896484375, 1.8419189453125, 1.99639892578125, 2.15087890625, 2.30535888671875, 2.4598388671875, 2.61431884765625, 2.768798828125, 2.92327880859375, 3.0777587890625, 3.23223876953125, 3.38671875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 6.0, 9.0, 10.0, 13.0, 24.0, 32.0, 27.0, 23.0, 40.0, 41.0, 47.0, 54.0, 51.0, 80.0, 57.0, 65.0, 51.0, 61.0, 57.0, 46.0, 34.0, 36.0, 31.0, 25.0, 15.0, 14.0, 9.0, 10.0, 10.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.46942138671875, -2.3685302734375, -2.26763916015625, -2.166748046875, -2.06585693359375, -1.9649658203125, -1.86407470703125, -1.76318359375, -1.66229248046875, -1.5614013671875, -1.46051025390625, -1.359619140625, -1.25872802734375, -1.1578369140625, -1.05694580078125, -0.9560546875, -0.85516357421875, -0.7542724609375, -0.65338134765625, -0.552490234375, -0.45159912109375, -0.3507080078125, -0.24981689453125, -0.14892578125, -0.04803466796875, 0.0528564453125, 0.15374755859375, 0.254638671875, 0.35552978515625, 0.4564208984375, 0.55731201171875, 0.658203125, 0.75909423828125, 0.8599853515625, 0.96087646484375, 1.061767578125, 1.16265869140625, 1.2635498046875, 1.36444091796875, 1.46533203125, 1.56622314453125, 1.6671142578125, 1.76800537109375, 1.868896484375, 1.96978759765625, 2.0706787109375, 2.17156982421875, 2.2724609375, 2.37335205078125, 2.4742431640625, 2.57513427734375, 2.676025390625, 2.77691650390625, 2.8778076171875, 2.97869873046875, 3.07958984375, 3.18048095703125, 3.2813720703125, 3.38226318359375, 3.483154296875, 3.58404541015625, 3.6849365234375, 3.78582763671875, 3.88671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 10.0, 18.0, 23.0, 36.0, 79.0, 155.0, 367.0, 1090.0, 5472.0, 81161.0, 3732606.0, 357551.0, 13150.0, 1805.0, 439.0, 157.0, 77.0, 40.0, 22.0, 10.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9140625, -12.61846923828125, -12.3228759765625, -12.02728271484375, -11.731689453125, -11.43609619140625, -11.1405029296875, -10.84490966796875, -10.54931640625, -10.25372314453125, -9.9581298828125, -9.66253662109375, -9.366943359375, -9.07135009765625, -8.7757568359375, -8.48016357421875, -8.1845703125, -7.88897705078125, -7.5933837890625, -7.29779052734375, -7.002197265625, -6.70660400390625, -6.4110107421875, -6.11541748046875, -5.81982421875, -5.52423095703125, -5.2286376953125, -4.93304443359375, -4.637451171875, -4.34185791015625, -4.0462646484375, -3.75067138671875, -3.455078125, -3.15948486328125, -2.8638916015625, -2.56829833984375, -2.272705078125, -1.97711181640625, -1.6815185546875, -1.38592529296875, -1.09033203125, -0.79473876953125, -0.4991455078125, -0.20355224609375, 0.092041015625, 0.38763427734375, 0.6832275390625, 0.97882080078125, 1.2744140625, 1.57000732421875, 1.8656005859375, 2.16119384765625, 2.456787109375, 2.75238037109375, 3.0479736328125, 3.34356689453125, 3.63916015625, 3.93475341796875, 4.2303466796875, 4.52593994140625, 4.821533203125, 5.11712646484375, 5.4127197265625, 5.70831298828125, 6.00390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 19.0, 18.0, 41.0, 43.0, 70.0, 128.0, 214.0, 381.0, 711.0, 881.0, 676.0, 366.0, 201.0, 114.0, 66.0, 36.0, 18.0, 17.0, 16.0, 10.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3984375, -7.18365478515625, -6.9688720703125, -6.75408935546875, -6.539306640625, -6.32452392578125, -6.1097412109375, -5.89495849609375, -5.68017578125, -5.46539306640625, -5.2506103515625, -5.03582763671875, -4.821044921875, -4.60626220703125, -4.3914794921875, -4.17669677734375, -3.9619140625, -3.74713134765625, -3.5323486328125, -3.31756591796875, -3.102783203125, -2.88800048828125, -2.6732177734375, -2.45843505859375, -2.24365234375, -2.02886962890625, -1.8140869140625, -1.59930419921875, -1.384521484375, -1.16973876953125, -0.9549560546875, -0.74017333984375, -0.525390625, -0.31060791015625, -0.0958251953125, 0.11895751953125, 0.333740234375, 0.54852294921875, 0.7633056640625, 0.97808837890625, 1.19287109375, 1.40765380859375, 1.6224365234375, 1.83721923828125, 2.052001953125, 2.26678466796875, 2.4815673828125, 2.69635009765625, 2.9111328125, 3.12591552734375, 3.3406982421875, 3.55548095703125, 3.770263671875, 3.98504638671875, 4.1998291015625, 4.41461181640625, 4.62939453125, 4.84417724609375, 5.0589599609375, 5.27374267578125, 5.488525390625, 5.70330810546875, 5.9180908203125, 6.13287353515625, 6.34765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 13.0, 24.0, 51.0, 109.0, 201.0, 218.0, 216.0, 93.0, 38.0, 6.0, 14.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.858489990234375, -48.71120834350586, -46.563926696777344, -44.41664505004883, -42.26936340332031, -40.1220817565918, -37.97480010986328, -35.82752227783203, -33.68023681640625, -31.532955169677734, -29.38567352294922, -27.238391876220703, -25.091110229492188, -22.943828582763672, -20.79654884338379, -18.649267196655273, -16.50198745727539, -14.354705810546875, -12.20742416381836, -10.06014347076416, -7.9128618240356445, -5.765580177307129, -3.6182994842529297, -1.471017837524414, 0.6762638092041016, 2.823545217514038, 4.970826625823975, 7.118107795715332, 9.265389442443848, 11.412671089172363, 13.559951782226562, 15.707233428955078, 17.854515075683594, 20.00179672241211, 22.149078369140625, 24.29636001586914, 26.443641662597656, 28.590923309326172, 30.738203048706055, 32.88548278808594, 35.03276824951172, 37.180049896240234, 39.32733154296875, 41.474613189697266, 43.62189483642578, 45.7691764831543, 47.91645812988281, 50.06373596191406, 52.21101760864258, 54.358299255371094, 56.50558090209961, 58.652862548828125, 60.80014419555664, 62.947425842285156, 65.0947036743164, 67.24198913574219, 69.38926696777344, 71.53654479980469, 73.68383026123047, 75.83110809326172, 77.9783935546875, 80.12567138671875, 82.27295684814453, 84.42023468017578, 86.56752014160156]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 11.0, 8.0, 9.0, 22.0, 19.0, 31.0, 31.0, 45.0, 41.0, 57.0, 40.0, 49.0, 62.0, 45.0, 56.0, 52.0, 52.0, 43.0, 51.0, 40.0, 39.0, 34.0, 35.0, 16.0, 17.0, 10.0, 17.0, 6.0, 14.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.343591690063477, -20.335092544555664, -19.32659339904785, -18.31809425354004, -17.309593200683594, -16.30109405517578, -15.292594909667969, -14.284095764160156, -13.275596618652344, -12.267097473144531, -11.258598327636719, -10.25009822845459, -9.241599082946777, -8.233099937438965, -7.224600315093994, -6.216100692749023, -5.207601547241211, -4.199102401733398, -3.1906027793884277, -2.182103395462036, -1.1736040115356445, -0.16510486602783203, 0.8433947563171387, 1.8518943786621094, 2.860393524169922, 3.8688929080963135, 4.877392292022705, 5.885891914367676, 6.894391059875488, 7.902890205383301, 8.91139030456543, 9.919889450073242, 10.928386688232422, 11.936885833740234, 12.945384979248047, 13.953885078430176, 14.962384223937988, 15.9708833694458, 16.97938346862793, 17.987882614135742, 18.996381759643555, 20.004880905151367, 21.01338005065918, 22.021879196166992, 23.030380249023438, 24.03887939453125, 25.047378540039062, 26.055877685546875, 27.064376831054688, 28.0728759765625, 29.081375122070312, 30.089874267578125, 31.098373413085938, 32.10687255859375, 33.11537170410156, 34.123870849609375, 35.13236999511719, 36.140869140625, 37.14936828613281, 38.157867431640625, 39.16636657714844, 40.17486572265625, 41.18336486816406, 42.191864013671875, 43.20036697387695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 6.0, 11.0, 8.0, 31.0, 32.0, 49.0, 63.0, 83.0, 160.0, 239.0, 425.0, 879.0, 1914.0, 5882.0, 22054.0, 98475.0, 473583.0, 350035.0, 70499.0, 16344.0, 4518.0, 1596.0, 693.0, 366.0, 216.0, 115.0, 75.0, 57.0, 44.0, 30.0, 23.0, 7.0, 11.0, 9.0, 1.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.29669189453125, -7.0933837890625, -6.89007568359375, -6.686767578125, -6.48345947265625, -6.2801513671875, -6.07684326171875, -5.87353515625, -5.67022705078125, -5.4669189453125, -5.26361083984375, -5.060302734375, -4.85699462890625, -4.6536865234375, -4.45037841796875, -4.2470703125, -4.04376220703125, -3.8404541015625, -3.63714599609375, -3.433837890625, -3.23052978515625, -3.0272216796875, -2.82391357421875, -2.62060546875, -2.41729736328125, -2.2139892578125, -2.01068115234375, -1.807373046875, -1.60406494140625, -1.4007568359375, -1.19744873046875, -0.994140625, -0.79083251953125, -0.5875244140625, -0.38421630859375, -0.180908203125, 0.02239990234375, 0.2257080078125, 0.42901611328125, 0.63232421875, 0.83563232421875, 1.0389404296875, 1.24224853515625, 1.445556640625, 1.64886474609375, 1.8521728515625, 2.05548095703125, 2.2587890625, 2.46209716796875, 2.6654052734375, 2.86871337890625, 3.072021484375, 3.27532958984375, 3.4786376953125, 3.68194580078125, 3.88525390625, 4.08856201171875, 4.2918701171875, 4.49517822265625, 4.698486328125, 4.90179443359375, 5.1051025390625, 5.30841064453125, 5.51171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 9.0, 10.0, 7.0, 8.0, 12.0, 18.0, 19.0, 24.0, 23.0, 20.0, 28.0, 34.0, 44.0, 42.0, 56.0, 44.0, 46.0, 52.0, 53.0, 56.0, 63.0, 42.0, 39.0, 41.0, 38.0, 31.0, 21.0, 23.0, 19.0, 12.0, 15.0, 15.0, 14.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.44281005859375, -2.3582763671875, -2.27374267578125, -2.189208984375, -2.10467529296875, -2.0201416015625, -1.93560791015625, -1.85107421875, -1.76654052734375, -1.6820068359375, -1.59747314453125, -1.512939453125, -1.42840576171875, -1.3438720703125, -1.25933837890625, -1.1748046875, -1.09027099609375, -1.0057373046875, -0.92120361328125, -0.836669921875, -0.75213623046875, -0.6676025390625, -0.58306884765625, -0.49853515625, -0.41400146484375, -0.3294677734375, -0.24493408203125, -0.160400390625, -0.07586669921875, 0.0086669921875, 0.09320068359375, 0.177734375, 0.26226806640625, 0.3468017578125, 0.43133544921875, 0.515869140625, 0.60040283203125, 0.6849365234375, 0.76947021484375, 0.85400390625, 0.93853759765625, 1.0230712890625, 1.10760498046875, 1.192138671875, 1.27667236328125, 1.3612060546875, 1.44573974609375, 1.5302734375, 1.61480712890625, 1.6993408203125, 1.78387451171875, 1.868408203125, 1.95294189453125, 2.0374755859375, 2.12200927734375, 2.20654296875, 2.29107666015625, 2.3756103515625, 2.46014404296875, 2.544677734375, 2.62921142578125, 2.7137451171875, 2.79827880859375, 2.8828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 7.0, 12.0, 9.0, 14.0, 22.0, 20.0, 29.0, 43.0, 60.0, 93.0, 126.0, 223.0, 338.0, 549.0, 948.0, 1993.0, 5240.0, 22177.0, 254278.0, 708316.0, 40985.0, 7517.0, 2618.0, 1164.0, 664.0, 354.0, 245.0, 155.0, 89.0, 71.0, 44.0, 33.0, 26.0, 20.0, 13.0, 15.0, 11.0, 4.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.2890625, -11.9068603515625, -11.524658203125, -11.1424560546875, -10.76025390625, -10.3780517578125, -9.995849609375, -9.6136474609375, -9.2314453125, -8.8492431640625, -8.467041015625, -8.0848388671875, -7.70263671875, -7.3204345703125, -6.938232421875, -6.5560302734375, -6.173828125, -5.7916259765625, -5.409423828125, -5.0272216796875, -4.64501953125, -4.2628173828125, -3.880615234375, -3.4984130859375, -3.1162109375, -2.7340087890625, -2.351806640625, -1.9696044921875, -1.58740234375, -1.2052001953125, -0.822998046875, -0.4407958984375, -0.05859375, 0.3236083984375, 0.705810546875, 1.0880126953125, 1.47021484375, 1.8524169921875, 2.234619140625, 2.6168212890625, 2.9990234375, 3.3812255859375, 3.763427734375, 4.1456298828125, 4.52783203125, 4.9100341796875, 5.292236328125, 5.6744384765625, 6.056640625, 6.4388427734375, 6.821044921875, 7.2032470703125, 7.58544921875, 7.9676513671875, 8.349853515625, 8.7320556640625, 9.1142578125, 9.4964599609375, 9.878662109375, 10.2608642578125, 10.64306640625, 11.0252685546875, 11.407470703125, 11.7896728515625, 12.171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 10.0, 14.0, 15.0, 18.0, 20.0, 35.0, 51.0, 38.0, 61.0, 51.0, 77.0, 62.0, 59.0, 51.0, 55.0, 52.0, 48.0, 44.0, 43.0, 36.0, 30.0, 19.0, 25.0, 19.0, 9.0, 9.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.8671875, -11.4453125, -11.0234375, -10.6015625, -10.1796875, -9.7578125, -9.3359375, -8.9140625, -8.4921875, -8.0703125, -7.6484375, -7.2265625, -6.8046875, -6.3828125, -5.9609375, -5.5390625, -5.1171875, -4.6953125, -4.2734375, -3.8515625, -3.4296875, -3.0078125, -2.5859375, -2.1640625, -1.7421875, -1.3203125, -0.8984375, -0.4765625, -0.0546875, 0.3671875, 0.7890625, 1.2109375, 1.6328125, 2.0546875, 2.4765625, 2.8984375, 3.3203125, 3.7421875, 4.1640625, 4.5859375, 5.0078125, 5.4296875, 5.8515625, 6.2734375, 6.6953125, 7.1171875, 7.5390625, 7.9609375, 8.3828125, 8.8046875, 9.2265625, 9.6484375, 10.0703125, 10.4921875, 10.9140625, 11.3359375, 11.7578125, 12.1796875, 12.6015625, 13.0234375, 13.4453125, 13.8671875, 14.2890625, 14.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 6.0, 14.0, 27.0, 28.0, 38.0, 42.0, 85.0, 129.0, 203.0, 390.0, 745.0, 1631.0, 3859.0, 12637.0, 68643.0, 837964.0, 98725.0, 15056.0, 4413.0, 1861.0, 847.0, 445.0, 256.0, 159.0, 95.0, 60.0, 54.0, 27.0, 22.0, 20.0, 8.0, 15.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.83203125, -6.6285400390625, -6.425048828125, -6.2215576171875, -6.01806640625, -5.8145751953125, -5.611083984375, -5.4075927734375, -5.2041015625, -5.0006103515625, -4.797119140625, -4.5936279296875, -4.39013671875, -4.1866455078125, -3.983154296875, -3.7796630859375, -3.576171875, -3.3726806640625, -3.169189453125, -2.9656982421875, -2.76220703125, -2.5587158203125, -2.355224609375, -2.1517333984375, -1.9482421875, -1.7447509765625, -1.541259765625, -1.3377685546875, -1.13427734375, -0.9307861328125, -0.727294921875, -0.5238037109375, -0.3203125, -0.1168212890625, 0.086669921875, 0.2901611328125, 0.49365234375, 0.6971435546875, 0.900634765625, 1.1041259765625, 1.3076171875, 1.5111083984375, 1.714599609375, 1.9180908203125, 2.12158203125, 2.3250732421875, 2.528564453125, 2.7320556640625, 2.935546875, 3.1390380859375, 3.342529296875, 3.5460205078125, 3.74951171875, 3.9530029296875, 4.156494140625, 4.3599853515625, 4.5634765625, 4.7669677734375, 4.970458984375, 5.1739501953125, 5.37744140625, 5.5809326171875, 5.784423828125, 5.9879150390625, 6.19140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 7.0, 13.0, 16.0, 28.0, 33.0, 45.0, 71.0, 98.0, 310.0, 161.0, 74.0, 47.0, 32.0, 24.0, 10.0, 8.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00133514404296875, -0.001270383596420288, -0.0012056231498718262, -0.0011408627033233643, -0.0010761022567749023, -0.0010113418102264404, -0.0009465813636779785, -0.0008818209171295166, -0.0008170604705810547, -0.0007523000240325928, -0.0006875395774841309, -0.0006227791309356689, -0.000558018684387207, -0.0004932582378387451, -0.0004284977912902832, -0.0003637373447418213, -0.0002989768981933594, -0.00023421645164489746, -0.00016945600509643555, -0.00010469555854797363, -3.993511199951172e-05, 2.4825334548950195e-05, 8.958578109741211e-05, 0.00015434622764587402, 0.00021910667419433594, 0.00028386712074279785, 0.00034862756729125977, 0.0004133880138397217, 0.0004781484603881836, 0.0005429089069366455, 0.0006076693534851074, 0.0006724298000335693, 0.0007371902465820312, 0.0008019506931304932, 0.0008667111396789551, 0.000931471586227417, 0.000996232032775879, 0.0010609924793243408, 0.0011257529258728027, 0.0011905133724212646, 0.0012552738189697266, 0.0013200342655181885, 0.0013847947120666504, 0.0014495551586151123, 0.0015143156051635742, 0.0015790760517120361, 0.001643836498260498, 0.00170859694480896, 0.0017733573913574219, 0.0018381178379058838, 0.0019028782844543457, 0.0019676387310028076, 0.0020323991775512695, 0.0020971596240997314, 0.0021619200706481934, 0.0022266805171966553, 0.002291440963745117, 0.002356201410293579, 0.002420961856842041, 0.002485722303390503, 0.002550482749938965, 0.0026152431964874268, 0.0026800036430358887, 0.0027447640895843506, 0.0028095245361328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 8.0, 9.0, 4.0, 9.0, 23.0, 20.0, 27.0, 39.0, 59.0, 75.0, 92.0, 144.0, 202.0, 304.0, 516.0, 823.0, 1590.0, 3525.0, 9184.0, 29286.0, 217268.0, 715417.0, 47364.0, 13010.0, 4819.0, 2028.0, 1016.0, 546.0, 355.0, 223.0, 138.0, 117.0, 72.0, 52.0, 41.0, 41.0, 32.0, 22.0, 11.0, 7.0, 9.0, 10.0, 1.0, 7.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.1875, -5.0096435546875, -4.831787109375, -4.6539306640625, -4.47607421875, -4.2982177734375, -4.120361328125, -3.9425048828125, -3.7646484375, -3.5867919921875, -3.408935546875, -3.2310791015625, -3.05322265625, -2.8753662109375, -2.697509765625, -2.5196533203125, -2.341796875, -2.1639404296875, -1.986083984375, -1.8082275390625, -1.63037109375, -1.4525146484375, -1.274658203125, -1.0968017578125, -0.9189453125, -0.7410888671875, -0.563232421875, -0.3853759765625, -0.20751953125, -0.0296630859375, 0.148193359375, 0.3260498046875, 0.50390625, 0.6817626953125, 0.859619140625, 1.0374755859375, 1.21533203125, 1.3931884765625, 1.571044921875, 1.7489013671875, 1.9267578125, 2.1046142578125, 2.282470703125, 2.4603271484375, 2.63818359375, 2.8160400390625, 2.993896484375, 3.1717529296875, 3.349609375, 3.5274658203125, 3.705322265625, 3.8831787109375, 4.06103515625, 4.2388916015625, 4.416748046875, 4.5946044921875, 4.7724609375, 4.9503173828125, 5.128173828125, 5.3060302734375, 5.48388671875, 5.6617431640625, 5.839599609375, 6.0174560546875, 6.1953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 3.0, 6.0, 8.0, 9.0, 12.0, 21.0, 28.0, 26.0, 54.0, 106.0, 187.0, 187.0, 105.0, 58.0, 45.0, 38.0, 22.0, 9.0, 12.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 10.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.2578125, -7.05657958984375, -6.8553466796875, -6.65411376953125, -6.452880859375, -6.25164794921875, -6.0504150390625, -5.84918212890625, -5.64794921875, -5.44671630859375, -5.2454833984375, -5.04425048828125, -4.843017578125, -4.64178466796875, -4.4405517578125, -4.23931884765625, -4.0380859375, -3.83685302734375, -3.6356201171875, -3.43438720703125, -3.233154296875, -3.03192138671875, -2.8306884765625, -2.62945556640625, -2.42822265625, -2.22698974609375, -2.0257568359375, -1.82452392578125, -1.623291015625, -1.42205810546875, -1.2208251953125, -1.01959228515625, -0.818359375, -0.61712646484375, -0.4158935546875, -0.21466064453125, -0.013427734375, 0.18780517578125, 0.3890380859375, 0.59027099609375, 0.79150390625, 0.99273681640625, 1.1939697265625, 1.39520263671875, 1.596435546875, 1.79766845703125, 1.9989013671875, 2.20013427734375, 2.4013671875, 2.60260009765625, 2.8038330078125, 3.00506591796875, 3.206298828125, 3.40753173828125, 3.6087646484375, 3.80999755859375, 4.01123046875, 4.21246337890625, 4.4136962890625, 4.61492919921875, 4.816162109375, 5.01739501953125, 5.2186279296875, 5.41986083984375, 5.62109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 11.0, 34.0, 151.0, 422.0, 235.0, 99.0, 24.0, 5.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.61068725585938, -98.59862518310547, -93.58656311035156, -88.57450103759766, -83.56243896484375, -78.55038452148438, -73.53832244873047, -68.52626037597656, -63.514198303222656, -58.50213623046875, -53.490074157714844, -48.4780158996582, -43.4659538269043, -38.45389175415039, -33.44183349609375, -28.429771423339844, -23.417709350585938, -18.40564727783203, -13.393587112426758, -8.381525993347168, -3.369464874267578, 1.6425971984863281, 6.654657363891602, 11.666717529296875, 16.67877960205078, 21.690841674804688, 26.70290184020996, 31.714962005615234, 36.72702407836914, 41.73908615112305, 46.75114440917969, 51.763206481933594, 56.7752685546875, 61.787330627441406, 66.79939270019531, 71.81145477294922, 76.82351684570312, 81.8355712890625, 86.8476333618164, 91.85969543457031, 96.87175750732422, 101.88381958007812, 106.89588165283203, 111.90794372558594, 116.91999816894531, 121.93206787109375, 126.94412231445312, 131.9561767578125, 136.96824645996094, 141.9803009033203, 146.99237060546875, 152.00442504882812, 157.01649475097656, 162.02854919433594, 167.04061889648438, 172.05267333984375, 177.06472778320312, 182.0767822265625, 187.08885192871094, 192.1009063720703, 197.11297607421875, 202.12503051757812, 207.13710021972656, 212.14915466308594, 217.16122436523438]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 2.0, 12.0, 5.0, 8.0, 6.0, 16.0, 13.0, 12.0, 18.0, 13.0, 28.0, 28.0, 29.0, 26.0, 25.0, 36.0, 49.0, 54.0, 66.0, 81.0, 65.0, 60.0, 39.0, 43.0, 23.0, 32.0, 30.0, 25.0, 24.0, 17.0, 19.0, 21.0, 12.0, 10.0, 11.0, 11.0, 3.0, 9.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.980628967285156, -48.57236862182617, -47.16410827636719, -45.75585174560547, -44.347591400146484, -42.9393310546875, -41.531070709228516, -40.12281036376953, -38.71455383300781, -37.30629348754883, -35.898033142089844, -34.489776611328125, -33.08151626586914, -31.673255920410156, -30.264995574951172, -28.85673713684082, -27.448476791381836, -26.04021644592285, -24.6319580078125, -23.223697662353516, -21.815439224243164, -20.40717887878418, -18.998920440673828, -17.590660095214844, -16.18239974975586, -14.774140357971191, -13.365880966186523, -11.957620620727539, -10.549362182617188, -9.141101837158203, -7.732842445373535, -6.324583053588867, -4.916324615478516, -3.5080652236938477, -2.0998055934906006, -0.6915459632873535, 0.7167134284973145, 2.1249728202819824, 3.5332326889038086, 4.941492080688477, 6.3497514724731445, 7.7580108642578125, 9.16627025604248, 10.574529647827148, 11.982789993286133, 13.391048431396484, 14.799308776855469, 16.207569122314453, 17.615827560424805, 19.02408790588379, 20.43234634399414, 21.840606689453125, 23.248865127563477, 24.65712547302246, 26.065383911132812, 27.473644256591797, 28.88190460205078, 30.290164947509766, 31.698423385620117, 33.10668182373047, 34.51494216918945, 35.92320251464844, 37.33146286010742, 38.739723205566406, 40.147979736328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 7.0, 1.0, 4.0, 4.0, 8.0, 17.0, 20.0, 24.0, 36.0, 46.0, 99.0, 116.0, 190.0, 348.0, 675.0, 1433.0, 4167.0, 19417.0, 448021.0, 3583206.0, 118538.0, 12282.0, 3171.0, 1184.0, 526.0, 275.0, 146.0, 88.0, 68.0, 46.0, 28.0, 20.0, 15.0, 12.0, 13.0, 11.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.734375, -7.50238037109375, -7.2703857421875, -7.03839111328125, -6.806396484375, -6.57440185546875, -6.3424072265625, -6.11041259765625, -5.87841796875, -5.64642333984375, -5.4144287109375, -5.18243408203125, -4.950439453125, -4.71844482421875, -4.4864501953125, -4.25445556640625, -4.0224609375, -3.79046630859375, -3.5584716796875, -3.32647705078125, -3.094482421875, -2.86248779296875, -2.6304931640625, -2.39849853515625, -2.16650390625, -1.93450927734375, -1.7025146484375, -1.47052001953125, -1.238525390625, -1.00653076171875, -0.7745361328125, -0.54254150390625, -0.310546875, -0.07855224609375, 0.1534423828125, 0.38543701171875, 0.617431640625, 0.84942626953125, 1.0814208984375, 1.31341552734375, 1.54541015625, 1.77740478515625, 2.0093994140625, 2.24139404296875, 2.473388671875, 2.70538330078125, 2.9373779296875, 3.16937255859375, 3.4013671875, 3.63336181640625, 3.8653564453125, 4.09735107421875, 4.329345703125, 4.56134033203125, 4.7933349609375, 5.02532958984375, 5.25732421875, 5.48931884765625, 5.7213134765625, 5.95330810546875, 6.185302734375, 6.41729736328125, 6.6492919921875, 6.88128662109375, 7.11328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 13.0, 19.0, 20.0, 37.0, 46.0, 65.0, 64.0, 74.0, 72.0, 76.0, 73.0, 83.0, 70.0, 47.0, 47.0, 54.0, 26.0, 22.0, 25.0, 10.0, 16.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.95361328125, -3.8251953125, -3.69677734375, -3.568359375, -3.43994140625, -3.3115234375, -3.18310546875, -3.0546875, -2.92626953125, -2.7978515625, -2.66943359375, -2.541015625, -2.41259765625, -2.2841796875, -2.15576171875, -2.02734375, -1.89892578125, -1.7705078125, -1.64208984375, -1.513671875, -1.38525390625, -1.2568359375, -1.12841796875, -1.0, -0.87158203125, -0.7431640625, -0.61474609375, -0.486328125, -0.35791015625, -0.2294921875, -0.10107421875, 0.02734375, 0.15576171875, 0.2841796875, 0.41259765625, 0.541015625, 0.66943359375, 0.7978515625, 0.92626953125, 1.0546875, 1.18310546875, 1.3115234375, 1.43994140625, 1.568359375, 1.69677734375, 1.8251953125, 1.95361328125, 2.08203125, 2.21044921875, 2.3388671875, 2.46728515625, 2.595703125, 2.72412109375, 2.8525390625, 2.98095703125, 3.109375, 3.23779296875, 3.3662109375, 3.49462890625, 3.623046875, 3.75146484375, 3.8798828125, 4.00830078125, 4.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 21.0, 40.0, 64.0, 96.0, 141.0, 228.0, 349.0, 614.0, 1363.0, 3960.0, 38315.0, 3529754.0, 601900.0, 12927.0, 2490.0, 949.0, 484.0, 228.0, 134.0, 78.0, 43.0, 20.0, 17.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0], "bins": [-17.0625, -16.68182373046875, -16.3011474609375, -15.92047119140625, -15.539794921875, -15.15911865234375, -14.7784423828125, -14.39776611328125, -14.01708984375, -13.63641357421875, -13.2557373046875, -12.87506103515625, -12.494384765625, -12.11370849609375, -11.7330322265625, -11.35235595703125, -10.9716796875, -10.59100341796875, -10.2103271484375, -9.82965087890625, -9.448974609375, -9.06829833984375, -8.6876220703125, -8.30694580078125, -7.92626953125, -7.54559326171875, -7.1649169921875, -6.78424072265625, -6.403564453125, -6.02288818359375, -5.6422119140625, -5.26153564453125, -4.880859375, -4.50018310546875, -4.1195068359375, -3.73883056640625, -3.358154296875, -2.97747802734375, -2.5968017578125, -2.21612548828125, -1.83544921875, -1.45477294921875, -1.0740966796875, -0.69342041015625, -0.312744140625, 0.06793212890625, 0.4486083984375, 0.82928466796875, 1.2099609375, 1.59063720703125, 1.9713134765625, 2.35198974609375, 2.732666015625, 3.11334228515625, 3.4940185546875, 3.87469482421875, 4.25537109375, 4.63604736328125, 5.0167236328125, 5.39739990234375, 5.778076171875, 6.15875244140625, 6.5394287109375, 6.92010498046875, 7.30078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 26.0, 31.0, 66.0, 162.0, 396.0, 1194.0, 1341.0, 545.0, 172.0, 76.0, 32.0, 6.0, 13.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.4208984375, -15.005859375, -14.5908203125, -14.17578125, -13.7607421875, -13.345703125, -12.9306640625, -12.515625, -12.1005859375, -11.685546875, -11.2705078125, -10.85546875, -10.4404296875, -10.025390625, -9.6103515625, -9.1953125, -8.7802734375, -8.365234375, -7.9501953125, -7.53515625, -7.1201171875, -6.705078125, -6.2900390625, -5.875, -5.4599609375, -5.044921875, -4.6298828125, -4.21484375, -3.7998046875, -3.384765625, -2.9697265625, -2.5546875, -2.1396484375, -1.724609375, -1.3095703125, -0.89453125, -0.4794921875, -0.064453125, 0.3505859375, 0.765625, 1.1806640625, 1.595703125, 2.0107421875, 2.42578125, 2.8408203125, 3.255859375, 3.6708984375, 4.0859375, 4.5009765625, 4.916015625, 5.3310546875, 5.74609375, 6.1611328125, 6.576171875, 6.9912109375, 7.40625, 7.8212890625, 8.236328125, 8.6513671875, 9.06640625, 9.4814453125, 9.896484375, 10.3115234375, 10.7265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 12.0, 6.0, 44.0, 105.0, 246.0, 320.0, 180.0, 54.0, 16.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-195.37515258789062, -191.56857299804688, -187.7620086669922, -183.95542907714844, -180.14886474609375, -176.34228515625, -172.53570556640625, -168.72914123535156, -164.9225616455078, -161.11598205566406, -157.30941772460938, -153.50283813476562, -149.69627380371094, -145.8896942138672, -142.0831298828125, -138.27655029296875, -134.469970703125, -130.66339111328125, -126.85682678222656, -123.05024719238281, -119.2436752319336, -115.43710327148438, -111.63053131103516, -107.82395935058594, -104.01739501953125, -100.21082305908203, -96.40425109863281, -92.59767150878906, -88.79109954833984, -84.98452758789062, -81.1779556274414, -77.37138366699219, -73.56481170654297, -69.75823974609375, -65.95166778564453, -62.14509201049805, -58.33851623535156, -54.531944274902344, -50.725372314453125, -46.918800354003906, -43.11222457885742, -39.3056526184082, -35.49907684326172, -31.6925048828125, -27.88593101501465, -24.079357147216797, -20.272785186767578, -16.466211318969727, -12.659637451171875, -8.853063583374023, -5.046490669250488, -1.2399177551269531, 2.5666561126708984, 6.37322998046875, 10.179801940917969, 13.98637580871582, 17.792949676513672, 21.599523544311523, 25.406097412109375, 29.212669372558594, 33.01924133300781, 36.8258171081543, 40.632389068603516, 44.43896484375, 48.24553680419922]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 20.0, 28.0, 34.0, 59.0, 51.0, 65.0, 56.0, 63.0, 70.0, 92.0, 74.0, 58.0, 73.0, 52.0, 51.0, 34.0, 28.0, 14.0, 9.0, 12.0, 9.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.13494110107422, -41.48800277709961, -39.841068267822266, -38.194129943847656, -36.54719543457031, -34.9002571105957, -33.253318786621094, -31.606382369995117, -29.95944595336914, -28.312509536743164, -26.665573120117188, -25.018634796142578, -23.3716983795166, -21.724761962890625, -20.077823638916016, -18.43088722229004, -16.783950805664062, -15.137014389038086, -13.490077018737793, -11.8431396484375, -10.196203231811523, -8.549266815185547, -6.902329444885254, -5.255392074584961, -3.6084556579589844, -1.9615187644958496, -0.31458187103271484, 1.33235502243042, 2.9792919158935547, 4.626228332519531, 6.273165702819824, 7.920103073120117, 9.567039489746094, 11.21397590637207, 12.860913276672363, 14.507850646972656, 16.154787063598633, 17.80172348022461, 19.44866180419922, 21.095598220825195, 22.742534637451172, 24.38947105407715, 26.036407470703125, 27.683345794677734, 29.33028221130371, 30.977218627929688, 32.6241569519043, 34.271095275878906, 35.91802978515625, 37.56496810913086, 39.2119026184082, 40.85884094238281, 42.505775451660156, 44.152713775634766, 45.799652099609375, 47.44658660888672, 49.09352493286133, 50.74046325683594, 52.38739776611328, 54.03433609008789, 55.6812744140625, 57.328208923339844, 58.97514724731445, 60.62208557128906, 62.269020080566406]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 10.0, 14.0, 7.0, 17.0, 20.0, 27.0, 55.0, 104.0, 162.0, 296.0, 706.0, 2174.0, 9972.0, 93689.0, 805031.0, 120587.0, 11872.0, 2319.0, 733.0, 298.0, 153.0, 107.0, 61.0, 43.0, 28.0, 16.0, 14.0, 13.0, 7.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.1258544921875, -10.736083984375, -10.3463134765625, -9.95654296875, -9.5667724609375, -9.177001953125, -8.7872314453125, -8.3974609375, -8.0076904296875, -7.617919921875, -7.2281494140625, -6.83837890625, -6.4486083984375, -6.058837890625, -5.6690673828125, -5.279296875, -4.8895263671875, -4.499755859375, -4.1099853515625, -3.72021484375, -3.3304443359375, -2.940673828125, -2.5509033203125, -2.1611328125, -1.7713623046875, -1.381591796875, -0.9918212890625, -0.60205078125, -0.2122802734375, 0.177490234375, 0.5672607421875, 0.95703125, 1.3468017578125, 1.736572265625, 2.1263427734375, 2.51611328125, 2.9058837890625, 3.295654296875, 3.6854248046875, 4.0751953125, 4.4649658203125, 4.854736328125, 5.2445068359375, 5.63427734375, 6.0240478515625, 6.413818359375, 6.8035888671875, 7.193359375, 7.5831298828125, 7.972900390625, 8.3626708984375, 8.75244140625, 9.1422119140625, 9.531982421875, 9.9217529296875, 10.3115234375, 10.7012939453125, 11.091064453125, 11.4808349609375, 11.87060546875, 12.2603759765625, 12.650146484375, 13.0399169921875, 13.4296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 3.0, 11.0, 10.0, 17.0, 24.0, 26.0, 32.0, 37.0, 46.0, 38.0, 51.0, 59.0, 64.0, 51.0, 50.0, 67.0, 56.0, 51.0, 42.0, 51.0, 45.0, 27.0, 26.0, 23.0, 21.0, 14.0, 9.0, 15.0, 7.0, 5.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.66796875, -3.5662841796875, -3.464599609375, -3.3629150390625, -3.26123046875, -3.1595458984375, -3.057861328125, -2.9561767578125, -2.8544921875, -2.7528076171875, -2.651123046875, -2.5494384765625, -2.44775390625, -2.3460693359375, -2.244384765625, -2.1427001953125, -2.041015625, -1.9393310546875, -1.837646484375, -1.7359619140625, -1.63427734375, -1.5325927734375, -1.430908203125, -1.3292236328125, -1.2275390625, -1.1258544921875, -1.024169921875, -0.9224853515625, -0.82080078125, -0.7191162109375, -0.617431640625, -0.5157470703125, -0.4140625, -0.3123779296875, -0.210693359375, -0.1090087890625, -0.00732421875, 0.0943603515625, 0.196044921875, 0.2977294921875, 0.3994140625, 0.5010986328125, 0.602783203125, 0.7044677734375, 0.80615234375, 0.9078369140625, 1.009521484375, 1.1112060546875, 1.212890625, 1.3145751953125, 1.416259765625, 1.5179443359375, 1.61962890625, 1.7213134765625, 1.822998046875, 1.9246826171875, 2.0263671875, 2.1280517578125, 2.229736328125, 2.3314208984375, 2.43310546875, 2.5347900390625, 2.636474609375, 2.7381591796875, 2.83984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 4.0, 11.0, 17.0, 18.0, 38.0, 50.0, 59.0, 98.0, 142.0, 257.0, 434.0, 999.0, 2783.0, 10533.0, 87189.0, 885377.0, 48726.0, 7662.0, 2203.0, 863.0, 405.0, 262.0, 121.0, 89.0, 59.0, 32.0, 26.0, 23.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-18.640625, -18.046875, -17.453125, -16.859375, -16.265625, -15.671875, -15.078125, -14.484375, -13.890625, -13.296875, -12.703125, -12.109375, -11.515625, -10.921875, -10.328125, -9.734375, -9.140625, -8.546875, -7.953125, -7.359375, -6.765625, -6.171875, -5.578125, -4.984375, -4.390625, -3.796875, -3.203125, -2.609375, -2.015625, -1.421875, -0.828125, -0.234375, 0.359375, 0.953125, 1.546875, 2.140625, 2.734375, 3.328125, 3.921875, 4.515625, 5.109375, 5.703125, 6.296875, 6.890625, 7.484375, 8.078125, 8.671875, 9.265625, 9.859375, 10.453125, 11.046875, 11.640625, 12.234375, 12.828125, 13.421875, 14.015625, 14.609375, 15.203125, 15.796875, 16.390625, 16.984375, 17.578125, 18.171875, 18.765625, 19.359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 9.0, 3.0, 8.0, 8.0, 14.0, 13.0, 12.0, 17.0, 22.0, 29.0, 38.0, 43.0, 51.0, 62.0, 55.0, 58.0, 62.0, 48.0, 46.0, 57.0, 53.0, 48.0, 41.0, 42.0, 23.0, 17.0, 24.0, 18.0, 16.0, 13.0, 7.0, 11.0, 11.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.625, -11.224365234375, -10.82373046875, -10.423095703125, -10.0224609375, -9.621826171875, -9.22119140625, -8.820556640625, -8.419921875, -8.019287109375, -7.61865234375, -7.218017578125, -6.8173828125, -6.416748046875, -6.01611328125, -5.615478515625, -5.21484375, -4.814208984375, -4.41357421875, -4.012939453125, -3.6123046875, -3.211669921875, -2.81103515625, -2.410400390625, -2.009765625, -1.609130859375, -1.20849609375, -0.807861328125, -0.4072265625, -0.006591796875, 0.39404296875, 0.794677734375, 1.1953125, 1.595947265625, 1.99658203125, 2.397216796875, 2.7978515625, 3.198486328125, 3.59912109375, 3.999755859375, 4.400390625, 4.801025390625, 5.20166015625, 5.602294921875, 6.0029296875, 6.403564453125, 6.80419921875, 7.204833984375, 7.60546875, 8.006103515625, 8.40673828125, 8.807373046875, 9.2080078125, 9.608642578125, 10.00927734375, 10.409912109375, 10.810546875, 11.211181640625, 11.61181640625, 12.012451171875, 12.4130859375, 12.813720703125, 13.21435546875, 13.614990234375, 14.015625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 8.0, 13.0, 10.0, 13.0, 12.0, 19.0, 33.0, 52.0, 70.0, 81.0, 155.0, 272.0, 450.0, 915.0, 1996.0, 5728.0, 26253.0, 862633.0, 129320.0, 13615.0, 3722.0, 1438.0, 711.0, 352.0, 215.0, 131.0, 92.0, 60.0, 50.0, 24.0, 28.0, 20.0, 12.0, 10.0, 7.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.6090087890625, -13.218017578125, -12.8270263671875, -12.43603515625, -12.0450439453125, -11.654052734375, -11.2630615234375, -10.8720703125, -10.4810791015625, -10.090087890625, -9.6990966796875, -9.30810546875, -8.9171142578125, -8.526123046875, -8.1351318359375, -7.744140625, -7.3531494140625, -6.962158203125, -6.5711669921875, -6.18017578125, -5.7891845703125, -5.398193359375, -5.0072021484375, -4.6162109375, -4.2252197265625, -3.834228515625, -3.4432373046875, -3.05224609375, -2.6612548828125, -2.270263671875, -1.8792724609375, -1.48828125, -1.0972900390625, -0.706298828125, -0.3153076171875, 0.07568359375, 0.4666748046875, 0.857666015625, 1.2486572265625, 1.6396484375, 2.0306396484375, 2.421630859375, 2.8126220703125, 3.20361328125, 3.5946044921875, 3.985595703125, 4.3765869140625, 4.767578125, 5.1585693359375, 5.549560546875, 5.9405517578125, 6.33154296875, 6.7225341796875, 7.113525390625, 7.5045166015625, 7.8955078125, 8.2864990234375, 8.677490234375, 9.0684814453125, 9.45947265625, 9.8504638671875, 10.241455078125, 10.6324462890625, 11.0234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 11.0, 16.0, 24.0, 25.0, 68.0, 185.0, 354.0, 112.0, 49.0, 19.0, 29.0, 17.0, 17.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002838134765625, -0.0027576684951782227, -0.0026772022247314453, -0.002596735954284668, -0.0025162696838378906, -0.0024358034133911133, -0.002355337142944336, -0.0022748708724975586, -0.0021944046020507812, -0.002113938331604004, -0.0020334720611572266, -0.0019530057907104492, -0.0018725395202636719, -0.0017920732498168945, -0.0017116069793701172, -0.0016311407089233398, -0.0015506744384765625, -0.0014702081680297852, -0.0013897418975830078, -0.0013092756271362305, -0.0012288093566894531, -0.0011483430862426758, -0.0010678768157958984, -0.000987410545349121, -0.0009069442749023438, -0.0008264780044555664, -0.0007460117340087891, -0.0006655454635620117, -0.0005850791931152344, -0.000504612922668457, -0.0004241466522216797, -0.00034368038177490234, -0.000263214111328125, -0.00018274784088134766, -0.00010228157043457031, -2.181529998779297e-05, 5.8650970458984375e-05, 0.00013911724090576172, 0.00021958351135253906, 0.0003000497817993164, 0.00038051605224609375, 0.0004609823226928711, 0.0005414485931396484, 0.0006219148635864258, 0.0007023811340332031, 0.0007828474044799805, 0.0008633136749267578, 0.0009437799453735352, 0.0010242462158203125, 0.0011047124862670898, 0.0011851787567138672, 0.0012656450271606445, 0.0013461112976074219, 0.0014265775680541992, 0.0015070438385009766, 0.001587510108947754, 0.0016679763793945312, 0.0017484426498413086, 0.001828908920288086, 0.0019093751907348633, 0.0019898414611816406, 0.002070307731628418, 0.0021507740020751953, 0.0022312402725219727, 0.00231170654296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 8.0, 6.0, 11.0, 20.0, 23.0, 40.0, 58.0, 101.0, 155.0, 245.0, 450.0, 843.0, 2140.0, 6380.0, 26852.0, 758839.0, 224501.0, 19390.0, 5014.0, 1708.0, 793.0, 420.0, 223.0, 119.0, 80.0, 47.0, 25.0, 17.0, 8.0, 16.0, 6.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5859375, -8.2410888671875, -7.896240234375, -7.5513916015625, -7.20654296875, -6.8616943359375, -6.516845703125, -6.1719970703125, -5.8271484375, -5.4822998046875, -5.137451171875, -4.7926025390625, -4.44775390625, -4.1029052734375, -3.758056640625, -3.4132080078125, -3.068359375, -2.7235107421875, -2.378662109375, -2.0338134765625, -1.68896484375, -1.3441162109375, -0.999267578125, -0.6544189453125, -0.3095703125, 0.0352783203125, 0.380126953125, 0.7249755859375, 1.06982421875, 1.4146728515625, 1.759521484375, 2.1043701171875, 2.44921875, 2.7940673828125, 3.138916015625, 3.4837646484375, 3.82861328125, 4.1734619140625, 4.518310546875, 4.8631591796875, 5.2080078125, 5.5528564453125, 5.897705078125, 6.2425537109375, 6.58740234375, 6.9322509765625, 7.277099609375, 7.6219482421875, 7.966796875, 8.3116455078125, 8.656494140625, 9.0013427734375, 9.34619140625, 9.6910400390625, 10.035888671875, 10.3807373046875, 10.7255859375, 11.0704345703125, 11.415283203125, 11.7601318359375, 12.10498046875, 12.4498291015625, 12.794677734375, 13.1395263671875, 13.484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 7.0, 4.0, 3.0, 13.0, 5.0, 11.0, 24.0, 14.0, 31.0, 50.0, 77.0, 192.0, 211.0, 133.0, 68.0, 22.0, 27.0, 13.0, 11.0, 13.0, 11.0, 10.0, 4.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.77734375, -7.55596923828125, -7.3345947265625, -7.11322021484375, -6.891845703125, -6.67047119140625, -6.4490966796875, -6.22772216796875, -6.00634765625, -5.78497314453125, -5.5635986328125, -5.34222412109375, -5.120849609375, -4.89947509765625, -4.6781005859375, -4.45672607421875, -4.2353515625, -4.01397705078125, -3.7926025390625, -3.57122802734375, -3.349853515625, -3.12847900390625, -2.9071044921875, -2.68572998046875, -2.46435546875, -2.24298095703125, -2.0216064453125, -1.80023193359375, -1.578857421875, -1.35748291015625, -1.1361083984375, -0.91473388671875, -0.693359375, -0.47198486328125, -0.2506103515625, -0.02923583984375, 0.192138671875, 0.41351318359375, 0.6348876953125, 0.85626220703125, 1.07763671875, 1.29901123046875, 1.5203857421875, 1.74176025390625, 1.963134765625, 2.18450927734375, 2.4058837890625, 2.62725830078125, 2.8486328125, 3.07000732421875, 3.2913818359375, 3.51275634765625, 3.734130859375, 3.95550537109375, 4.1768798828125, 4.39825439453125, 4.61962890625, 4.84100341796875, 5.0623779296875, 5.28375244140625, 5.505126953125, 5.72650146484375, 5.9478759765625, 6.16925048828125, 6.390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 18.0, 67.0, 285.0, 430.0, 115.0, 30.0, 19.0, 6.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-275.3036193847656, -268.6140441894531, -261.9244384765625, -255.23484802246094, -248.54525756835938, -241.85568237304688, -235.1660919189453, -228.47650146484375, -221.7869110107422, -215.09732055664062, -208.40773010253906, -201.7181396484375, -195.028564453125, -188.33895874023438, -181.64938354492188, -174.9597930908203, -168.27020263671875, -161.5806121826172, -154.89102172851562, -148.20143127441406, -141.5118408203125, -134.822265625, -128.13267517089844, -121.44308471679688, -114.75349426269531, -108.06390380859375, -101.37431335449219, -94.68473052978516, -87.9951400756836, -81.30554962158203, -74.615966796875, -67.92637634277344, -61.236785888671875, -54.54719543457031, -47.857608795166016, -41.16802215576172, -34.478431701660156, -27.788841247558594, -21.099254608154297, -14.40966796875, -7.7200775146484375, -1.0304889678955078, 5.659099578857422, 12.348688125610352, 19.03827667236328, 25.727867126464844, 32.41745376586914, 39.10704040527344, 45.796630859375, 52.48622131347656, 59.17580795288086, 65.86539459228516, 72.55498504638672, 79.24457550048828, 85.93415832519531, 92.62374877929688, 99.31333923339844, 106.0029296875, 112.69252014160156, 119.3821029663086, 126.07169342041016, 132.76129150390625, 139.45086669921875, 146.1404571533203, 152.83004760742188]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 15.0, 23.0, 34.0, 37.0, 56.0, 50.0, 60.0, 83.0, 125.0, 135.0, 82.0, 72.0, 66.0, 38.0, 30.0, 24.0, 24.0, 22.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.81681442260742, -59.843170166015625, -56.86952590942383, -53.89588165283203, -50.92223358154297, -47.94859313964844, -44.974945068359375, -42.00130081176758, -39.02765655517578, -36.054012298583984, -33.08036804199219, -30.106721878051758, -27.13307762145996, -24.159433364868164, -21.185787200927734, -18.212142944335938, -15.23849868774414, -12.264854431152344, -9.29120922088623, -6.317564010620117, -3.3439197540283203, -0.37027549743652344, 2.6033706665039062, 5.577014923095703, 8.5506591796875, 11.524303436279297, 14.49794864654541, 17.471593856811523, 20.44523811340332, 23.418882369995117, 26.392528533935547, 29.366172790527344, 32.339813232421875, 35.31345748901367, 38.28710174560547, 41.26074981689453, 44.23439025878906, 47.208038330078125, 50.18168258666992, 53.15532684326172, 56.128971099853516, 59.10261535644531, 62.07625961303711, 65.0499038696289, 68.02355194091797, 70.9971923828125, 73.97084045410156, 76.94448852539062, 79.91812896728516, 82.89177703857422, 85.86541748046875, 88.83906555175781, 91.81270599365234, 94.7863540649414, 97.75999450683594, 100.733642578125, 103.70729064941406, 106.68093872070312, 109.65457916259766, 112.62822723388672, 115.60186767578125, 118.57551574707031, 121.54916381835938, 124.5228042602539, 127.49644470214844]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 4.0, 8.0, 13.0, 15.0, 20.0, 50.0, 70.0, 181.0, 535.0, 1544.0, 5526.0, 127465.0, 4035469.0, 19473.0, 2483.0, 782.0, 273.0, 151.0, 74.0, 45.0, 24.0, 12.0, 19.0, 8.0, 8.0, 13.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.52099609375, -21.9169921875, -21.31298828125, -20.708984375, -20.10498046875, -19.5009765625, -18.89697265625, -18.29296875, -17.68896484375, -17.0849609375, -16.48095703125, -15.876953125, -15.27294921875, -14.6689453125, -14.06494140625, -13.4609375, -12.85693359375, -12.2529296875, -11.64892578125, -11.044921875, -10.44091796875, -9.8369140625, -9.23291015625, -8.62890625, -8.02490234375, -7.4208984375, -6.81689453125, -6.212890625, -5.60888671875, -5.0048828125, -4.40087890625, -3.796875, -3.19287109375, -2.5888671875, -1.98486328125, -1.380859375, -0.77685546875, -0.1728515625, 0.43115234375, 1.03515625, 1.63916015625, 2.2431640625, 2.84716796875, 3.451171875, 4.05517578125, 4.6591796875, 5.26318359375, 5.8671875, 6.47119140625, 7.0751953125, 7.67919921875, 8.283203125, 8.88720703125, 9.4912109375, 10.09521484375, 10.69921875, 11.30322265625, 11.9072265625, 12.51123046875, 13.115234375, 13.71923828125, 14.3232421875, 14.92724609375, 15.53125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 19.0, 42.0, 87.0, 127.0, 172.0, 195.0, 147.0, 112.0, 48.0, 35.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.46795654296875, -5.1507568359375, -4.83355712890625, -4.516357421875, -4.19915771484375, -3.8819580078125, -3.56475830078125, -3.24755859375, -2.93035888671875, -2.6131591796875, -2.29595947265625, -1.978759765625, -1.66156005859375, -1.3443603515625, -1.02716064453125, -0.7099609375, -0.39276123046875, -0.0755615234375, 0.24163818359375, 0.558837890625, 0.87603759765625, 1.1932373046875, 1.51043701171875, 1.82763671875, 2.14483642578125, 2.4620361328125, 2.77923583984375, 3.096435546875, 3.41363525390625, 3.7308349609375, 4.04803466796875, 4.365234375, 4.68243408203125, 4.9996337890625, 5.31683349609375, 5.634033203125, 5.95123291015625, 6.2684326171875, 6.58563232421875, 6.90283203125, 7.22003173828125, 7.5372314453125, 7.85443115234375, 8.171630859375, 8.48883056640625, 8.8060302734375, 9.12322998046875, 9.4404296875, 9.75762939453125, 10.0748291015625, 10.39202880859375, 10.709228515625, 11.02642822265625, 11.3436279296875, 11.66082763671875, 11.97802734375, 12.29522705078125, 12.6124267578125, 12.92962646484375, 13.246826171875, 13.56402587890625, 13.8812255859375, 14.19842529296875, 14.515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 14.0, 32.0, 35.0, 52.0, 89.0, 165.0, 282.0, 544.0, 1127.0, 2829.0, 11057.0, 2719725.0, 1444471.0, 9566.0, 2302.0, 998.0, 452.0, 205.0, 120.0, 71.0, 36.0, 26.0, 32.0, 14.0, 4.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.265625, -23.55126953125, -22.8369140625, -22.12255859375, -21.408203125, -20.69384765625, -19.9794921875, -19.26513671875, -18.55078125, -17.83642578125, -17.1220703125, -16.40771484375, -15.693359375, -14.97900390625, -14.2646484375, -13.55029296875, -12.8359375, -12.12158203125, -11.4072265625, -10.69287109375, -9.978515625, -9.26416015625, -8.5498046875, -7.83544921875, -7.12109375, -6.40673828125, -5.6923828125, -4.97802734375, -4.263671875, -3.54931640625, -2.8349609375, -2.12060546875, -1.40625, -0.69189453125, 0.0224609375, 0.73681640625, 1.451171875, 2.16552734375, 2.8798828125, 3.59423828125, 4.30859375, 5.02294921875, 5.7373046875, 6.45166015625, 7.166015625, 7.88037109375, 8.5947265625, 9.30908203125, 10.0234375, 10.73779296875, 11.4521484375, 12.16650390625, 12.880859375, 13.59521484375, 14.3095703125, 15.02392578125, 15.73828125, 16.45263671875, 17.1669921875, 17.88134765625, 18.595703125, 19.31005859375, 20.0244140625, 20.73876953125, 21.453125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 14.0, 20.0, 49.0, 127.0, 467.0, 1627.0, 1272.0, 313.0, 104.0, 32.0, 17.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.0625, -17.51318359375, -16.9638671875, -16.41455078125, -15.865234375, -15.31591796875, -14.7666015625, -14.21728515625, -13.66796875, -13.11865234375, -12.5693359375, -12.02001953125, -11.470703125, -10.92138671875, -10.3720703125, -9.82275390625, -9.2734375, -8.72412109375, -8.1748046875, -7.62548828125, -7.076171875, -6.52685546875, -5.9775390625, -5.42822265625, -4.87890625, -4.32958984375, -3.7802734375, -3.23095703125, -2.681640625, -2.13232421875, -1.5830078125, -1.03369140625, -0.484375, 0.06494140625, 0.6142578125, 1.16357421875, 1.712890625, 2.26220703125, 2.8115234375, 3.36083984375, 3.91015625, 4.45947265625, 5.0087890625, 5.55810546875, 6.107421875, 6.65673828125, 7.2060546875, 7.75537109375, 8.3046875, 8.85400390625, 9.4033203125, 9.95263671875, 10.501953125, 11.05126953125, 11.6005859375, 12.14990234375, 12.69921875, 13.24853515625, 13.7978515625, 14.34716796875, 14.896484375, 15.44580078125, 15.9951171875, 16.54443359375, 17.09375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 13.0, 31.0, 133.0, 394.0, 330.0, 67.0, 11.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.2802734375, -201.16709899902344, -195.05392456054688, -188.94076538085938, -182.8275909423828, -176.71441650390625, -170.6012420654297, -164.48806762695312, -158.37489318847656, -152.26171875, -146.14854431152344, -140.03536987304688, -133.92221069335938, -127.80903625488281, -121.69586181640625, -115.58268737792969, -109.46952056884766, -103.3563461303711, -97.24317932128906, -91.1300048828125, -85.01683044433594, -78.90365600585938, -72.79048919677734, -66.67731475830078, -60.564144134521484, -54.45097351074219, -48.337799072265625, -42.22462844848633, -36.11145782470703, -29.99828338623047, -23.885112762451172, -17.77193832397461, -11.658767700195312, -5.545595645904541, 0.5675764083862305, 6.680747985839844, 12.793920516967773, 18.907093048095703, 25.020263671875, 31.133438110351562, 37.24660873413086, 43.359779357910156, 49.47295379638672, 55.586124420166016, 61.69929504394531, 67.81246948242188, 73.92564392089844, 80.038818359375, 86.15198516845703, 92.2651596069336, 98.37832641601562, 104.49150085449219, 110.60467529296875, 116.71784973144531, 122.83101654052734, 128.94418334960938, 135.05735778808594, 141.1705322265625, 147.28370666503906, 153.39688110351562, 159.51004028320312, 165.6232147216797, 171.73638916015625, 177.8495635986328, 183.96273803710938]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 17.0, 21.0, 45.0, 75.0, 113.0, 168.0, 154.0, 127.0, 124.0, 93.0, 33.0, 15.0, 10.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.62494659423828, -86.30365753173828, -82.98236083984375, -79.66107177734375, -76.33978271484375, -73.01849365234375, -69.69719696044922, -66.37590789794922, -63.05461502075195, -59.73332214355469, -56.41203308105469, -53.09074020385742, -49.769447326660156, -46.448158264160156, -43.12686538696289, -39.805572509765625, -36.484283447265625, -33.16299057006836, -29.84170150756836, -26.520408630371094, -23.19911766052246, -19.877826690673828, -16.556533813476562, -13.23524284362793, -9.913951873779297, -6.592660427093506, -3.271368980407715, 0.049922943115234375, 3.371213912963867, 6.6925048828125, 10.013797760009766, 13.335088729858398, 16.656387329101562, 19.977678298950195, 23.298969268798828, 26.620262145996094, 29.941553115844727, 33.26284408569336, 36.584136962890625, 39.905426025390625, 43.22671890258789, 46.548011779785156, 49.869300842285156, 53.19059371948242, 56.51188659667969, 59.83317565917969, 63.15446853637695, 66.47576141357422, 69.79705047607422, 73.11833953857422, 76.43963623046875, 79.76092529296875, 83.08221435546875, 86.40350341796875, 89.72480010986328, 93.04608917236328, 96.36738586425781, 99.68867492675781, 103.00997161865234, 106.33126068115234, 109.65254974365234, 112.97384643554688, 116.29513549804688, 119.61642456054688, 122.93771362304688]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 6.0, 9.0, 9.0, 18.0, 22.0, 23.0, 39.0, 61.0, 77.0, 82.0, 151.0, 272.0, 510.0, 1108.0, 3276.0, 18571.0, 260432.0, 701620.0, 52344.0, 6600.0, 1666.0, 699.0, 334.0, 189.0, 123.0, 77.0, 64.0, 45.0, 28.0, 21.0, 16.0, 14.0, 9.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.4180908203125, -8.070556640625, -7.7230224609375, -7.37548828125, -7.0279541015625, -6.680419921875, -6.3328857421875, -5.9853515625, -5.6378173828125, -5.290283203125, -4.9427490234375, -4.59521484375, -4.2476806640625, -3.900146484375, -3.5526123046875, -3.205078125, -2.8575439453125, -2.510009765625, -2.1624755859375, -1.81494140625, -1.4674072265625, -1.119873046875, -0.7723388671875, -0.4248046875, -0.0772705078125, 0.270263671875, 0.6177978515625, 0.96533203125, 1.3128662109375, 1.660400390625, 2.0079345703125, 2.35546875, 2.7030029296875, 3.050537109375, 3.3980712890625, 3.74560546875, 4.0931396484375, 4.440673828125, 4.7882080078125, 5.1357421875, 5.4832763671875, 5.830810546875, 6.1783447265625, 6.52587890625, 6.8734130859375, 7.220947265625, 7.5684814453125, 7.916015625, 8.2635498046875, 8.611083984375, 8.9586181640625, 9.30615234375, 9.6536865234375, 10.001220703125, 10.3487548828125, 10.6962890625, 11.0438232421875, 11.391357421875, 11.7388916015625, 12.08642578125, 12.4339599609375, 12.781494140625, 13.1290283203125, 13.4765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 18.0, 45.0, 70.0, 111.0, 139.0, 161.0, 153.0, 122.0, 78.0, 58.0, 25.0, 10.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.726806640625, -5.42236328125, -5.117919921875, -4.8134765625, -4.509033203125, -4.20458984375, -3.900146484375, -3.595703125, -3.291259765625, -2.98681640625, -2.682373046875, -2.3779296875, -2.073486328125, -1.76904296875, -1.464599609375, -1.16015625, -0.855712890625, -0.55126953125, -0.246826171875, 0.0576171875, 0.362060546875, 0.66650390625, 0.970947265625, 1.275390625, 1.579833984375, 1.88427734375, 2.188720703125, 2.4931640625, 2.797607421875, 3.10205078125, 3.406494140625, 3.7109375, 4.015380859375, 4.31982421875, 4.624267578125, 4.9287109375, 5.233154296875, 5.53759765625, 5.842041015625, 6.146484375, 6.450927734375, 6.75537109375, 7.059814453125, 7.3642578125, 7.668701171875, 7.97314453125, 8.277587890625, 8.58203125, 8.886474609375, 9.19091796875, 9.495361328125, 9.7998046875, 10.104248046875, 10.40869140625, 10.713134765625, 11.017578125, 11.322021484375, 11.62646484375, 11.930908203125, 12.2353515625, 12.539794921875, 12.84423828125, 13.148681640625, 13.453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 0.0, 5.0, 7.0, 10.0, 15.0, 18.0, 28.0, 39.0, 53.0, 82.0, 140.0, 205.0, 427.0, 910.0, 2223.0, 6295.0, 25710.0, 204307.0, 708422.0, 79179.0, 13591.0, 3881.0, 1472.0, 691.0, 340.0, 185.0, 106.0, 56.0, 44.0, 22.0, 36.0, 10.0, 13.0, 7.0, 4.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.233642578125, -9.95166015625, -9.669677734375, -9.3876953125, -9.105712890625, -8.82373046875, -8.541748046875, -8.259765625, -7.977783203125, -7.69580078125, -7.413818359375, -7.1318359375, -6.849853515625, -6.56787109375, -6.285888671875, -6.00390625, -5.721923828125, -5.43994140625, -5.157958984375, -4.8759765625, -4.593994140625, -4.31201171875, -4.030029296875, -3.748046875, -3.466064453125, -3.18408203125, -2.902099609375, -2.6201171875, -2.338134765625, -2.05615234375, -1.774169921875, -1.4921875, -1.210205078125, -0.92822265625, -0.646240234375, -0.3642578125, -0.082275390625, 0.19970703125, 0.481689453125, 0.763671875, 1.045654296875, 1.32763671875, 1.609619140625, 1.8916015625, 2.173583984375, 2.45556640625, 2.737548828125, 3.01953125, 3.301513671875, 3.58349609375, 3.865478515625, 4.1474609375, 4.429443359375, 4.71142578125, 4.993408203125, 5.275390625, 5.557373046875, 5.83935546875, 6.121337890625, 6.4033203125, 6.685302734375, 6.96728515625, 7.249267578125, 7.53125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 11.0, 9.0, 13.0, 12.0, 32.0, 28.0, 26.0, 45.0, 64.0, 59.0, 53.0, 60.0, 60.0, 66.0, 54.0, 60.0, 54.0, 56.0, 40.0, 33.0, 24.0, 20.0, 20.0, 21.0, 20.0, 13.0, 8.0, 7.0, 2.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.328125, -16.8753662109375, -16.422607421875, -15.9698486328125, -15.51708984375, -15.0643310546875, -14.611572265625, -14.1588134765625, -13.7060546875, -13.2532958984375, -12.800537109375, -12.3477783203125, -11.89501953125, -11.4422607421875, -10.989501953125, -10.5367431640625, -10.083984375, -9.6312255859375, -9.178466796875, -8.7257080078125, -8.27294921875, -7.8201904296875, -7.367431640625, -6.9146728515625, -6.4619140625, -6.0091552734375, -5.556396484375, -5.1036376953125, -4.65087890625, -4.1981201171875, -3.745361328125, -3.2926025390625, -2.83984375, -2.3870849609375, -1.934326171875, -1.4815673828125, -1.02880859375, -0.5760498046875, -0.123291015625, 0.3294677734375, 0.7822265625, 1.2349853515625, 1.687744140625, 2.1405029296875, 2.59326171875, 3.0460205078125, 3.498779296875, 3.9515380859375, 4.404296875, 4.8570556640625, 5.309814453125, 5.7625732421875, 6.21533203125, 6.6680908203125, 7.120849609375, 7.5736083984375, 8.0263671875, 8.4791259765625, 8.931884765625, 9.3846435546875, 9.83740234375, 10.2901611328125, 10.742919921875, 11.1956787109375, 11.6484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 13.0, 7.0, 28.0, 45.0, 134.0, 201.0, 479.0, 1383.0, 4603.0, 24953.0, 760008.0, 237176.0, 14534.0, 3173.0, 1047.0, 409.0, 166.0, 74.0, 55.0, 25.0, 15.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.814208984375, -5.61279296875, -5.411376953125, -5.2099609375, -5.008544921875, -4.80712890625, -4.605712890625, -4.404296875, -4.202880859375, -4.00146484375, -3.800048828125, -3.5986328125, -3.397216796875, -3.19580078125, -2.994384765625, -2.79296875, -2.591552734375, -2.39013671875, -2.188720703125, -1.9873046875, -1.785888671875, -1.58447265625, -1.383056640625, -1.181640625, -0.980224609375, -0.77880859375, -0.577392578125, -0.3759765625, -0.174560546875, 0.02685546875, 0.228271484375, 0.4296875, 0.631103515625, 0.83251953125, 1.033935546875, 1.2353515625, 1.436767578125, 1.63818359375, 1.839599609375, 2.041015625, 2.242431640625, 2.44384765625, 2.645263671875, 2.8466796875, 3.048095703125, 3.24951171875, 3.450927734375, 3.65234375, 3.853759765625, 4.05517578125, 4.256591796875, 4.4580078125, 4.659423828125, 4.86083984375, 5.062255859375, 5.263671875, 5.465087890625, 5.66650390625, 5.867919921875, 6.0693359375, 6.270751953125, 6.47216796875, 6.673583984375, 6.875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 19.0, 30.0, 40.0, 60.0, 100.0, 166.0, 196.0, 139.0, 78.0, 49.0, 31.0, 14.0, 16.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011043548583984375, -0.0010690689086914062, -0.001033782958984375, -0.0009984970092773438, -0.0009632110595703125, -0.0009279251098632812, -0.00089263916015625, -0.0008573532104492188, -0.0008220672607421875, -0.0007867813110351562, -0.000751495361328125, -0.0007162094116210938, -0.0006809234619140625, -0.0006456375122070312, -0.0006103515625, -0.0005750656127929688, -0.0005397796630859375, -0.0005044937133789062, -0.000469207763671875, -0.00043392181396484375, -0.0003986358642578125, -0.00036334991455078125, -0.00032806396484375, -0.00029277801513671875, -0.0002574920654296875, -0.00022220611572265625, -0.000186920166015625, -0.00015163421630859375, -0.0001163482666015625, -8.106231689453125e-05, -4.57763671875e-05, -1.049041748046875e-05, 2.47955322265625e-05, 6.008148193359375e-05, 9.5367431640625e-05, 0.00013065338134765625, 0.0001659393310546875, 0.00020122528076171875, 0.00023651123046875, 0.00027179718017578125, 0.0003070831298828125, 0.00034236907958984375, 0.000377655029296875, 0.00041294097900390625, 0.0004482269287109375, 0.00048351287841796875, 0.000518798828125, 0.0005540847778320312, 0.0005893707275390625, 0.0006246566772460938, 0.000659942626953125, 0.0006952285766601562, 0.0007305145263671875, 0.0007658004760742188, 0.00080108642578125, 0.0008363723754882812, 0.0008716583251953125, 0.0009069442749023438, 0.000942230224609375, 0.0009775161743164062, 0.0010128021240234375, 0.0010480880737304688, 0.0010833740234375, 0.0011186599731445312, 0.0011539459228515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 5.0, 11.0, 17.0, 25.0, 42.0, 53.0, 95.0, 144.0, 218.0, 408.0, 629.0, 1195.0, 2525.0, 5976.0, 17726.0, 88137.0, 707480.0, 180097.0, 28830.0, 8328.0, 3184.0, 1506.0, 724.0, 466.0, 288.0, 156.0, 97.0, 53.0, 35.0, 33.0, 17.0, 9.0, 11.0, 4.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.00390625, -3.888427734375, -3.77294921875, -3.657470703125, -3.5419921875, -3.426513671875, -3.31103515625, -3.195556640625, -3.080078125, -2.964599609375, -2.84912109375, -2.733642578125, -2.6181640625, -2.502685546875, -2.38720703125, -2.271728515625, -2.15625, -2.040771484375, -1.92529296875, -1.809814453125, -1.6943359375, -1.578857421875, -1.46337890625, -1.347900390625, -1.232421875, -1.116943359375, -1.00146484375, -0.885986328125, -0.7705078125, -0.655029296875, -0.53955078125, -0.424072265625, -0.30859375, -0.193115234375, -0.07763671875, 0.037841796875, 0.1533203125, 0.268798828125, 0.38427734375, 0.499755859375, 0.615234375, 0.730712890625, 0.84619140625, 0.961669921875, 1.0771484375, 1.192626953125, 1.30810546875, 1.423583984375, 1.5390625, 1.654541015625, 1.77001953125, 1.885498046875, 2.0009765625, 2.116455078125, 2.23193359375, 2.347412109375, 2.462890625, 2.578369140625, 2.69384765625, 2.809326171875, 2.9248046875, 3.040283203125, 3.15576171875, 3.271240234375, 3.38671875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 7.0, 8.0, 7.0, 16.0, 21.0, 28.0, 46.0, 59.0, 59.0, 79.0, 108.0, 102.0, 92.0, 95.0, 48.0, 45.0, 35.0, 38.0, 19.0, 13.0, 14.0, 15.0, 3.0, 3.0, 4.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.0338134765625, -2.940673828125, -2.8475341796875, -2.75439453125, -2.6612548828125, -2.568115234375, -2.4749755859375, -2.3818359375, -2.2886962890625, -2.195556640625, -2.1024169921875, -2.00927734375, -1.9161376953125, -1.822998046875, -1.7298583984375, -1.63671875, -1.5435791015625, -1.450439453125, -1.3572998046875, -1.26416015625, -1.1710205078125, -1.077880859375, -0.9847412109375, -0.8916015625, -0.7984619140625, -0.705322265625, -0.6121826171875, -0.51904296875, -0.4259033203125, -0.332763671875, -0.2396240234375, -0.146484375, -0.0533447265625, 0.039794921875, 0.1329345703125, 0.22607421875, 0.3192138671875, 0.412353515625, 0.5054931640625, 0.5986328125, 0.6917724609375, 0.784912109375, 0.8780517578125, 0.97119140625, 1.0643310546875, 1.157470703125, 1.2506103515625, 1.34375, 1.4368896484375, 1.530029296875, 1.6231689453125, 1.71630859375, 1.8094482421875, 1.902587890625, 1.9957275390625, 2.0888671875, 2.1820068359375, 2.275146484375, 2.3682861328125, 2.46142578125, 2.5545654296875, 2.647705078125, 2.7408447265625, 2.833984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 15.0, 26.0, 102.0, 336.0, 363.0, 107.0, 29.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-150.0928192138672, -145.80345153808594, -141.51406860351562, -137.22470092773438, -132.93531799316406, -128.6459503173828, -124.35657501220703, -120.06719970703125, -115.77783203125, -111.48845672607422, -107.19908142089844, -102.90971374511719, -98.6203384399414, -94.33096313476562, -90.04158782958984, -85.75221252441406, -81.46283721923828, -77.1734619140625, -72.88408660888672, -68.59471130371094, -64.30534362792969, -60.015968322753906, -55.726593017578125, -51.437217712402344, -47.14784622192383, -42.85847091674805, -38.56909942626953, -34.27972412109375, -29.9903507232666, -25.700977325439453, -21.411602020263672, -17.122228622436523, -12.832862854003906, -8.543489456176758, -4.254115104675293, 0.035259246826171875, 4.32463264465332, 8.614006042480469, 12.90338134765625, 17.1927547454834, 21.482128143310547, 25.771501541137695, 30.060874938964844, 34.350250244140625, 38.639625549316406, 42.92899703979492, 47.2183723449707, 51.50774383544922, 55.797119140625, 60.08649444580078, 64.37586975097656, 68.66523742675781, 72.9546127319336, 77.24398803710938, 81.53336334228516, 85.82273864746094, 90.11210632324219, 94.40148162841797, 98.69085693359375, 102.980224609375, 107.26959991455078, 111.55897521972656, 115.84835052490234, 120.13772583007812, 124.4271011352539]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 15.0, 26.0, 31.0, 34.0, 54.0, 47.0, 61.0, 107.0, 147.0, 124.0, 89.0, 56.0, 50.0, 39.0, 46.0, 19.0, 16.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.91080474853516, -94.33076477050781, -91.75072479248047, -89.17069244384766, -86.59065246582031, -84.01061248779297, -81.43057250976562, -78.85053253173828, -76.27049255371094, -73.6904525756836, -71.11041259765625, -68.53038024902344, -65.9503402709961, -63.37030029296875, -60.790260314941406, -58.21022033691406, -55.63018798828125, -53.050148010253906, -50.47011184692383, -47.890071868896484, -45.310035705566406, -42.72999572753906, -40.14995574951172, -37.569915771484375, -34.9898796081543, -32.40983963012695, -29.829803466796875, -27.24976348876953, -24.66972541809082, -22.08968734741211, -19.509647369384766, -16.929609298706055, -14.349578857421875, -11.769540786743164, -9.189501762390137, -6.609463214874268, -4.029424667358398, -1.4493865966796875, 1.1306524276733398, 3.710691452026367, 6.290729522705078, 8.870767593383789, 11.450806617736816, 14.030845642089844, 16.610883712768555, 19.190921783447266, 21.77096176147461, 24.35099983215332, 26.93103790283203, 29.511075973510742, 32.09111404418945, 34.6711540222168, 37.251190185546875, 39.83123016357422, 42.41127014160156, 44.991310119628906, 47.571346282958984, 50.15138626098633, 52.731422424316406, 55.31146240234375, 57.891502380371094, 60.47153854370117, 63.051578521728516, 65.6316146850586, 68.21165466308594]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 9.0, 15.0, 33.0, 45.0, 113.0, 230.0, 493.0, 976.0, 2145.0, 6648.0, 41553.0, 3578301.0, 544380.0, 13698.0, 3091.0, 1291.0, 581.0, 303.0, 113.0, 74.0, 46.0, 33.0, 20.0, 13.0, 16.0, 12.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.859375, -12.51904296875, -12.1787109375, -11.83837890625, -11.498046875, -11.15771484375, -10.8173828125, -10.47705078125, -10.13671875, -9.79638671875, -9.4560546875, -9.11572265625, -8.775390625, -8.43505859375, -8.0947265625, -7.75439453125, -7.4140625, -7.07373046875, -6.7333984375, -6.39306640625, -6.052734375, -5.71240234375, -5.3720703125, -5.03173828125, -4.69140625, -4.35107421875, -4.0107421875, -3.67041015625, -3.330078125, -2.98974609375, -2.6494140625, -2.30908203125, -1.96875, -1.62841796875, -1.2880859375, -0.94775390625, -0.607421875, -0.26708984375, 0.0732421875, 0.41357421875, 0.75390625, 1.09423828125, 1.4345703125, 1.77490234375, 2.115234375, 2.45556640625, 2.7958984375, 3.13623046875, 3.4765625, 3.81689453125, 4.1572265625, 4.49755859375, 4.837890625, 5.17822265625, 5.5185546875, 5.85888671875, 6.19921875, 6.53955078125, 6.8798828125, 7.22021484375, 7.560546875, 7.90087890625, 8.2412109375, 8.58154296875, 8.921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 15.0, 24.0, 38.0, 68.0, 81.0, 125.0, 130.0, 133.0, 115.0, 106.0, 66.0, 48.0, 26.0, 15.0, 10.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.245269775390625, -3.00030517578125, -2.755340576171875, -2.5103759765625, -2.265411376953125, -2.02044677734375, -1.775482177734375, -1.530517578125, -1.285552978515625, -1.04058837890625, -0.795623779296875, -0.5506591796875, -0.305694580078125, -0.06072998046875, 0.184234619140625, 0.42919921875, 0.674163818359375, 0.91912841796875, 1.164093017578125, 1.4090576171875, 1.654022216796875, 1.89898681640625, 2.143951416015625, 2.388916015625, 2.633880615234375, 2.87884521484375, 3.123809814453125, 3.3687744140625, 3.613739013671875, 3.85870361328125, 4.103668212890625, 4.3486328125, 4.593597412109375, 4.83856201171875, 5.083526611328125, 5.3284912109375, 5.573455810546875, 5.81842041015625, 6.063385009765625, 6.308349609375, 6.553314208984375, 6.79827880859375, 7.043243408203125, 7.2882080078125, 7.533172607421875, 7.77813720703125, 8.023101806640625, 8.26806640625, 8.513031005859375, 8.75799560546875, 9.002960205078125, 9.2479248046875, 9.492889404296875, 9.73785400390625, 9.982818603515625, 10.227783203125, 10.472747802734375, 10.71771240234375, 10.962677001953125, 11.2076416015625, 11.452606201171875, 11.69757080078125, 11.942535400390625, 12.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 29.0, 46.0, 105.0, 312.0, 1037.0, 4024.0, 34869.0, 3851699.0, 290520.0, 9166.0, 1669.0, 467.0, 156.0, 61.0, 41.0, 15.0, 6.0, 11.0, 4.0, 1.0, 2.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -17.0291748046875, -16.589599609375, -16.1500244140625, -15.71044921875, -15.2708740234375, -14.831298828125, -14.3917236328125, -13.9521484375, -13.5125732421875, -13.072998046875, -12.6334228515625, -12.19384765625, -11.7542724609375, -11.314697265625, -10.8751220703125, -10.435546875, -9.9959716796875, -9.556396484375, -9.1168212890625, -8.67724609375, -8.2376708984375, -7.798095703125, -7.3585205078125, -6.9189453125, -6.4793701171875, -6.039794921875, -5.6002197265625, -5.16064453125, -4.7210693359375, -4.281494140625, -3.8419189453125, -3.40234375, -2.9627685546875, -2.523193359375, -2.0836181640625, -1.64404296875, -1.2044677734375, -0.764892578125, -0.3253173828125, 0.1142578125, 0.5538330078125, 0.993408203125, 1.4329833984375, 1.87255859375, 2.3121337890625, 2.751708984375, 3.1912841796875, 3.630859375, 4.0704345703125, 4.510009765625, 4.9495849609375, 5.38916015625, 5.8287353515625, 6.268310546875, 6.7078857421875, 7.1474609375, 7.5870361328125, 8.026611328125, 8.4661865234375, 8.90576171875, 9.3453369140625, 9.784912109375, 10.2244873046875, 10.6640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 3.0, 17.0, 24.0, 40.0, 75.0, 111.0, 219.0, 455.0, 836.0, 937.0, 646.0, 306.0, 166.0, 83.0, 43.0, 34.0, 20.0, 14.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.82275390625, -5.5830078125, -5.34326171875, -5.103515625, -4.86376953125, -4.6240234375, -4.38427734375, -4.14453125, -3.90478515625, -3.6650390625, -3.42529296875, -3.185546875, -2.94580078125, -2.7060546875, -2.46630859375, -2.2265625, -1.98681640625, -1.7470703125, -1.50732421875, -1.267578125, -1.02783203125, -0.7880859375, -0.54833984375, -0.30859375, -0.06884765625, 0.1708984375, 0.41064453125, 0.650390625, 0.89013671875, 1.1298828125, 1.36962890625, 1.609375, 1.84912109375, 2.0888671875, 2.32861328125, 2.568359375, 2.80810546875, 3.0478515625, 3.28759765625, 3.52734375, 3.76708984375, 4.0068359375, 4.24658203125, 4.486328125, 4.72607421875, 4.9658203125, 5.20556640625, 5.4453125, 5.68505859375, 5.9248046875, 6.16455078125, 6.404296875, 6.64404296875, 6.8837890625, 7.12353515625, 7.36328125, 7.60302734375, 7.8427734375, 8.08251953125, 8.322265625, 8.56201171875, 8.8017578125, 9.04150390625, 9.28125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 27.0, 43.0, 114.0, 194.0, 236.0, 217.0, 89.0, 34.0, 21.0, 9.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.98811340332031, -92.37798309326172, -89.76785278320312, -87.15772247314453, -84.54759216308594, -81.93746185302734, -79.32733154296875, -76.71720123291016, -74.10707092285156, -71.49694061279297, -68.88681030273438, -66.27667999267578, -63.66654968261719, -61.056419372558594, -58.4462890625, -55.836158752441406, -53.22602844238281, -50.61589813232422, -48.005767822265625, -45.39563751220703, -42.78550720214844, -40.175376892089844, -37.56524658203125, -34.955116271972656, -32.34498596191406, -29.73485565185547, -27.124725341796875, -24.51459503173828, -21.904464721679688, -19.294334411621094, -16.6842041015625, -14.074073791503906, -11.463943481445312, -8.853813171386719, -6.243682861328125, -3.6335525512695312, -1.0234222412109375, 1.5867080688476562, 4.19683837890625, 6.806968688964844, 9.417098999023438, 12.027229309082031, 14.637359619140625, 17.24748992919922, 19.857620239257812, 22.467750549316406, 25.077880859375, 27.688011169433594, 30.298141479492188, 32.90827178955078, 35.518402099609375, 38.12853240966797, 40.73866271972656, 43.348793029785156, 45.95892333984375, 48.569053649902344, 51.17918395996094, 53.78931427001953, 56.399444580078125, 59.00957489013672, 61.61970520019531, 64.2298355102539, 66.8399658203125, 69.4500961303711, 72.06022644042969]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 5.0, 10.0, 10.0, 10.0, 12.0, 22.0, 19.0, 21.0, 28.0, 30.0, 32.0, 36.0, 45.0, 38.0, 52.0, 41.0, 51.0, 44.0, 39.0, 46.0, 59.0, 46.0, 36.0, 40.0, 34.0, 26.0, 16.0, 19.0, 27.0, 17.0, 10.0, 17.0, 10.0, 17.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.73415756225586, -22.01416015625, -21.294164657592773, -20.574167251586914, -19.854169845581055, -19.134174346923828, -18.41417694091797, -17.69417953491211, -16.974184036254883, -16.254186630249023, -15.53419017791748, -14.814193725585938, -14.094197273254395, -13.374200820922852, -12.654203414916992, -11.93420696258545, -11.21420955657959, -10.494213104248047, -9.774215698242188, -9.054219245910645, -8.334222793579102, -7.6142258644104, -6.894228935241699, -6.174232482910156, -5.454235553741455, -4.734238624572754, -4.014242172241211, -3.2942452430725098, -2.5742485523223877, -1.8542518615722656, -1.1342549324035645, -0.4142584800720215, 0.3057384490966797, 1.0257351398468018, 1.7457319498062134, 2.465728759765625, 3.185725450515747, 3.905722141265869, 4.62571907043457, 5.345715522766113, 6.0657124519348145, 6.785709381103516, 7.505705833435059, 8.225702285766602, 8.945699691772461, 9.665696144104004, 10.385692596435547, 11.105690002441406, 11.82568645477295, 12.545682907104492, 13.265680313110352, 13.985676765441895, 14.705673217773438, 15.425670623779297, 16.145668029785156, 16.865663528442383, 17.585660934448242, 18.3056583404541, 19.025653839111328, 19.745651245117188, 20.465648651123047, 21.185644149780273, 21.905641555786133, 22.62563705444336, 23.34563446044922]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 9.0, 12.0, 19.0, 27.0, 29.0, 39.0, 64.0, 95.0, 146.0, 358.0, 774.0, 2811.0, 14376.0, 165611.0, 783135.0, 69744.0, 8151.0, 1835.0, 610.0, 273.0, 154.0, 75.0, 57.0, 34.0, 22.0, 24.0, 15.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8359375, -13.43310546875, -13.0302734375, -12.62744140625, -12.224609375, -11.82177734375, -11.4189453125, -11.01611328125, -10.61328125, -10.21044921875, -9.8076171875, -9.40478515625, -9.001953125, -8.59912109375, -8.1962890625, -7.79345703125, -7.390625, -6.98779296875, -6.5849609375, -6.18212890625, -5.779296875, -5.37646484375, -4.9736328125, -4.57080078125, -4.16796875, -3.76513671875, -3.3623046875, -2.95947265625, -2.556640625, -2.15380859375, -1.7509765625, -1.34814453125, -0.9453125, -0.54248046875, -0.1396484375, 0.26318359375, 0.666015625, 1.06884765625, 1.4716796875, 1.87451171875, 2.27734375, 2.68017578125, 3.0830078125, 3.48583984375, 3.888671875, 4.29150390625, 4.6943359375, 5.09716796875, 5.5, 5.90283203125, 6.3056640625, 6.70849609375, 7.111328125, 7.51416015625, 7.9169921875, 8.31982421875, 8.72265625, 9.12548828125, 9.5283203125, 9.93115234375, 10.333984375, 10.73681640625, 11.1396484375, 11.54248046875, 11.9453125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 11.0, 21.0, 47.0, 63.0, 96.0, 104.0, 120.0, 139.0, 124.0, 108.0, 74.0, 47.0, 21.0, 16.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.34130859375, -4.0732421875, -3.80517578125, -3.537109375, -3.26904296875, -3.0009765625, -2.73291015625, -2.46484375, -2.19677734375, -1.9287109375, -1.66064453125, -1.392578125, -1.12451171875, -0.8564453125, -0.58837890625, -0.3203125, -0.05224609375, 0.2158203125, 0.48388671875, 0.751953125, 1.02001953125, 1.2880859375, 1.55615234375, 1.82421875, 2.09228515625, 2.3603515625, 2.62841796875, 2.896484375, 3.16455078125, 3.4326171875, 3.70068359375, 3.96875, 4.23681640625, 4.5048828125, 4.77294921875, 5.041015625, 5.30908203125, 5.5771484375, 5.84521484375, 6.11328125, 6.38134765625, 6.6494140625, 6.91748046875, 7.185546875, 7.45361328125, 7.7216796875, 7.98974609375, 8.2578125, 8.52587890625, 8.7939453125, 9.06201171875, 9.330078125, 9.59814453125, 9.8662109375, 10.13427734375, 10.40234375, 10.67041015625, 10.9384765625, 11.20654296875, 11.474609375, 11.74267578125, 12.0107421875, 12.27880859375, 12.546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 20.0, 19.0, 39.0, 50.0, 89.0, 124.0, 297.0, 622.0, 1731.0, 5794.0, 38732.0, 864360.0, 122156.0, 10208.0, 2517.0, 920.0, 402.0, 200.0, 101.0, 59.0, 33.0, 22.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.00146484375, -11.5341796875, -11.06689453125, -10.599609375, -10.13232421875, -9.6650390625, -9.19775390625, -8.73046875, -8.26318359375, -7.7958984375, -7.32861328125, -6.861328125, -6.39404296875, -5.9267578125, -5.45947265625, -4.9921875, -4.52490234375, -4.0576171875, -3.59033203125, -3.123046875, -2.65576171875, -2.1884765625, -1.72119140625, -1.25390625, -0.78662109375, -0.3193359375, 0.14794921875, 0.615234375, 1.08251953125, 1.5498046875, 2.01708984375, 2.484375, 2.95166015625, 3.4189453125, 3.88623046875, 4.353515625, 4.82080078125, 5.2880859375, 5.75537109375, 6.22265625, 6.68994140625, 7.1572265625, 7.62451171875, 8.091796875, 8.55908203125, 9.0263671875, 9.49365234375, 9.9609375, 10.42822265625, 10.8955078125, 11.36279296875, 11.830078125, 12.29736328125, 12.7646484375, 13.23193359375, 13.69921875, 14.16650390625, 14.6337890625, 15.10107421875, 15.568359375, 16.03564453125, 16.5029296875, 16.97021484375, 17.4375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 0.0, 11.0, 6.0, 12.0, 13.0, 23.0, 27.0, 28.0, 37.0, 47.0, 59.0, 78.0, 80.0, 82.0, 90.0, 69.0, 59.0, 64.0, 58.0, 40.0, 28.0, 31.0, 17.0, 10.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.65625, -19.040283203125, -18.42431640625, -17.808349609375, -17.1923828125, -16.576416015625, -15.96044921875, -15.344482421875, -14.728515625, -14.112548828125, -13.49658203125, -12.880615234375, -12.2646484375, -11.648681640625, -11.03271484375, -10.416748046875, -9.80078125, -9.184814453125, -8.56884765625, -7.952880859375, -7.3369140625, -6.720947265625, -6.10498046875, -5.489013671875, -4.873046875, -4.257080078125, -3.64111328125, -3.025146484375, -2.4091796875, -1.793212890625, -1.17724609375, -0.561279296875, 0.0546875, 0.670654296875, 1.28662109375, 1.902587890625, 2.5185546875, 3.134521484375, 3.75048828125, 4.366455078125, 4.982421875, 5.598388671875, 6.21435546875, 6.830322265625, 7.4462890625, 8.062255859375, 8.67822265625, 9.294189453125, 9.91015625, 10.526123046875, 11.14208984375, 11.758056640625, 12.3740234375, 12.989990234375, 13.60595703125, 14.221923828125, 14.837890625, 15.453857421875, 16.06982421875, 16.685791015625, 17.3017578125, 17.917724609375, 18.53369140625, 19.149658203125, 19.765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 3.0, 11.0, 15.0, 13.0, 24.0, 36.0, 35.0, 65.0, 103.0, 152.0, 230.0, 403.0, 713.0, 1237.0, 2437.0, 5557.0, 15060.0, 60342.0, 750968.0, 166584.0, 28262.0, 8689.0, 3587.0, 1666.0, 916.0, 521.0, 303.0, 197.0, 123.0, 88.0, 49.0, 41.0, 30.0, 20.0, 13.0, 9.0, 6.0, 12.0, 4.0, 9.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.55877685546875, -4.4105224609375, -4.26226806640625, -4.114013671875, -3.96575927734375, -3.8175048828125, -3.66925048828125, -3.52099609375, -3.37274169921875, -3.2244873046875, -3.07623291015625, -2.927978515625, -2.77972412109375, -2.6314697265625, -2.48321533203125, -2.3349609375, -2.18670654296875, -2.0384521484375, -1.89019775390625, -1.741943359375, -1.59368896484375, -1.4454345703125, -1.29718017578125, -1.14892578125, -1.00067138671875, -0.8524169921875, -0.70416259765625, -0.555908203125, -0.40765380859375, -0.2593994140625, -0.11114501953125, 0.037109375, 0.18536376953125, 0.3336181640625, 0.48187255859375, 0.630126953125, 0.77838134765625, 0.9266357421875, 1.07489013671875, 1.22314453125, 1.37139892578125, 1.5196533203125, 1.66790771484375, 1.816162109375, 1.96441650390625, 2.1126708984375, 2.26092529296875, 2.4091796875, 2.55743408203125, 2.7056884765625, 2.85394287109375, 3.002197265625, 3.15045166015625, 3.2987060546875, 3.44696044921875, 3.59521484375, 3.74346923828125, 3.8917236328125, 4.03997802734375, 4.188232421875, 4.33648681640625, 4.4847412109375, 4.63299560546875, 4.78125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 32.0, 20.0, 64.0, 111.0, 231.0, 244.0, 106.0, 66.0, 35.0, 9.0, 15.0, 9.0, 4.0, 9.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001964569091796875, -0.0019100606441497803, -0.0018555521965026855, -0.0018010437488555908, -0.001746535301208496, -0.0016920268535614014, -0.0016375184059143066, -0.001583009958267212, -0.0015285015106201172, -0.0014739930629730225, -0.0014194846153259277, -0.001364976167678833, -0.0013104677200317383, -0.0012559592723846436, -0.0012014508247375488, -0.001146942377090454, -0.0010924339294433594, -0.0010379254817962646, -0.00098341703414917, -0.0009289085865020752, -0.0008744001388549805, -0.0008198916912078857, -0.000765383243560791, -0.0007108747959136963, -0.0006563663482666016, -0.0006018579006195068, -0.0005473494529724121, -0.0004928410053253174, -0.00043833255767822266, -0.00038382411003112793, -0.0003293156623840332, -0.0002748072147369385, -0.00022029876708984375, -0.00016579031944274902, -0.0001112818717956543, -5.677342414855957e-05, -2.2649765014648438e-06, 5.224347114562988e-05, 0.00010675191879272461, 0.00016126036643981934, 0.00021576881408691406, 0.0002702772617340088, 0.0003247857093811035, 0.00037929415702819824, 0.00043380260467529297, 0.0004883110523223877, 0.0005428194999694824, 0.0005973279476165771, 0.0006518363952636719, 0.0007063448429107666, 0.0007608532905578613, 0.0008153617382049561, 0.0008698701858520508, 0.0009243786334991455, 0.0009788870811462402, 0.001033395528793335, 0.0010879039764404297, 0.0011424124240875244, 0.0011969208717346191, 0.0012514293193817139, 0.0013059377670288086, 0.0013604462146759033, 0.001414954662322998, 0.0014694631099700928, 0.0015239715576171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 10.0, 9.0, 8.0, 27.0, 26.0, 31.0, 34.0, 57.0, 85.0, 140.0, 213.0, 357.0, 613.0, 1191.0, 2243.0, 5301.0, 14441.0, 61782.0, 759058.0, 161994.0, 26037.0, 7982.0, 3254.0, 1517.0, 820.0, 488.0, 240.0, 170.0, 118.0, 90.0, 54.0, 34.0, 35.0, 19.0, 17.0, 14.0, 11.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.296875, -5.13983154296875, -4.9827880859375, -4.82574462890625, -4.668701171875, -4.51165771484375, -4.3546142578125, -4.19757080078125, -4.04052734375, -3.88348388671875, -3.7264404296875, -3.56939697265625, -3.412353515625, -3.25531005859375, -3.0982666015625, -2.94122314453125, -2.7841796875, -2.62713623046875, -2.4700927734375, -2.31304931640625, -2.156005859375, -1.99896240234375, -1.8419189453125, -1.68487548828125, -1.52783203125, -1.37078857421875, -1.2137451171875, -1.05670166015625, -0.899658203125, -0.74261474609375, -0.5855712890625, -0.42852783203125, -0.271484375, -0.11444091796875, 0.0426025390625, 0.19964599609375, 0.356689453125, 0.51373291015625, 0.6707763671875, 0.82781982421875, 0.98486328125, 1.14190673828125, 1.2989501953125, 1.45599365234375, 1.613037109375, 1.77008056640625, 1.9271240234375, 2.08416748046875, 2.2412109375, 2.39825439453125, 2.5552978515625, 2.71234130859375, 2.869384765625, 3.02642822265625, 3.1834716796875, 3.34051513671875, 3.49755859375, 3.65460205078125, 3.8116455078125, 3.96868896484375, 4.125732421875, 4.28277587890625, 4.4398193359375, 4.59686279296875, 4.75390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 8.0, 5.0, 14.0, 19.0, 28.0, 30.0, 36.0, 51.0, 73.0, 114.0, 149.0, 114.0, 90.0, 63.0, 41.0, 27.0, 22.0, 25.0, 15.0, 12.0, 11.0, 11.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5390625, -4.408172607421875, -4.27728271484375, -4.146392822265625, -4.0155029296875, -3.884613037109375, -3.75372314453125, -3.622833251953125, -3.491943359375, -3.361053466796875, -3.23016357421875, -3.099273681640625, -2.9683837890625, -2.837493896484375, -2.70660400390625, -2.575714111328125, -2.44482421875, -2.313934326171875, -2.18304443359375, -2.052154541015625, -1.9212646484375, -1.790374755859375, -1.65948486328125, -1.528594970703125, -1.397705078125, -1.266815185546875, -1.13592529296875, -1.005035400390625, -0.8741455078125, -0.743255615234375, -0.61236572265625, -0.481475830078125, -0.3505859375, -0.219696044921875, -0.08880615234375, 0.042083740234375, 0.1729736328125, 0.303863525390625, 0.43475341796875, 0.565643310546875, 0.696533203125, 0.827423095703125, 0.95831298828125, 1.089202880859375, 1.2200927734375, 1.350982666015625, 1.48187255859375, 1.612762451171875, 1.74365234375, 1.874542236328125, 2.00543212890625, 2.136322021484375, 2.2672119140625, 2.398101806640625, 2.52899169921875, 2.659881591796875, 2.790771484375, 2.921661376953125, 3.05255126953125, 3.183441162109375, 3.3143310546875, 3.445220947265625, 3.57611083984375, 3.707000732421875, 3.837890625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 41.0, 195.0, 540.0, 127.0, 56.0, 20.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.6819152832031, -281.6935119628906, -274.705078125, -267.7166748046875, -260.728271484375, -253.73983764648438, -246.75143432617188, -239.7630157470703, -232.77459716796875, -225.7861785888672, -218.7977752685547, -211.80935668945312, -204.82093811035156, -197.83251953125, -190.8441162109375, -183.85569763183594, -176.86727905273438, -169.8788604736328, -162.8904571533203, -155.90203857421875, -148.9136199951172, -141.92520141601562, -134.93679809570312, -127.94837951660156, -120.95997619628906, -113.97156524658203, -106.98314666748047, -99.99473571777344, -93.00631713867188, -86.01790618896484, -79.02949523925781, -72.04107666015625, -65.05265808105469, -58.06424331665039, -51.075828552246094, -44.08741760253906, -37.0989990234375, -30.11058807373047, -23.122173309326172, -16.133758544921875, -9.145343780517578, -2.1569294929504395, 4.831484794616699, 11.81989860534668, 18.808313369750977, 25.79672622680664, 32.78514099121094, 39.773555755615234, 46.76197052001953, 53.75038528442383, 60.738800048828125, 67.72721099853516, 74.71562957763672, 81.70404052734375, 88.69245910644531, 95.68087005615234, 102.66928100585938, 109.6576919555664, 116.64611053466797, 123.634521484375, 130.62294006347656, 137.61135864257812, 144.59976196289062, 151.5881805419922, 158.57659912109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 10.0, 11.0, 11.0, 26.0, 24.0, 21.0, 23.0, 24.0, 28.0, 34.0, 37.0, 48.0, 111.0, 112.0, 86.0, 68.0, 48.0, 36.0, 34.0, 33.0, 22.0, 21.0, 25.0, 16.0, 18.0, 14.0, 5.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-73.50515747070312, -71.64508056640625, -69.78500366210938, -67.9249267578125, -66.06484985351562, -64.20477294921875, -62.34469223022461, -60.484615325927734, -58.62453842163086, -56.764461517333984, -54.90438461303711, -53.04430389404297, -51.184226989746094, -49.32415008544922, -47.464073181152344, -45.60399627685547, -43.743919372558594, -41.88384246826172, -40.023765563964844, -38.16368865966797, -36.30360794067383, -34.44353103637695, -32.58345413208008, -30.723377227783203, -28.863296508789062, -27.003219604492188, -25.14314079284668, -23.283063888549805, -21.42298698425293, -19.562908172607422, -17.702831268310547, -15.842754364013672, -13.982677459716797, -12.122599601745605, -10.26252269744873, -8.402444839477539, -6.542367458343506, -4.682290077209473, -2.8222122192382812, -0.9621353149414062, 0.8979425430297852, 2.7580199241638184, 4.618097305297852, 6.478175163269043, 8.338253021240234, 10.19832992553711, 12.0584077835083, 13.918484687805176, 15.778562545776367, 17.638639450073242, 19.49871826171875, 21.358795166015625, 23.2188720703125, 25.078948974609375, 26.939027786254883, 28.799104690551758, 30.659183502197266, 32.51926040649414, 34.379337310791016, 36.239418029785156, 38.09949493408203, 39.959571838378906, 41.81964874267578, 43.679725646972656, 45.53980255126953]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 11.0, 10.0, 45.0, 37.0, 57.0, 83.0, 146.0, 276.0, 834.0, 2602.0, 11417.0, 374085.0, 3769743.0, 28891.0, 3988.0, 1079.0, 425.0, 202.0, 110.0, 77.0, 49.0, 35.0, 26.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.359375, -14.8829345703125, -14.406494140625, -13.9300537109375, -13.45361328125, -12.9771728515625, -12.500732421875, -12.0242919921875, -11.5478515625, -11.0714111328125, -10.594970703125, -10.1185302734375, -9.64208984375, -9.1656494140625, -8.689208984375, -8.2127685546875, -7.736328125, -7.2598876953125, -6.783447265625, -6.3070068359375, -5.83056640625, -5.3541259765625, -4.877685546875, -4.4012451171875, -3.9248046875, -3.4483642578125, -2.971923828125, -2.4954833984375, -2.01904296875, -1.5426025390625, -1.066162109375, -0.5897216796875, -0.11328125, 0.3631591796875, 0.839599609375, 1.3160400390625, 1.79248046875, 2.2689208984375, 2.745361328125, 3.2218017578125, 3.6982421875, 4.1746826171875, 4.651123046875, 5.1275634765625, 5.60400390625, 6.0804443359375, 6.556884765625, 7.0333251953125, 7.509765625, 7.9862060546875, 8.462646484375, 8.9390869140625, 9.41552734375, 9.8919677734375, 10.368408203125, 10.8448486328125, 11.3212890625, 11.7977294921875, 12.274169921875, 12.7506103515625, 13.22705078125, 13.7034912109375, 14.179931640625, 14.6563720703125, 15.1328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 15.0, 11.0, 22.0, 29.0, 40.0, 45.0, 53.0, 64.0, 73.0, 89.0, 78.0, 87.0, 86.0, 55.0, 52.0, 43.0, 41.0, 31.0, 26.0, 16.0, 18.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.56781005859375, -2.4051513671875, -2.24249267578125, -2.079833984375, -1.91717529296875, -1.7545166015625, -1.59185791015625, -1.42919921875, -1.26654052734375, -1.1038818359375, -0.94122314453125, -0.778564453125, -0.61590576171875, -0.4532470703125, -0.29058837890625, -0.1279296875, 0.03472900390625, 0.1973876953125, 0.36004638671875, 0.522705078125, 0.68536376953125, 0.8480224609375, 1.01068115234375, 1.17333984375, 1.33599853515625, 1.4986572265625, 1.66131591796875, 1.823974609375, 1.98663330078125, 2.1492919921875, 2.31195068359375, 2.474609375, 2.63726806640625, 2.7999267578125, 2.96258544921875, 3.125244140625, 3.28790283203125, 3.4505615234375, 3.61322021484375, 3.77587890625, 3.93853759765625, 4.1011962890625, 4.26385498046875, 4.426513671875, 4.58917236328125, 4.7518310546875, 4.91448974609375, 5.0771484375, 5.23980712890625, 5.4024658203125, 5.56512451171875, 5.727783203125, 5.89044189453125, 6.0531005859375, 6.21575927734375, 6.37841796875, 6.54107666015625, 6.7037353515625, 6.86639404296875, 7.029052734375, 7.19171142578125, 7.3543701171875, 7.51702880859375, 7.6796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 14.0, 31.0, 51.0, 86.0, 203.0, 520.0, 2967.0, 508593.0, 3675781.0, 4765.0, 674.0, 272.0, 180.0, 62.0, 30.0, 16.0, 16.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.546875, -24.567626953125, -23.58837890625, -22.609130859375, -21.6298828125, -20.650634765625, -19.67138671875, -18.692138671875, -17.712890625, -16.733642578125, -15.75439453125, -14.775146484375, -13.7958984375, -12.816650390625, -11.83740234375, -10.858154296875, -9.87890625, -8.899658203125, -7.92041015625, -6.941162109375, -5.9619140625, -4.982666015625, -4.00341796875, -3.024169921875, -2.044921875, -1.065673828125, -0.08642578125, 0.892822265625, 1.8720703125, 2.851318359375, 3.83056640625, 4.809814453125, 5.7890625, 6.768310546875, 7.74755859375, 8.726806640625, 9.7060546875, 10.685302734375, 11.66455078125, 12.643798828125, 13.623046875, 14.602294921875, 15.58154296875, 16.560791015625, 17.5400390625, 18.519287109375, 19.49853515625, 20.477783203125, 21.45703125, 22.436279296875, 23.41552734375, 24.394775390625, 25.3740234375, 26.353271484375, 27.33251953125, 28.311767578125, 29.291015625, 30.270263671875, 31.24951171875, 32.228759765625, 33.2080078125, 34.187255859375, 35.16650390625, 36.145751953125, 37.125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 11.0, 13.0, 22.0, 45.0, 137.0, 445.0, 1288.0, 1310.0, 494.0, 176.0, 56.0, 37.0, 14.0, 12.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.421875, -9.927978515625, -9.43408203125, -8.940185546875, -8.4462890625, -7.952392578125, -7.45849609375, -6.964599609375, -6.470703125, -5.976806640625, -5.48291015625, -4.989013671875, -4.4951171875, -4.001220703125, -3.50732421875, -3.013427734375, -2.51953125, -2.025634765625, -1.53173828125, -1.037841796875, -0.5439453125, -0.050048828125, 0.44384765625, 0.937744140625, 1.431640625, 1.925537109375, 2.41943359375, 2.913330078125, 3.4072265625, 3.901123046875, 4.39501953125, 4.888916015625, 5.3828125, 5.876708984375, 6.37060546875, 6.864501953125, 7.3583984375, 7.852294921875, 8.34619140625, 8.840087890625, 9.333984375, 9.827880859375, 10.32177734375, 10.815673828125, 11.3095703125, 11.803466796875, 12.29736328125, 12.791259765625, 13.28515625, 13.779052734375, 14.27294921875, 14.766845703125, 15.2607421875, 15.754638671875, 16.24853515625, 16.742431640625, 17.236328125, 17.730224609375, 18.22412109375, 18.718017578125, 19.2119140625, 19.705810546875, 20.19970703125, 20.693603515625, 21.1875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 16.0, 23.0, 60.0, 175.0, 300.0, 226.0, 100.0, 47.0, 24.0, 11.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.48389434814453, -29.59547233581543, -25.707050323486328, -21.818626403808594, -17.930204391479492, -14.04178237915039, -10.153358459472656, -6.264936447143555, -2.376514434814453, 1.5119080543518066, 5.400330543518066, 9.288753509521484, 13.177175521850586, 17.065597534179688, 20.954021453857422, 24.842443466186523, 28.730865478515625, 32.61928939819336, 36.50770950317383, 40.39613342285156, 44.28455352783203, 48.172977447509766, 52.0614013671875, 55.94982147216797, 59.8382453918457, 63.72666931152344, 67.6150894165039, 71.50350952148438, 75.39193725585938, 79.28035736083984, 83.16877746582031, 87.05720520019531, 90.94561767578125, 94.83403778076172, 98.72246551513672, 102.61088562011719, 106.49930572509766, 110.38772583007812, 114.27615356445312, 118.1645736694336, 122.05299377441406, 125.94141387939453, 129.829833984375, 133.71826171875, 137.606689453125, 141.49510192871094, 145.38352966308594, 149.27195739746094, 153.16036987304688, 157.04879760742188, 160.9372100830078, 164.8256378173828, 168.7140655517578, 172.60247802734375, 176.49090576171875, 180.37933349609375, 184.26776123046875, 188.15618896484375, 192.0446014404297, 195.9330291748047, 199.8214569091797, 203.70986938476562, 207.59829711914062, 211.48672485351562, 215.37513732910156]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 14.0, 17.0, 17.0, 11.0, 21.0, 21.0, 35.0, 43.0, 44.0, 63.0, 70.0, 78.0, 88.0, 67.0, 63.0, 73.0, 45.0, 51.0, 36.0, 38.0, 25.0, 15.0, 19.0, 14.0, 14.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.201595306396484, -60.464229583740234, -58.726863861083984, -56.989498138427734, -55.252132415771484, -53.51476287841797, -51.77739715576172, -50.04003143310547, -48.30266571044922, -46.56529998779297, -44.82793426513672, -43.09056854248047, -41.35320281982422, -39.61583709716797, -37.87847137451172, -36.1411018371582, -34.40373992919922, -32.66637420654297, -30.92900848388672, -29.19164276123047, -27.454275131225586, -25.716909408569336, -23.979543685913086, -22.242176055908203, -20.504810333251953, -18.767444610595703, -17.030078887939453, -15.292712211608887, -13.55534553527832, -11.81797981262207, -10.08061408996582, -8.343247413635254, -6.6058807373046875, -4.868514537811279, -3.13114857673645, -1.393782615661621, 0.3435835838317871, 2.0809497833251953, 3.8183155059814453, 5.555682182312012, 7.293047904968262, 9.030413627624512, 10.767780303955078, 12.505146026611328, 14.242511749267578, 15.979878425598145, 17.717243194580078, 19.45461082458496, 21.19197654724121, 22.92934226989746, 24.66670799255371, 26.404075622558594, 28.141441345214844, 29.878807067871094, 31.616172790527344, 33.353538513183594, 35.090904235839844, 36.828269958496094, 38.565635681152344, 40.303001403808594, 42.040367126464844, 43.777732849121094, 45.515098571777344, 47.25246810913086, 48.98983383178711]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 10.0, 4.0, 10.0, 9.0, 19.0, 33.0, 68.0, 101.0, 165.0, 328.0, 746.0, 2188.0, 6940.0, 29397.0, 193299.0, 667039.0, 119652.0, 20460.0, 5114.0, 1600.0, 676.0, 282.0, 148.0, 92.0, 57.0, 34.0, 25.0, 14.0, 4.0, 11.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.84375, -8.578857421875, -8.31396484375, -8.049072265625, -7.7841796875, -7.519287109375, -7.25439453125, -6.989501953125, -6.724609375, -6.459716796875, -6.19482421875, -5.929931640625, -5.6650390625, -5.400146484375, -5.13525390625, -4.870361328125, -4.60546875, -4.340576171875, -4.07568359375, -3.810791015625, -3.5458984375, -3.281005859375, -3.01611328125, -2.751220703125, -2.486328125, -2.221435546875, -1.95654296875, -1.691650390625, -1.4267578125, -1.161865234375, -0.89697265625, -0.632080078125, -0.3671875, -0.102294921875, 0.16259765625, 0.427490234375, 0.6923828125, 0.957275390625, 1.22216796875, 1.487060546875, 1.751953125, 2.016845703125, 2.28173828125, 2.546630859375, 2.8115234375, 3.076416015625, 3.34130859375, 3.606201171875, 3.87109375, 4.135986328125, 4.40087890625, 4.665771484375, 4.9306640625, 5.195556640625, 5.46044921875, 5.725341796875, 5.990234375, 6.255126953125, 6.52001953125, 6.784912109375, 7.0498046875, 7.314697265625, 7.57958984375, 7.844482421875, 8.109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 7.0, 11.0, 23.0, 29.0, 23.0, 41.0, 44.0, 38.0, 40.0, 55.0, 54.0, 65.0, 70.0, 59.0, 68.0, 50.0, 64.0, 37.0, 32.0, 29.0, 28.0, 29.0, 21.0, 18.0, 18.0, 9.0, 11.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.302734375, -3.157928466796875, -3.01312255859375, -2.868316650390625, -2.7235107421875, -2.578704833984375, -2.43389892578125, -2.289093017578125, -2.144287109375, -1.999481201171875, -1.85467529296875, -1.709869384765625, -1.5650634765625, -1.420257568359375, -1.27545166015625, -1.130645751953125, -0.98583984375, -0.841033935546875, -0.69622802734375, -0.551422119140625, -0.4066162109375, -0.261810302734375, -0.11700439453125, 0.027801513671875, 0.172607421875, 0.317413330078125, 0.46221923828125, 0.607025146484375, 0.7518310546875, 0.896636962890625, 1.04144287109375, 1.186248779296875, 1.3310546875, 1.475860595703125, 1.62066650390625, 1.765472412109375, 1.9102783203125, 2.055084228515625, 2.19989013671875, 2.344696044921875, 2.489501953125, 2.634307861328125, 2.77911376953125, 2.923919677734375, 3.0687255859375, 3.213531494140625, 3.35833740234375, 3.503143310546875, 3.64794921875, 3.792755126953125, 3.93756103515625, 4.082366943359375, 4.2271728515625, 4.371978759765625, 4.51678466796875, 4.661590576171875, 4.806396484375, 4.951202392578125, 5.09600830078125, 5.240814208984375, 5.3856201171875, 5.530426025390625, 5.67523193359375, 5.820037841796875, 5.96484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 12.0, 13.0, 23.0, 25.0, 34.0, 36.0, 79.0, 123.0, 192.0, 324.0, 581.0, 1215.0, 3294.0, 13628.0, 123488.0, 834747.0, 57633.0, 8447.0, 2469.0, 966.0, 476.0, 267.0, 162.0, 111.0, 65.0, 32.0, 36.0, 22.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -11.1937255859375, -10.824951171875, -10.4561767578125, -10.08740234375, -9.7186279296875, -9.349853515625, -8.9810791015625, -8.6123046875, -8.2435302734375, -7.874755859375, -7.5059814453125, -7.13720703125, -6.7684326171875, -6.399658203125, -6.0308837890625, -5.662109375, -5.2933349609375, -4.924560546875, -4.5557861328125, -4.18701171875, -3.8182373046875, -3.449462890625, -3.0806884765625, -2.7119140625, -2.3431396484375, -1.974365234375, -1.6055908203125, -1.23681640625, -0.8680419921875, -0.499267578125, -0.1304931640625, 0.23828125, 0.6070556640625, 0.975830078125, 1.3446044921875, 1.71337890625, 2.0821533203125, 2.450927734375, 2.8197021484375, 3.1884765625, 3.5572509765625, 3.926025390625, 4.2947998046875, 4.66357421875, 5.0323486328125, 5.401123046875, 5.7698974609375, 6.138671875, 6.5074462890625, 6.876220703125, 7.2449951171875, 7.61376953125, 7.9825439453125, 8.351318359375, 8.7200927734375, 9.0888671875, 9.4576416015625, 9.826416015625, 10.1951904296875, 10.56396484375, 10.9327392578125, 11.301513671875, 11.6702880859375, 12.0390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 11.0, 8.0, 17.0, 14.0, 19.0, 25.0, 35.0, 42.0, 44.0, 55.0, 65.0, 73.0, 71.0, 72.0, 54.0, 76.0, 55.0, 49.0, 34.0, 32.0, 38.0, 18.0, 22.0, 17.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.4794921875, -17.865234375, -17.2509765625, -16.63671875, -16.0224609375, -15.408203125, -14.7939453125, -14.1796875, -13.5654296875, -12.951171875, -12.3369140625, -11.72265625, -11.1083984375, -10.494140625, -9.8798828125, -9.265625, -8.6513671875, -8.037109375, -7.4228515625, -6.80859375, -6.1943359375, -5.580078125, -4.9658203125, -4.3515625, -3.7373046875, -3.123046875, -2.5087890625, -1.89453125, -1.2802734375, -0.666015625, -0.0517578125, 0.5625, 1.1767578125, 1.791015625, 2.4052734375, 3.01953125, 3.6337890625, 4.248046875, 4.8623046875, 5.4765625, 6.0908203125, 6.705078125, 7.3193359375, 7.93359375, 8.5478515625, 9.162109375, 9.7763671875, 10.390625, 11.0048828125, 11.619140625, 12.2333984375, 12.84765625, 13.4619140625, 14.076171875, 14.6904296875, 15.3046875, 15.9189453125, 16.533203125, 17.1474609375, 17.76171875, 18.3759765625, 18.990234375, 19.6044921875, 20.21875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 2.0, 9.0, 5.0, 5.0, 15.0, 20.0, 24.0, 42.0, 68.0, 113.0, 185.0, 413.0, 1089.0, 3352.0, 16412.0, 781850.0, 228127.0, 12188.0, 2805.0, 949.0, 376.0, 174.0, 115.0, 67.0, 55.0, 19.0, 15.0, 15.0, 10.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.258544921875, -6.05615234375, -5.853759765625, -5.6513671875, -5.448974609375, -5.24658203125, -5.044189453125, -4.841796875, -4.639404296875, -4.43701171875, -4.234619140625, -4.0322265625, -3.829833984375, -3.62744140625, -3.425048828125, -3.22265625, -3.020263671875, -2.81787109375, -2.615478515625, -2.4130859375, -2.210693359375, -2.00830078125, -1.805908203125, -1.603515625, -1.401123046875, -1.19873046875, -0.996337890625, -0.7939453125, -0.591552734375, -0.38916015625, -0.186767578125, 0.015625, 0.218017578125, 0.42041015625, 0.622802734375, 0.8251953125, 1.027587890625, 1.22998046875, 1.432373046875, 1.634765625, 1.837158203125, 2.03955078125, 2.241943359375, 2.4443359375, 2.646728515625, 2.84912109375, 3.051513671875, 3.25390625, 3.456298828125, 3.65869140625, 3.861083984375, 4.0634765625, 4.265869140625, 4.46826171875, 4.670654296875, 4.873046875, 5.075439453125, 5.27783203125, 5.480224609375, 5.6826171875, 5.885009765625, 6.08740234375, 6.289794921875, 6.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 6.0, 8.0, 6.0, 13.0, 22.0, 30.0, 58.0, 112.0, 245.0, 206.0, 107.0, 55.0, 36.0, 26.0, 11.0, 6.0, 11.0, 5.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00136566162109375, -0.0013295933604240417, -0.0012935250997543335, -0.0012574568390846252, -0.001221388578414917, -0.0011853203177452087, -0.0011492520570755005, -0.0011131837964057922, -0.001077115535736084, -0.0010410472750663757, -0.0010049790143966675, -0.0009689107537269592, -0.000932842493057251, -0.0008967742323875427, -0.0008607059717178345, -0.0008246377110481262, -0.000788569450378418, -0.0007525011897087097, -0.0007164329290390015, -0.0006803646683692932, -0.000644296407699585, -0.0006082281470298767, -0.0005721598863601685, -0.0005360916256904602, -0.000500023365020752, -0.0004639551043510437, -0.00042788684368133545, -0.0003918185830116272, -0.00035575032234191895, -0.0003196820616722107, -0.00028361380100250244, -0.0002475455403327942, -0.00021147727966308594, -0.00017540901899337769, -0.00013934075832366943, -0.00010327249765396118, -6.720423698425293e-05, -3.113597631454468e-05, 4.932284355163574e-06, 4.1000545024871826e-05, 7.706880569458008e-05, 0.00011313706636428833, 0.00014920532703399658, 0.00018527358770370483, 0.00022134184837341309, 0.00025741010904312134, 0.0002934783697128296, 0.00032954663038253784, 0.0003656148910522461, 0.00040168315172195435, 0.0004377514123916626, 0.00047381967306137085, 0.0005098879337310791, 0.0005459561944007874, 0.0005820244550704956, 0.0006180927157402039, 0.0006541609764099121, 0.0006902292370796204, 0.0007262974977493286, 0.0007623657584190369, 0.0007984340190887451, 0.0008345022797584534, 0.0008705705404281616, 0.0009066388010978699, 0.0009427070617675781]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 16.0, 20.0, 35.0, 58.0, 78.0, 158.0, 357.0, 853.0, 2694.0, 14222.0, 374535.0, 636047.0, 15035.0, 2811.0, 880.0, 348.0, 179.0, 89.0, 38.0, 30.0, 19.0, 12.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.09765625, -6.9058837890625, -6.714111328125, -6.5223388671875, -6.33056640625, -6.1387939453125, -5.947021484375, -5.7552490234375, -5.5634765625, -5.3717041015625, -5.179931640625, -4.9881591796875, -4.79638671875, -4.6046142578125, -4.412841796875, -4.2210693359375, -4.029296875, -3.8375244140625, -3.645751953125, -3.4539794921875, -3.26220703125, -3.0704345703125, -2.878662109375, -2.6868896484375, -2.4951171875, -2.3033447265625, -2.111572265625, -1.9197998046875, -1.72802734375, -1.5362548828125, -1.344482421875, -1.1527099609375, -0.9609375, -0.7691650390625, -0.577392578125, -0.3856201171875, -0.19384765625, -0.0020751953125, 0.189697265625, 0.3814697265625, 0.5732421875, 0.7650146484375, 0.956787109375, 1.1485595703125, 1.34033203125, 1.5321044921875, 1.723876953125, 1.9156494140625, 2.107421875, 2.2991943359375, 2.490966796875, 2.6827392578125, 2.87451171875, 3.0662841796875, 3.258056640625, 3.4498291015625, 3.6416015625, 3.8333740234375, 4.025146484375, 4.2169189453125, 4.40869140625, 4.6004638671875, 4.792236328125, 4.9840087890625, 5.17578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 8.0, 25.0, 21.0, 33.0, 45.0, 79.0, 157.0, 233.0, 148.0, 100.0, 45.0, 25.0, 24.0, 18.0, 3.0, 8.0, 2.0, 6.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.640380859375, -5.47216796875, -5.303955078125, -5.1357421875, -4.967529296875, -4.79931640625, -4.631103515625, -4.462890625, -4.294677734375, -4.12646484375, -3.958251953125, -3.7900390625, -3.621826171875, -3.45361328125, -3.285400390625, -3.1171875, -2.948974609375, -2.78076171875, -2.612548828125, -2.4443359375, -2.276123046875, -2.10791015625, -1.939697265625, -1.771484375, -1.603271484375, -1.43505859375, -1.266845703125, -1.0986328125, -0.930419921875, -0.76220703125, -0.593994140625, -0.42578125, -0.257568359375, -0.08935546875, 0.078857421875, 0.2470703125, 0.415283203125, 0.58349609375, 0.751708984375, 0.919921875, 1.088134765625, 1.25634765625, 1.424560546875, 1.5927734375, 1.760986328125, 1.92919921875, 2.097412109375, 2.265625, 2.433837890625, 2.60205078125, 2.770263671875, 2.9384765625, 3.106689453125, 3.27490234375, 3.443115234375, 3.611328125, 3.779541015625, 3.94775390625, 4.115966796875, 4.2841796875, 4.452392578125, 4.62060546875, 4.788818359375, 4.95703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 52.0, 164.0, 529.0, 158.0, 41.0, 15.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-182.13070678710938, -176.99607849121094, -171.86143493652344, -166.726806640625, -161.59217834472656, -156.45755004882812, -151.32290649414062, -146.1882781982422, -141.05364990234375, -135.9190216064453, -130.7843780517578, -125.64974975585938, -120.51512145996094, -115.38048553466797, -110.245849609375, -105.11122131347656, -99.9765853881836, -94.84194946289062, -89.70732116699219, -84.57268524169922, -79.43805694580078, -74.30342102050781, -69.16879272460938, -64.0341567993164, -58.8995246887207, -53.764892578125, -48.6302604675293, -43.495628356933594, -38.360992431640625, -33.22636413574219, -28.09172821044922, -22.957096099853516, -17.822463989257812, -12.68783187866211, -7.55319881439209, -2.4185657501220703, 2.716066360473633, 7.850698471069336, 12.985332489013672, 18.119964599609375, 23.254596710205078, 28.38922882080078, 33.523860931396484, 38.65849304199219, 43.793128967285156, 48.927757263183594, 54.06239318847656, 59.197025299072266, 64.33165740966797, 69.46629333496094, 74.60092163085938, 79.73555755615234, 84.87018585205078, 90.00482177734375, 95.13945007324219, 100.27408599853516, 105.40872192382812, 110.5433578491211, 115.67798614501953, 120.8126220703125, 125.94725036621094, 131.08187866210938, 136.21652221679688, 141.3511505126953, 146.48577880859375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 10.0, 6.0, 7.0, 12.0, 21.0, 17.0, 24.0, 19.0, 29.0, 23.0, 34.0, 63.0, 95.0, 120.0, 108.0, 81.0, 42.0, 36.0, 32.0, 42.0, 33.0, 25.0, 15.0, 15.0, 12.0, 16.0, 8.0, 12.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-87.9195785522461, -85.53974151611328, -83.159912109375, -80.78007507324219, -78.40023803710938, -76.02040100097656, -73.64056396484375, -71.26073455810547, -68.88089752197266, -66.50106048583984, -64.12123107910156, -61.74139404296875, -59.36155700683594, -56.981719970703125, -54.60188674926758, -52.22205352783203, -49.84221649169922, -47.462379455566406, -45.08254623413086, -42.70271301269531, -40.3228759765625, -37.94303894042969, -35.56320571899414, -33.183372497558594, -30.80353546142578, -28.4237003326416, -26.043865203857422, -23.664030075073242, -21.284194946289062, -18.904359817504883, -16.524524688720703, -14.144689559936523, -11.764846801757812, -9.385011672973633, -7.005176544189453, -4.625341415405273, -2.2455062866210938, 0.13432884216308594, 2.5141639709472656, 4.893999099731445, 7.273834228515625, 9.653669357299805, 12.033504486083984, 14.413339614868164, 16.793174743652344, 19.173009872436523, 21.552845001220703, 23.932680130004883, 26.312515258789062, 28.692350387573242, 31.072185516357422, 33.45201873779297, 35.83185577392578, 38.211692810058594, 40.59152603149414, 42.97135925292969, 45.3511962890625, 47.73103332519531, 50.11086654663086, 52.490699768066406, 54.87053680419922, 57.25037384033203, 59.63020706176758, 62.010040283203125, 64.38987731933594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 16.0, 26.0, 34.0, 67.0, 89.0, 159.0, 303.0, 516.0, 1083.0, 2380.0, 5697.0, 15959.0, 82775.0, 1550567.0, 2374720.0, 131933.0, 18185.0, 5385.0, 2033.0, 940.0, 457.0, 314.0, 198.0, 109.0, 87.0, 61.0, 52.0, 28.0, 21.0, 18.0, 12.0, 7.0, 9.0, 9.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9296875, -8.60009765625, -8.2705078125, -7.94091796875, -7.611328125, -7.28173828125, -6.9521484375, -6.62255859375, -6.29296875, -5.96337890625, -5.6337890625, -5.30419921875, -4.974609375, -4.64501953125, -4.3154296875, -3.98583984375, -3.65625, -3.32666015625, -2.9970703125, -2.66748046875, -2.337890625, -2.00830078125, -1.6787109375, -1.34912109375, -1.01953125, -0.68994140625, -0.3603515625, -0.03076171875, 0.298828125, 0.62841796875, 0.9580078125, 1.28759765625, 1.6171875, 1.94677734375, 2.2763671875, 2.60595703125, 2.935546875, 3.26513671875, 3.5947265625, 3.92431640625, 4.25390625, 4.58349609375, 4.9130859375, 5.24267578125, 5.572265625, 5.90185546875, 6.2314453125, 6.56103515625, 6.890625, 7.22021484375, 7.5498046875, 7.87939453125, 8.208984375, 8.53857421875, 8.8681640625, 9.19775390625, 9.52734375, 9.85693359375, 10.1865234375, 10.51611328125, 10.845703125, 11.17529296875, 11.5048828125, 11.83447265625, 12.1640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 18.0, 24.0, 37.0, 50.0, 79.0, 73.0, 101.0, 106.0, 113.0, 100.0, 88.0, 54.0, 53.0, 35.0, 22.0, 19.0, 13.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.64453125, -3.41510009765625, -3.1856689453125, -2.95623779296875, -2.726806640625, -2.49737548828125, -2.2679443359375, -2.03851318359375, -1.80908203125, -1.57965087890625, -1.3502197265625, -1.12078857421875, -0.891357421875, -0.66192626953125, -0.4324951171875, -0.20306396484375, 0.0263671875, 0.25579833984375, 0.4852294921875, 0.71466064453125, 0.944091796875, 1.17352294921875, 1.4029541015625, 1.63238525390625, 1.86181640625, 2.09124755859375, 2.3206787109375, 2.55010986328125, 2.779541015625, 3.00897216796875, 3.2384033203125, 3.46783447265625, 3.697265625, 3.92669677734375, 4.1561279296875, 4.38555908203125, 4.614990234375, 4.84442138671875, 5.0738525390625, 5.30328369140625, 5.53271484375, 5.76214599609375, 5.9915771484375, 6.22100830078125, 6.450439453125, 6.67987060546875, 6.9093017578125, 7.13873291015625, 7.3681640625, 7.59759521484375, 7.8270263671875, 8.05645751953125, 8.285888671875, 8.51531982421875, 8.7447509765625, 8.97418212890625, 9.20361328125, 9.43304443359375, 9.6624755859375, 9.89190673828125, 10.121337890625, 10.35076904296875, 10.5802001953125, 10.80963134765625, 11.0390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 18.0, 49.0, 107.0, 320.0, 1107.0, 6904.0, 4153733.0, 29612.0, 1765.0, 384.0, 133.0, 52.0, 36.0, 18.0, 7.0, 6.0, 6.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.76708984375, -66.7841796875, -64.80126953125, -62.818359375, -60.83544921875, -58.8525390625, -56.86962890625, -54.88671875, -52.90380859375, -50.9208984375, -48.93798828125, -46.955078125, -44.97216796875, -42.9892578125, -41.00634765625, -39.0234375, -37.04052734375, -35.0576171875, -33.07470703125, -31.091796875, -29.10888671875, -27.1259765625, -25.14306640625, -23.16015625, -21.17724609375, -19.1943359375, -17.21142578125, -15.228515625, -13.24560546875, -11.2626953125, -9.27978515625, -7.296875, -5.31396484375, -3.3310546875, -1.34814453125, 0.634765625, 2.61767578125, 4.6005859375, 6.58349609375, 8.56640625, 10.54931640625, 12.5322265625, 14.51513671875, 16.498046875, 18.48095703125, 20.4638671875, 22.44677734375, 24.4296875, 26.41259765625, 28.3955078125, 30.37841796875, 32.361328125, 34.34423828125, 36.3271484375, 38.31005859375, 40.29296875, 42.27587890625, 44.2587890625, 46.24169921875, 48.224609375, 50.20751953125, 52.1904296875, 54.17333984375, 56.15625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 14.0, 27.0, 58.0, 179.0, 455.0, 1220.0, 1230.0, 543.0, 208.0, 89.0, 30.0, 11.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.77685546875, -32.8662109375, -31.95556640625, -31.044921875, -30.13427734375, -29.2236328125, -28.31298828125, -27.40234375, -26.49169921875, -25.5810546875, -24.67041015625, -23.759765625, -22.84912109375, -21.9384765625, -21.02783203125, -20.1171875, -19.20654296875, -18.2958984375, -17.38525390625, -16.474609375, -15.56396484375, -14.6533203125, -13.74267578125, -12.83203125, -11.92138671875, -11.0107421875, -10.10009765625, -9.189453125, -8.27880859375, -7.3681640625, -6.45751953125, -5.546875, -4.63623046875, -3.7255859375, -2.81494140625, -1.904296875, -0.99365234375, -0.0830078125, 0.82763671875, 1.73828125, 2.64892578125, 3.5595703125, 4.47021484375, 5.380859375, 6.29150390625, 7.2021484375, 8.11279296875, 9.0234375, 9.93408203125, 10.8447265625, 11.75537109375, 12.666015625, 13.57666015625, 14.4873046875, 15.39794921875, 16.30859375, 17.21923828125, 18.1298828125, 19.04052734375, 19.951171875, 20.86181640625, 21.7724609375, 22.68310546875, 23.59375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 5.0, 6.0, 13.0, 16.0, 21.0, 43.0, 56.0, 101.0, 145.0, 191.0, 129.0, 96.0, 52.0, 43.0, 19.0, 6.0, 17.0, 4.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.18042755126953, -114.42601013183594, -110.67159271240234, -106.91717529296875, -103.16276550292969, -99.4083480834961, -95.6539306640625, -91.8995132446289, -88.14509582519531, -84.39067840576172, -80.63626098632812, -76.88185119628906, -73.12743377685547, -69.37301635742188, -65.61859893798828, -61.86418151855469, -58.109771728515625, -54.35535430908203, -50.6009407043457, -46.84652328491211, -43.09210968017578, -39.33769226074219, -35.583274841308594, -31.828859329223633, -28.074443817138672, -24.32002830505371, -20.56561279296875, -16.811195373535156, -13.056779861450195, -9.302364349365234, -5.547946929931641, -1.7935314178466797, 1.96087646484375, 5.715292453765869, 9.469708442687988, 13.224124908447266, 16.978540420532227, 20.732955932617188, 24.48737335205078, 28.241788864135742, 31.996204376220703, 35.7506217956543, 39.505035400390625, 43.25945281982422, 47.01387023925781, 50.76828384399414, 54.522701263427734, 58.27711486816406, 62.031532287597656, 65.78594970703125, 69.54036712646484, 73.29478454589844, 77.0491943359375, 80.8036117553711, 84.55802917480469, 88.31244659423828, 92.06686401367188, 95.82128143310547, 99.57569885253906, 103.33010864257812, 107.08452606201172, 110.83894348144531, 114.5933609008789, 118.3477783203125, 122.10218811035156]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 17.0, 25.0, 61.0, 83.0, 86.0, 123.0, 122.0, 148.0, 94.0, 75.0, 56.0, 47.0, 25.0, 10.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-164.6021270751953, -159.8663330078125, -155.1305389404297, -150.39474487304688, -145.658935546875, -140.9231414794922, -136.18734741210938, -131.45155334472656, -126.71575927734375, -121.97996520996094, -117.24417114257812, -112.50836944580078, -107.77257537841797, -103.03678131103516, -98.30097961425781, -93.565185546875, -88.82939147949219, -84.09359741210938, -79.35780334472656, -74.62200164794922, -69.8862075805664, -65.1504135131836, -60.414615631103516, -55.67881774902344, -50.943023681640625, -46.20722961425781, -41.471431732177734, -36.735633850097656, -31.999839782714844, -27.2640438079834, -22.528247833251953, -17.792449951171875, -13.056671142578125, -8.32087516784668, -3.5850791931152344, 1.150716781616211, 5.886512756347656, 10.622308731079102, 15.358104705810547, 20.093902587890625, 24.829696655273438, 29.565492630004883, 34.30128860473633, 39.037086486816406, 43.77288055419922, 48.50867462158203, 53.24447250366211, 57.98027038574219, 62.716064453125, 67.45185852050781, 72.18765258789062, 76.92345428466797, 81.65924835205078, 86.3950424194336, 91.13084411621094, 95.86663818359375, 100.60243225097656, 105.33822631835938, 110.07402038574219, 114.80982208251953, 119.54561614990234, 124.28141021728516, 129.0172119140625, 133.7530059814453, 138.48880004882812]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 17.0, 19.0, 56.0, 108.0, 238.0, 481.0, 1395.0, 4868.0, 31319.0, 757488.0, 232834.0, 14990.0, 3095.0, 927.0, 349.0, 166.0, 83.0, 48.0, 21.0, 8.0, 7.0, 13.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1456298828125, -12.689697265625, -12.2337646484375, -11.77783203125, -11.3218994140625, -10.865966796875, -10.4100341796875, -9.9541015625, -9.4981689453125, -9.042236328125, -8.5863037109375, -8.13037109375, -7.6744384765625, -7.218505859375, -6.7625732421875, -6.306640625, -5.8507080078125, -5.394775390625, -4.9388427734375, -4.48291015625, -4.0269775390625, -3.571044921875, -3.1151123046875, -2.6591796875, -2.2032470703125, -1.747314453125, -1.2913818359375, -0.83544921875, -0.3795166015625, 0.076416015625, 0.5323486328125, 0.98828125, 1.4442138671875, 1.900146484375, 2.3560791015625, 2.81201171875, 3.2679443359375, 3.723876953125, 4.1798095703125, 4.6357421875, 5.0916748046875, 5.547607421875, 6.0035400390625, 6.45947265625, 6.9154052734375, 7.371337890625, 7.8272705078125, 8.283203125, 8.7391357421875, 9.195068359375, 9.6510009765625, 10.10693359375, 10.5628662109375, 11.018798828125, 11.4747314453125, 11.9306640625, 12.3865966796875, 12.842529296875, 13.2984619140625, 13.75439453125, 14.2103271484375, 14.666259765625, 15.1221923828125, 15.578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 16.0, 32.0, 34.0, 70.0, 111.0, 140.0, 105.0, 152.0, 101.0, 95.0, 53.0, 47.0, 23.0, 13.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.09375, -10.7225341796875, -10.351318359375, -9.9801025390625, -9.60888671875, -9.2376708984375, -8.866455078125, -8.4952392578125, -8.1240234375, -7.7528076171875, -7.381591796875, -7.0103759765625, -6.63916015625, -6.2679443359375, -5.896728515625, -5.5255126953125, -5.154296875, -4.7830810546875, -4.411865234375, -4.0406494140625, -3.66943359375, -3.2982177734375, -2.927001953125, -2.5557861328125, -2.1845703125, -1.8133544921875, -1.442138671875, -1.0709228515625, -0.69970703125, -0.3284912109375, 0.042724609375, 0.4139404296875, 0.78515625, 1.1563720703125, 1.527587890625, 1.8988037109375, 2.27001953125, 2.6412353515625, 3.012451171875, 3.3836669921875, 3.7548828125, 4.1260986328125, 4.497314453125, 4.8685302734375, 5.23974609375, 5.6109619140625, 5.982177734375, 6.3533935546875, 6.724609375, 7.0958251953125, 7.467041015625, 7.8382568359375, 8.20947265625, 8.5806884765625, 8.951904296875, 9.3231201171875, 9.6943359375, 10.0655517578125, 10.436767578125, 10.8079833984375, 11.17919921875, 11.5504150390625, 11.921630859375, 12.2928466796875, 12.6640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 12.0, 10.0, 14.0, 19.0, 21.0, 20.0, 33.0, 56.0, 70.0, 119.0, 184.0, 313.0, 566.0, 1228.0, 3540.0, 17947.0, 282883.0, 712465.0, 22263.0, 3891.0, 1341.0, 633.0, 323.0, 172.0, 124.0, 74.0, 56.0, 34.0, 33.0, 24.0, 12.0, 13.0, 11.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.3671875, -10.062744140625, -9.75830078125, -9.453857421875, -9.1494140625, -8.844970703125, -8.54052734375, -8.236083984375, -7.931640625, -7.627197265625, -7.32275390625, -7.018310546875, -6.7138671875, -6.409423828125, -6.10498046875, -5.800537109375, -5.49609375, -5.191650390625, -4.88720703125, -4.582763671875, -4.2783203125, -3.973876953125, -3.66943359375, -3.364990234375, -3.060546875, -2.756103515625, -2.45166015625, -2.147216796875, -1.8427734375, -1.538330078125, -1.23388671875, -0.929443359375, -0.625, -0.320556640625, -0.01611328125, 0.288330078125, 0.5927734375, 0.897216796875, 1.20166015625, 1.506103515625, 1.810546875, 2.114990234375, 2.41943359375, 2.723876953125, 3.0283203125, 3.332763671875, 3.63720703125, 3.941650390625, 4.24609375, 4.550537109375, 4.85498046875, 5.159423828125, 5.4638671875, 5.768310546875, 6.07275390625, 6.377197265625, 6.681640625, 6.986083984375, 7.29052734375, 7.594970703125, 7.8994140625, 8.203857421875, 8.50830078125, 8.812744140625, 9.1171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 13.0, 12.0, 17.0, 12.0, 16.0, 19.0, 31.0, 34.0, 35.0, 41.0, 49.0, 60.0, 53.0, 62.0, 60.0, 56.0, 52.0, 53.0, 44.0, 39.0, 28.0, 31.0, 28.0, 18.0, 11.0, 18.0, 5.0, 12.0, 12.0, 17.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.890625, -16.394287109375, -15.89794921875, -15.401611328125, -14.9052734375, -14.408935546875, -13.91259765625, -13.416259765625, -12.919921875, -12.423583984375, -11.92724609375, -11.430908203125, -10.9345703125, -10.438232421875, -9.94189453125, -9.445556640625, -8.94921875, -8.452880859375, -7.95654296875, -7.460205078125, -6.9638671875, -6.467529296875, -5.97119140625, -5.474853515625, -4.978515625, -4.482177734375, -3.98583984375, -3.489501953125, -2.9931640625, -2.496826171875, -2.00048828125, -1.504150390625, -1.0078125, -0.511474609375, -0.01513671875, 0.481201171875, 0.9775390625, 1.473876953125, 1.97021484375, 2.466552734375, 2.962890625, 3.459228515625, 3.95556640625, 4.451904296875, 4.9482421875, 5.444580078125, 5.94091796875, 6.437255859375, 6.93359375, 7.429931640625, 7.92626953125, 8.422607421875, 8.9189453125, 9.415283203125, 9.91162109375, 10.407958984375, 10.904296875, 11.400634765625, 11.89697265625, 12.393310546875, 12.8896484375, 13.385986328125, 13.88232421875, 14.378662109375, 14.875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 7.0, 8.0, 17.0, 21.0, 22.0, 38.0, 61.0, 80.0, 123.0, 231.0, 468.0, 908.0, 2019.0, 5176.0, 17986.0, 117561.0, 843139.0, 44367.0, 10103.0, 3282.0, 1360.0, 663.0, 346.0, 216.0, 113.0, 76.0, 39.0, 32.0, 29.0, 19.0, 14.0, 8.0, 3.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.69921875, -1.646575927734375, -1.59393310546875, -1.541290283203125, -1.4886474609375, -1.436004638671875, -1.38336181640625, -1.330718994140625, -1.278076171875, -1.225433349609375, -1.17279052734375, -1.120147705078125, -1.0675048828125, -1.014862060546875, -0.96221923828125, -0.909576416015625, -0.85693359375, -0.804290771484375, -0.75164794921875, -0.699005126953125, -0.6463623046875, -0.593719482421875, -0.54107666015625, -0.488433837890625, -0.435791015625, -0.383148193359375, -0.33050537109375, -0.277862548828125, -0.2252197265625, -0.172576904296875, -0.11993408203125, -0.067291259765625, -0.0146484375, 0.037994384765625, 0.09063720703125, 0.143280029296875, 0.1959228515625, 0.248565673828125, 0.30120849609375, 0.353851318359375, 0.406494140625, 0.459136962890625, 0.51177978515625, 0.564422607421875, 0.6170654296875, 0.669708251953125, 0.72235107421875, 0.774993896484375, 0.82763671875, 0.880279541015625, 0.93292236328125, 0.985565185546875, 1.0382080078125, 1.090850830078125, 1.14349365234375, 1.196136474609375, 1.248779296875, 1.301422119140625, 1.35406494140625, 1.406707763671875, 1.4593505859375, 1.511993408203125, 1.56463623046875, 1.617279052734375, 1.669921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 6.0, 5.0, 9.0, 11.0, 9.0, 11.0, 22.0, 27.0, 24.0, 39.0, 35.0, 57.0, 94.0, 95.0, 111.0, 105.0, 72.0, 63.0, 47.0, 42.0, 20.0, 15.0, 18.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 7.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.00040328875184059143, -0.0003900602459907532, -0.0003768317401409149, -0.00036360323429107666, -0.0003503747284412384, -0.00033714622259140015, -0.0003239177167415619, -0.00031068921089172363, -0.0002974607050418854, -0.0002842321991920471, -0.00027100369334220886, -0.0002577751874923706, -0.00024454668164253235, -0.0002313181757926941, -0.00021808966994285583, -0.00020486116409301758, -0.00019163265824317932, -0.00017840415239334106, -0.0001651756465435028, -0.00015194714069366455, -0.0001387186348438263, -0.00012549012899398804, -0.00011226162314414978, -9.903311729431152e-05, -8.580461144447327e-05, -7.257610559463501e-05, -5.934759974479675e-05, -4.6119093894958496e-05, -3.289058804512024e-05, -1.9662082195281982e-05, -6.433576345443726e-06, 6.794929504394531e-06, 2.0023435354232788e-05, 3.3251941204071045e-05, 4.64804470539093e-05, 5.970895290374756e-05, 7.293745875358582e-05, 8.616596460342407e-05, 9.939447045326233e-05, 0.00011262297630310059, 0.00012585148215293884, 0.0001390799880027771, 0.00015230849385261536, 0.0001655369997024536, 0.00017876550555229187, 0.00019199401140213013, 0.00020522251725196838, 0.00021845102310180664, 0.0002316795289516449, 0.00024490803480148315, 0.0002581365406513214, 0.00027136504650115967, 0.0002845935523509979, 0.0002978220582008362, 0.00031105056405067444, 0.0003242790699005127, 0.00033750757575035095, 0.0003507360816001892, 0.00036396458745002747, 0.0003771930932998657, 0.000390421599149704, 0.00040365010499954224, 0.0004168786108493805, 0.00043010711669921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 11.0, 15.0, 23.0, 40.0, 52.0, 59.0, 95.0, 150.0, 265.0, 458.0, 937.0, 2005.0, 5010.0, 15526.0, 74395.0, 833565.0, 88155.0, 17875.0, 5559.0, 2094.0, 992.0, 519.0, 275.0, 165.0, 78.0, 71.0, 35.0, 32.0, 22.0, 16.0, 9.0, 6.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.4943389892578125, -1.443756103515625, -1.3931732177734375, -1.34259033203125, -1.2920074462890625, -1.241424560546875, -1.1908416748046875, -1.1402587890625, -1.0896759033203125, -1.039093017578125, -0.9885101318359375, -0.93792724609375, -0.8873443603515625, -0.836761474609375, -0.7861785888671875, -0.735595703125, -0.6850128173828125, -0.634429931640625, -0.5838470458984375, -0.53326416015625, -0.4826812744140625, -0.432098388671875, -0.3815155029296875, -0.3309326171875, -0.2803497314453125, -0.229766845703125, -0.1791839599609375, -0.12860107421875, -0.0780181884765625, -0.027435302734375, 0.0231475830078125, 0.07373046875, 0.1243133544921875, 0.174896240234375, 0.2254791259765625, 0.27606201171875, 0.3266448974609375, 0.377227783203125, 0.4278106689453125, 0.4783935546875, 0.5289764404296875, 0.579559326171875, 0.6301422119140625, 0.68072509765625, 0.7313079833984375, 0.781890869140625, 0.8324737548828125, 0.883056640625, 0.9336395263671875, 0.984222412109375, 1.0348052978515625, 1.08538818359375, 1.1359710693359375, 1.186553955078125, 1.2371368408203125, 1.2877197265625, 1.3383026123046875, 1.388885498046875, 1.4394683837890625, 1.49005126953125, 1.5406341552734375, 1.591217041015625, 1.6417999267578125, 1.6923828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 6.0, 7.0, 10.0, 9.0, 9.0, 16.0, 24.0, 32.0, 26.0, 40.0, 64.0, 94.0, 116.0, 124.0, 114.0, 85.0, 44.0, 37.0, 32.0, 22.0, 18.0, 15.0, 8.0, 5.0, 11.0, 4.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.828125, -1.7692108154296875, -1.710296630859375, -1.6513824462890625, -1.59246826171875, -1.5335540771484375, -1.474639892578125, -1.4157257080078125, -1.3568115234375, -1.2978973388671875, -1.238983154296875, -1.1800689697265625, -1.12115478515625, -1.0622406005859375, -1.003326416015625, -0.9444122314453125, -0.885498046875, -0.8265838623046875, -0.767669677734375, -0.7087554931640625, -0.64984130859375, -0.5909271240234375, -0.532012939453125, -0.4730987548828125, -0.4141845703125, -0.3552703857421875, -0.296356201171875, -0.2374420166015625, -0.17852783203125, -0.1196136474609375, -0.060699462890625, -0.0017852783203125, 0.05712890625, 0.1160430908203125, 0.174957275390625, 0.2338714599609375, 0.29278564453125, 0.3516998291015625, 0.410614013671875, 0.4695281982421875, 0.5284423828125, 0.5873565673828125, 0.646270751953125, 0.7051849365234375, 0.76409912109375, 0.8230133056640625, 0.881927490234375, 0.9408416748046875, 0.999755859375, 1.0586700439453125, 1.117584228515625, 1.1764984130859375, 1.23541259765625, 1.2943267822265625, 1.353240966796875, 1.4121551513671875, 1.4710693359375, 1.5299835205078125, 1.588897705078125, 1.6478118896484375, 1.70672607421875, 1.7656402587890625, 1.824554443359375, 1.8834686279296875, 1.9423828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 18.0, 61.0, 239.0, 487.0, 81.0, 47.0, 23.0, 16.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.95459747314453, -64.57491302490234, -61.19522476196289, -57.81553649902344, -54.43585205078125, -51.05616760253906, -47.67647933959961, -44.296791076660156, -40.91710662841797, -37.53742218017578, -34.15773391723633, -30.778047561645508, -27.398361206054688, -24.018674850463867, -20.638988494873047, -17.259302139282227, -13.879615783691406, -10.499929428100586, -7.120243072509766, -3.7405567169189453, -0.360870361328125, 3.0188159942626953, 6.398502349853516, 9.778188705444336, 13.157875061035156, 16.537561416625977, 19.917247772216797, 23.296934127807617, 26.676620483398438, 30.056306838989258, 33.43599319458008, 36.81568145751953, 40.19537353515625, 43.57505798339844, 46.95474624633789, 50.334434509277344, 53.71411895751953, 57.09380340576172, 60.47349166870117, 63.853179931640625, 67.23286437988281, 70.612548828125, 73.99223327636719, 77.3719253540039, 80.7516098022461, 84.13129425048828, 87.510986328125, 90.89067077636719, 94.27035522460938, 97.65003967285156, 101.02972412109375, 104.40941619873047, 107.78910064697266, 111.16878509521484, 114.54847717285156, 117.92816162109375, 121.30784606933594, 124.68753051757812, 128.0672149658203, 131.4468994140625, 134.82659912109375, 138.20628356933594, 141.58596801757812, 144.9656524658203, 148.3453369140625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 12.0, 18.0, 23.0, 21.0, 15.0, 41.0, 30.0, 92.0, 173.0, 228.0, 108.0, 47.0, 31.0, 30.0, 31.0, 18.0, 12.0, 14.0, 11.0, 9.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-96.24513244628906, -93.96099853515625, -91.67687225341797, -89.39273834228516, -87.10860443115234, -84.82447814941406, -82.54034423828125, -80.25621032714844, -77.97207641601562, -75.68794250488281, -73.40381622314453, -71.11968231201172, -68.8355484008789, -66.55142211914062, -64.26728820800781, -61.983154296875, -59.69902801513672, -57.41489791870117, -55.13076400756836, -52.84663391113281, -50.5625, -48.27836990356445, -45.994239807128906, -43.710105895996094, -41.42597579956055, -39.141845703125, -36.85771179199219, -34.57358169555664, -32.289451599121094, -30.00531768798828, -27.721187591552734, -25.437055587768555, -23.152923583984375, -20.868791580200195, -18.584659576416016, -16.30052947998047, -14.016397476196289, -11.73226547241211, -9.448134422302246, -7.164003372192383, -4.879871368408203, -2.5957398414611816, -0.31160831451416016, 1.9725232124328613, 4.256654739379883, 6.5407867431640625, 8.824917793273926, 11.109048843383789, 13.393180847167969, 15.677312850952148, 17.961444854736328, 20.245574951171875, 22.529706954956055, 24.813838958740234, 27.09796905517578, 29.38210105895996, 31.66623306274414, 33.95036315917969, 36.2344970703125, 38.51862716674805, 40.802757263183594, 43.086891174316406, 45.37102127075195, 47.6551513671875, 49.93928527832031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 11.0, 17.0, 17.0, 34.0, 47.0, 47.0, 62.0, 89.0, 280.0, 107.0, 66.0, 42.0, 44.0, 41.0, 19.0, 21.0, 13.0, 14.0, 7.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.7109375, -10.4710693359375, -10.231201171875, -9.9913330078125, -9.75146484375, -9.5115966796875, -9.271728515625, -9.0318603515625, -8.7919921875, -8.5521240234375, -8.312255859375, -8.0723876953125, -7.83251953125, -7.5926513671875, -7.352783203125, -7.1129150390625, -6.873046875, -6.6331787109375, -6.393310546875, -6.1534423828125, -5.91357421875, -5.6737060546875, -5.433837890625, -5.1939697265625, -4.9541015625, -4.7142333984375, -4.474365234375, -4.2344970703125, -3.99462890625, -3.7547607421875, -3.514892578125, -3.2750244140625, -3.03515625, -2.7952880859375, -2.555419921875, -2.3155517578125, -2.07568359375, -1.8358154296875, -1.595947265625, -1.3560791015625, -1.1162109375, -0.8763427734375, -0.636474609375, -0.3966064453125, -0.15673828125, 0.0831298828125, 0.322998046875, 0.5628662109375, 0.802734375, 1.0426025390625, 1.282470703125, 1.5223388671875, 1.76220703125, 2.0020751953125, 2.241943359375, 2.4818115234375, 2.7216796875, 2.9615478515625, 3.201416015625, 3.4412841796875, 3.68115234375, 3.9210205078125, 4.160888671875, 4.4007568359375, 4.640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 5.0, 2.0, 6.0, 4.0, 9.0, 17.0, 24.0, 37.0, 52.0, 80.0, 113.0, 239.0, 694.0, 2653.0, 26119.0, 8347808.0, 8300.0, 1411.0, 471.0, 203.0, 119.0, 68.0, 32.0, 28.0, 29.0, 15.0, 10.0, 9.0, 11.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46763610839844, -45.8476676940918, -44.227699279785156, -42.60772705078125, -40.98775863647461, -39.36779022216797, -37.74782180786133, -36.12785339355469, -34.50788116455078, -32.88791275024414, -31.267942428588867, -29.647974014282227, -28.028003692626953, -26.408035278320312, -24.788066864013672, -23.16809844970703, -21.54813003540039, -19.92816162109375, -18.308191299438477, -16.688222885131836, -15.068253517150879, -13.448284149169922, -11.828315734863281, -10.208346366882324, -8.588376998901367, -6.96840763092041, -5.348438739776611, -3.7284698486328125, -2.1085004806518555, -0.48853111267089844, 1.1314373016357422, 2.751406669616699, 4.371372222900391, 5.991341590881348, 7.6113104820251465, 9.231279373168945, 10.851248741149902, 12.47121810913086, 14.0911865234375, 15.711155891418457, 17.331125259399414, 18.951093673706055, 20.571063995361328, 22.19103240966797, 23.81100082397461, 25.430971145629883, 27.050939559936523, 28.670909881591797, 30.290878295898438, 31.910846710205078, 33.53081512451172, 35.150787353515625, 36.770755767822266, 38.390724182128906, 40.01069259643555, 41.63066101074219, 43.250633239746094, 44.870601654052734, 46.490570068359375, 48.11054229736328, 49.73051071166992, 51.35047912597656, 52.9704475402832, 54.590415954589844, 56.210384368896484]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 7.0, 2.0, 8.0, 7.0, 3.0, 1.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.96797943115234, -83.19800567626953, -79.42802429199219, -75.65805053710938, -71.88807678222656, -68.11810302734375, -64.34812927246094, -60.578147888183594, -56.80817413330078, -53.03820037841797, -49.26822280883789, -45.49824523925781, -41.728271484375, -37.95829772949219, -34.18832015991211, -30.418344497680664, -26.64836883544922, -22.878393173217773, -19.108417510986328, -15.338441848754883, -11.568466186523438, -7.798490524291992, -4.028514862060547, -0.25853919982910156, 3.5114364624023438, 7.281412124633789, 11.051387786865234, 14.82136344909668, 18.591339111328125, 22.36131477355957, 26.131290435791016, 29.90126609802246, 33.671234130859375, 37.44120788574219, 41.211185455322266, 44.981163024902344, 48.751136779785156, 52.52111053466797, 56.29108810424805, 60.061065673828125, 63.83103942871094, 67.60101318359375, 71.37098693847656, 75.1409683227539, 78.91094207763672, 82.68091583251953, 86.45089721679688, 90.22087097167969, 93.9908447265625, 97.76081848144531, 101.53079223632812, 105.30077362060547, 109.07074737548828, 112.8407211303711, 116.61070251464844, 120.38067626953125, 124.15065002441406, 127.92062377929688, 131.6905975341797, 135.4605712890625, 139.23056030273438, 143.0005340576172, 146.7705078125, 150.5404815673828, 154.31045532226562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 9.0, 7.0, 11.0, 11.0, 24.0, 21.0, 43.0, 53.0, 76.0, 75.0, 94.0, 100.0, 93.0, 84.0, 85.0, 45.0, 39.0, 26.0, 24.0, 22.0, 23.0, 16.0, 10.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.575347900390625, -2.44952392578125, -2.323699951171875, -2.1978759765625, -2.072052001953125, -1.94622802734375, -1.820404052734375, -1.694580078125, -1.568756103515625, -1.44293212890625, -1.317108154296875, -1.1912841796875, -1.065460205078125, -0.93963623046875, -0.813812255859375, -0.68798828125, -0.562164306640625, -0.43634033203125, -0.310516357421875, -0.1846923828125, -0.058868408203125, 0.06695556640625, 0.192779541015625, 0.318603515625, 0.444427490234375, 0.57025146484375, 0.696075439453125, 0.8218994140625, 0.947723388671875, 1.07354736328125, 1.199371337890625, 1.3251953125, 1.451019287109375, 1.57684326171875, 1.702667236328125, 1.8284912109375, 1.954315185546875, 2.08013916015625, 2.205963134765625, 2.331787109375, 2.457611083984375, 2.58343505859375, 2.709259033203125, 2.8350830078125, 2.960906982421875, 3.08673095703125, 3.212554931640625, 3.33837890625, 3.464202880859375, 3.59002685546875, 3.715850830078125, 3.8416748046875, 3.967498779296875, 4.09332275390625, 4.219146728515625, 4.344970703125, 4.470794677734375, 4.59661865234375, 4.722442626953125, 4.8482666015625, 4.974090576171875, 5.09991455078125, 5.225738525390625, 5.3515625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 16.0, 15.0, 37.0, 38.0, 67.0, 103.0, 216.0, 327.0, 724.0, 1559.0, 4053.0, 12142.0, 42144.0, 152598.0, 213533.0, 67892.0, 18820.0, 5914.0, 2118.0, 890.0, 470.0, 224.0, 126.0, 80.0, 47.0, 35.0, 24.0, 15.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-45.25, -44.1513671875, -43.052734375, -41.9541015625, -40.85546875, -39.7568359375, -38.658203125, -37.5595703125, -36.4609375, -35.3623046875, -34.263671875, -33.1650390625, -32.06640625, -30.9677734375, -29.869140625, -28.7705078125, -27.671875, -26.5732421875, -25.474609375, -24.3759765625, -23.27734375, -22.1787109375, -21.080078125, -19.9814453125, -18.8828125, -17.7841796875, -16.685546875, -15.5869140625, -14.48828125, -13.3896484375, -12.291015625, -11.1923828125, -10.09375, -8.9951171875, -7.896484375, -6.7978515625, -5.69921875, -4.6005859375, -3.501953125, -2.4033203125, -1.3046875, -0.2060546875, 0.892578125, 1.9912109375, 3.08984375, 4.1884765625, 5.287109375, 6.3857421875, 7.484375, 8.5830078125, 9.681640625, 10.7802734375, 11.87890625, 12.9775390625, 14.076171875, 15.1748046875, 16.2734375, 17.3720703125, 18.470703125, 19.5693359375, 20.66796875, 21.7666015625, 22.865234375, 23.9638671875, 25.0625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 10.0, 12.0, 11.0, 14.0, 26.0, 33.0, 42.0, 53.0, 70.0, 78.0, 98.0, 85.0, 77.0, 95.0, 58.0, 66.0, 42.0, 37.0, 30.0, 17.0, 13.0, 7.0, 12.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.7205810546875, -8.495849609375, -8.2711181640625, -8.04638671875, -7.8216552734375, -7.596923828125, -7.3721923828125, -7.1474609375, -6.9227294921875, -6.697998046875, -6.4732666015625, -6.24853515625, -6.0238037109375, -5.799072265625, -5.5743408203125, -5.349609375, -5.1248779296875, -4.900146484375, -4.6754150390625, -4.45068359375, -4.2259521484375, -4.001220703125, -3.7764892578125, -3.5517578125, -3.3270263671875, -3.102294921875, -2.8775634765625, -2.65283203125, -2.4281005859375, -2.203369140625, -1.9786376953125, -1.75390625, -1.5291748046875, -1.304443359375, -1.0797119140625, -0.85498046875, -0.6302490234375, -0.405517578125, -0.1807861328125, 0.0439453125, 0.2686767578125, 0.493408203125, 0.7181396484375, 0.94287109375, 1.1676025390625, 1.392333984375, 1.6170654296875, 1.841796875, 2.0665283203125, 2.291259765625, 2.5159912109375, 2.74072265625, 2.9654541015625, 3.190185546875, 3.4149169921875, 3.6396484375, 3.8643798828125, 4.089111328125, 4.3138427734375, 4.53857421875, 4.7633056640625, 4.988037109375, 5.2127685546875, 5.4375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 37.0, 51.0, 84.0, 95.0, 67.0, 55.0, 23.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.075550079345703, -29.563095092773438, -28.050642013549805, -26.538188934326172, -25.025733947753906, -23.51327896118164, -22.000825881958008, -20.488372802734375, -18.97591781616211, -17.463462829589844, -15.951009750366211, -14.438555717468262, -12.926101684570312, -11.413647651672363, -9.901193618774414, -8.388739585876465, -6.876285552978516, -5.363831520080566, -3.851377487182617, -2.338923454284668, -0.8264694213867188, 0.6859846115112305, 2.1984386444091797, 3.710892677307129, 5.223346710205078, 6.735800743103027, 8.248254776000977, 9.760708808898926, 11.273162841796875, 12.785616874694824, 14.298070907592773, 15.810524940490723, 17.322975158691406, 18.835430145263672, 20.347883224487305, 21.860336303710938, 23.372791290283203, 24.88524627685547, 26.3976993560791, 27.910152435302734, 29.422607421875, 30.935062408447266, 32.44751739501953, 33.95996856689453, 35.4724235534668, 36.98487854003906, 38.49732971191406, 40.00978469848633, 41.522239685058594, 43.03469467163086, 44.547149658203125, 46.059600830078125, 47.57205581665039, 49.084510803222656, 50.596961975097656, 52.10941696166992, 53.62187194824219, 55.13432693481445, 56.64678192138672, 58.15923309326172, 59.671688079833984, 61.18414306640625, 62.69659423828125, 64.20905303955078, 65.72150421142578]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 15.0, 10.0, 17.0, 47.0, 64.0, 104.0, 72.0, 49.0, 24.0, 14.0, 11.0, 5.0, 2.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65226745605469, -35.617313385009766, -34.582359313964844, -33.54740524291992, -32.512451171875, -31.477495193481445, -30.44253921508789, -29.40758514404297, -28.372631072998047, -27.337677001953125, -26.302722930908203, -25.26776695251465, -24.232812881469727, -23.197858810424805, -22.16290283203125, -21.127948760986328, -20.092994689941406, -19.058040618896484, -18.023086547851562, -16.988130569458008, -15.953176498413086, -14.918222427368164, -13.883267402648926, -12.848312377929688, -11.813358306884766, -10.778404235839844, -9.743449211120605, -8.708494186401367, -7.673540115356445, -6.638585567474365, -5.603631019592285, -4.568676471710205, -3.533721923828125, -2.498767375946045, -1.4638128280639648, -0.42885828018188477, 0.6060962677001953, 1.6410508155822754, 2.6760053634643555, 3.7109599113464355, 4.745914459228516, 5.780869007110596, 6.815823554992676, 7.850778102874756, 8.885732650756836, 9.920686721801758, 10.955641746520996, 11.990596771240234, 13.025550842285156, 14.060504913330078, 15.095459938049316, 16.130414962768555, 17.165369033813477, 18.2003231048584, 19.235279083251953, 20.270233154296875, 21.305187225341797, 22.34014129638672, 23.37509536743164, 24.410051345825195, 25.445005416870117, 26.47995948791504, 27.514915466308594, 28.549869537353516, 29.584823608398438]}, "eval/loss": 5.443604946136475, "eval/wer": 1.5227687425624752, "eval/runtime": 664.731, "eval/samples_per_second": 3.975, "eval/steps_per_second": 0.498} \ No newline at end of file