diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" --- "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" +++ "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.1696, "train/learning_rate": 2.6438836104513065e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 17413, "_timestamp": 1646964652, "_step": 3001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 7.0, 11.0, 22.0, 14.0, 17.0, 26.0, 24.0, 38.0, 35.0, 35.0, 32.0, 49.0, 43.0, 38.0, 47.0, 41.0, 48.0, 46.0, 38.0, 36.0, 43.0, 45.0, 32.0, 26.0, 32.0, 21.0, 24.0, 19.0, 17.0, 16.0, 12.0, 5.0, 5.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-75.23033142089844, -73.39999389648438, -71.56965637207031, -69.73931884765625, -67.90898132324219, -66.0786361694336, -64.24829864501953, -62.41796112060547, -60.587623596191406, -58.757286071777344, -56.92694854736328, -55.09660720825195, -53.26626968383789, -51.43593215942383, -49.6055908203125, -47.77525329589844, -45.944915771484375, -44.11457824707031, -42.28424072265625, -40.45389938354492, -38.62356185913086, -36.7932243347168, -34.96288299560547, -33.132545471191406, -31.302207946777344, -29.47187042236328, -27.641530990600586, -25.81119155883789, -23.980854034423828, -22.150516510009766, -20.32017707824707, -18.489837646484375, -16.659503936767578, -14.8291654586792, -12.99882698059082, -11.168488502502441, -9.338150024414062, -7.507811546325684, -5.677473068237305, -3.847134590148926, -2.016796112060547, -0.18645763397216797, 1.643880844116211, 3.47421932220459, 5.304557800292969, 7.134896278381348, 8.965234756469727, 10.795573234558105, 12.625911712646484, 14.456250190734863, 16.286588668823242, 18.116928100585938, 19.947265625, 21.777603149414062, 23.607942581176758, 25.438282012939453, 27.268619537353516, 29.098957061767578, 30.929296493530273, 32.75963592529297, 34.58997344970703, 36.420310974121094, 38.250648498535156, 40.080989837646484, 41.91132736206055]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 9.0, 11.0, 10.0, 13.0, 3.0, 14.0, 20.0, 14.0, 24.0, 25.0, 24.0, 26.0, 31.0, 36.0, 28.0, 41.0, 36.0, 39.0, 51.0, 47.0, 51.0, 36.0, 48.0, 45.0, 32.0, 34.0, 42.0, 28.0, 23.0, 26.0, 27.0, 15.0, 20.0, 23.0, 10.0, 19.0, 11.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.66462326049805, -53.80124282836914, -51.937862396240234, -50.074485778808594, -48.21110534667969, -46.34772491455078, -44.484344482421875, -42.62096405029297, -40.75758361816406, -38.894203186035156, -37.03082275390625, -35.167442321777344, -33.3040657043457, -31.440685272216797, -29.57730484008789, -27.713924407958984, -25.850547790527344, -23.987167358398438, -22.123788833618164, -20.260408401489258, -18.397029876708984, -16.533649444580078, -14.670269012451172, -12.806889533996582, -10.943510055541992, -9.080130577087402, -7.216750621795654, -5.353370666503906, -3.4899911880493164, -1.6266117095947266, 0.2367687225341797, 2.1001482009887695, 3.963531494140625, 5.826910972595215, 7.690290927886963, 9.553670883178711, 11.4170503616333, 13.28042984008789, 15.143810272216797, 17.007190704345703, 18.870569229125977, 20.733949661254883, 22.597328186035156, 24.460708618164062, 26.32408905029297, 28.187467575073242, 30.05084800720215, 31.914226531982422, 33.77760696411133, 35.640987396240234, 37.50436782836914, 39.36774444580078, 41.23112487792969, 43.094505310058594, 44.9578857421875, 46.821266174316406, 48.68464660644531, 50.54802703857422, 52.411407470703125, 54.27478790283203, 56.13816452026367, 58.00154495239258, 59.864925384521484, 61.72830581665039, 63.59168243408203]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 32.0, 49.0, 84.0, 120.0, 195.0, 287.0, 497.0, 793.0, 1211.0, 2051.0, 3158.0, 5232.0, 8679.0, 14639.0, 24190.0, 41076.0, 70709.0, 120204.0, 202519.0, 330330.0, 494004.0, 641447.0, 673062.0, 561723.0, 391936.0, 245942.0, 147515.0, 87204.0, 50511.0, 29710.0, 17683.0, 10581.0, 6296.0, 3789.0, 2492.0, 1579.0, 970.0, 626.0, 467.0, 239.0, 161.0, 90.0, 70.0, 45.0, 28.0, 17.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-48.71875, -47.20556640625, -45.6923828125, -44.17919921875, -42.666015625, -41.15283203125, -39.6396484375, -38.12646484375, -36.61328125, -35.10009765625, -33.5869140625, -32.07373046875, -30.560546875, -29.04736328125, -27.5341796875, -26.02099609375, -24.5078125, -22.99462890625, -21.4814453125, -19.96826171875, -18.455078125, -16.94189453125, -15.4287109375, -13.91552734375, -12.40234375, -10.88916015625, -9.3759765625, -7.86279296875, -6.349609375, -4.83642578125, -3.3232421875, -1.81005859375, -0.296875, 1.21630859375, 2.7294921875, 4.24267578125, 5.755859375, 7.26904296875, 8.7822265625, 10.29541015625, 11.80859375, 13.32177734375, 14.8349609375, 16.34814453125, 17.861328125, 19.37451171875, 20.8876953125, 22.40087890625, 23.9140625, 25.42724609375, 26.9404296875, 28.45361328125, 29.966796875, 31.47998046875, 32.9931640625, 34.50634765625, 36.01953125, 37.53271484375, 39.0458984375, 40.55908203125, 42.072265625, 43.58544921875, 45.0986328125, 46.61181640625, 48.125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 15.0, 13.0, 13.0, 16.0, 18.0, 14.0, 20.0, 20.0, 23.0, 26.0, 36.0, 31.0, 26.0, 35.0, 37.0, 42.0, 42.0, 38.0, 34.0, 45.0, 43.0, 49.0, 47.0, 31.0, 25.0, 29.0, 29.0, 27.0, 23.0, 23.0, 21.0, 14.0, 16.0, 16.0, 13.0, 11.0, 5.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.52099609375, -35.2607421875, -34.00048828125, -32.740234375, -31.47998046875, -30.2197265625, -28.95947265625, -27.69921875, -26.43896484375, -25.1787109375, -23.91845703125, -22.658203125, -21.39794921875, -20.1376953125, -18.87744140625, -17.6171875, -16.35693359375, -15.0966796875, -13.83642578125, -12.576171875, -11.31591796875, -10.0556640625, -8.79541015625, -7.53515625, -6.27490234375, -5.0146484375, -3.75439453125, -2.494140625, -1.23388671875, 0.0263671875, 1.28662109375, 2.546875, 3.80712890625, 5.0673828125, 6.32763671875, 7.587890625, 8.84814453125, 10.1083984375, 11.36865234375, 12.62890625, 13.88916015625, 15.1494140625, 16.40966796875, 17.669921875, 18.93017578125, 20.1904296875, 21.45068359375, 22.7109375, 23.97119140625, 25.2314453125, 26.49169921875, 27.751953125, 29.01220703125, 30.2724609375, 31.53271484375, 32.79296875, 34.05322265625, 35.3134765625, 36.57373046875, 37.833984375, 39.09423828125, 40.3544921875, 41.61474609375, 42.875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 24.0, 29.0, 53.0, 103.0, 136.0, 232.0, 402.0, 599.0, 982.0, 1600.0, 2526.0, 3896.0, 6369.0, 10157.0, 15663.0, 24476.0, 37620.0, 55779.0, 84020.0, 121783.0, 172486.0, 235664.0, 308766.0, 381079.0, 436514.0, 456172.0, 430021.0, 371025.0, 298360.0, 226304.0, 165178.0, 115549.0, 79671.0, 53051.0, 35292.0, 22628.0, 14770.0, 9545.0, 6016.0, 3622.0, 2365.0, 1426.0, 867.0, 552.0, 330.0, 229.0, 126.0, 76.0, 64.0, 42.0, 12.0, 12.0, 6.0, 13.0, 2.0, 1.0], "bins": [-36.1875, -35.10498046875, -34.0224609375, -32.93994140625, -31.857421875, -30.77490234375, -29.6923828125, -28.60986328125, -27.52734375, -26.44482421875, -25.3623046875, -24.27978515625, -23.197265625, -22.11474609375, -21.0322265625, -19.94970703125, -18.8671875, -17.78466796875, -16.7021484375, -15.61962890625, -14.537109375, -13.45458984375, -12.3720703125, -11.28955078125, -10.20703125, -9.12451171875, -8.0419921875, -6.95947265625, -5.876953125, -4.79443359375, -3.7119140625, -2.62939453125, -1.546875, -0.46435546875, 0.6181640625, 1.70068359375, 2.783203125, 3.86572265625, 4.9482421875, 6.03076171875, 7.11328125, 8.19580078125, 9.2783203125, 10.36083984375, 11.443359375, 12.52587890625, 13.6083984375, 14.69091796875, 15.7734375, 16.85595703125, 17.9384765625, 19.02099609375, 20.103515625, 21.18603515625, 22.2685546875, 23.35107421875, 24.43359375, 25.51611328125, 26.5986328125, 27.68115234375, 28.763671875, 29.84619140625, 30.9287109375, 32.01123046875, 33.09375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 6.0, 12.0, 20.0, 26.0, 24.0, 40.0, 53.0, 61.0, 61.0, 81.0, 104.0, 165.0, 152.0, 179.0, 193.0, 223.0, 224.0, 223.0, 257.0, 218.0, 271.0, 235.0, 196.0, 179.0, 154.0, 146.0, 119.0, 82.0, 75.0, 61.0, 58.0, 38.0, 31.0, 28.0, 13.0, 23.0, 15.0, 7.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-23.21875, -22.57763671875, -21.9365234375, -21.29541015625, -20.654296875, -20.01318359375, -19.3720703125, -18.73095703125, -18.08984375, -17.44873046875, -16.8076171875, -16.16650390625, -15.525390625, -14.88427734375, -14.2431640625, -13.60205078125, -12.9609375, -12.31982421875, -11.6787109375, -11.03759765625, -10.396484375, -9.75537109375, -9.1142578125, -8.47314453125, -7.83203125, -7.19091796875, -6.5498046875, -5.90869140625, -5.267578125, -4.62646484375, -3.9853515625, -3.34423828125, -2.703125, -2.06201171875, -1.4208984375, -0.77978515625, -0.138671875, 0.50244140625, 1.1435546875, 1.78466796875, 2.42578125, 3.06689453125, 3.7080078125, 4.34912109375, 4.990234375, 5.63134765625, 6.2724609375, 6.91357421875, 7.5546875, 8.19580078125, 8.8369140625, 9.47802734375, 10.119140625, 10.76025390625, 11.4013671875, 12.04248046875, 12.68359375, 13.32470703125, 13.9658203125, 14.60693359375, 15.248046875, 15.88916015625, 16.5302734375, 17.17138671875, 17.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 0.0, 2.0, 3.0, 4.0, 8.0, 4.0, 11.0, 12.0, 9.0, 12.0, 15.0, 23.0, 20.0, 20.0, 26.0, 29.0, 28.0, 33.0, 37.0, 28.0, 34.0, 43.0, 40.0, 49.0, 44.0, 48.0, 43.0, 30.0, 36.0, 22.0, 35.0, 26.0, 25.0, 31.0, 31.0, 22.0, 16.0, 23.0, 13.0, 6.0, 10.0, 12.0, 9.0, 2.0, 13.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-44.08357620239258, -42.78725051879883, -41.49092483520508, -40.194602966308594, -38.898277282714844, -37.601951599121094, -36.305625915527344, -35.009300231933594, -33.712974548339844, -32.416648864746094, -31.120325088500977, -29.823999404907227, -28.52767562866211, -27.23134994506836, -25.93502426147461, -24.63869857788086, -23.342376708984375, -22.046051025390625, -20.749727249145508, -19.453401565551758, -18.15707778930664, -16.86075210571289, -15.56442642211914, -14.268101692199707, -12.971776962280273, -11.67545223236084, -10.379127502441406, -9.082801818847656, -7.786477088928223, -6.490152359008789, -5.193827152252197, -3.8975019454956055, -2.6011810302734375, -1.3048560619354248, -0.00853109359741211, 1.2877938747406006, 2.5841188430786133, 3.880443572998047, 5.176768779754639, 6.4730939865112305, 7.769418716430664, 9.065743446350098, 10.362068176269531, 11.658393859863281, 12.954718589782715, 14.251043319702148, 15.547369003295898, 16.843692779541016, 18.140018463134766, 19.436344146728516, 20.732667922973633, 22.028993606567383, 23.3253173828125, 24.62164306640625, 25.91796875, 27.21429443359375, 28.510618209838867, 29.806943893432617, 31.103267669677734, 32.399593353271484, 33.695919036865234, 34.99224090576172, 36.28856658935547, 37.58489227294922, 38.88121795654297]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 6.0, 10.0, 15.0, 14.0, 15.0, 16.0, 14.0, 26.0, 15.0, 27.0, 19.0, 25.0, 37.0, 29.0, 24.0, 42.0, 37.0, 39.0, 52.0, 46.0, 32.0, 34.0, 43.0, 42.0, 37.0, 29.0, 39.0, 22.0, 29.0, 35.0, 22.0, 17.0, 15.0, 19.0, 14.0, 15.0, 11.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.623435974121094, -41.187992095947266, -39.75254440307617, -38.317100524902344, -36.881656646728516, -35.44620895385742, -34.010765075683594, -32.5753173828125, -31.139873504638672, -29.70442771911621, -28.268983840942383, -26.833538055419922, -25.39809226989746, -23.962646484375, -22.527202606201172, -21.09175682067871, -19.656312942504883, -18.220867156982422, -16.785423278808594, -15.349977493286133, -13.914531707763672, -12.479086875915527, -11.043642044067383, -9.608196258544922, -8.172751426696777, -6.737306118011475, -5.301860809326172, -3.8664159774780273, -2.4309706687927246, -0.9955253601074219, 0.43991947174072266, 1.8753652572631836, 3.310810089111328, 4.746255397796631, 6.181700706481934, 7.617145538330078, 9.052591323852539, 10.488036155700684, 11.923480987548828, 13.358926773071289, 14.794371604919434, 16.229816436767578, 17.66526222229004, 19.1007080078125, 20.536151885986328, 21.97159767150879, 23.40704345703125, 24.842487335205078, 26.27793312072754, 27.71337890625, 29.148822784423828, 30.58426856994629, 32.01971435546875, 33.45515823364258, 34.890602111816406, 36.3260498046875, 37.76149368286133, 39.196937561035156, 40.63238525390625, 42.06782913208008, 43.503273010253906, 44.938720703125, 46.37416458129883, 47.809608459472656, 49.24505615234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 0.0, 7.0, 7.0, 1.0, 10.0, 23.0, 33.0, 32.0, 48.0, 99.0, 104.0, 180.0, 264.0, 385.0, 576.0, 823.0, 1295.0, 1964.0, 3104.0, 5213.0, 9100.0, 17874.0, 38821.0, 104639.0, 326536.0, 343998.0, 110292.0, 40724.0, 18428.0, 9273.0, 5384.0, 3312.0, 1966.0, 1351.0, 882.0, 568.0, 409.0, 259.0, 168.0, 119.0, 86.0, 68.0, 38.0, 24.0, 25.0, 25.0, 11.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.5693359375, -37.326171875, -36.0830078125, -34.83984375, -33.5966796875, -32.353515625, -31.1103515625, -29.8671875, -28.6240234375, -27.380859375, -26.1376953125, -24.89453125, -23.6513671875, -22.408203125, -21.1650390625, -19.921875, -18.6787109375, -17.435546875, -16.1923828125, -14.94921875, -13.7060546875, -12.462890625, -11.2197265625, -9.9765625, -8.7333984375, -7.490234375, -6.2470703125, -5.00390625, -3.7607421875, -2.517578125, -1.2744140625, -0.03125, 1.2119140625, 2.455078125, 3.6982421875, 4.94140625, 6.1845703125, 7.427734375, 8.6708984375, 9.9140625, 11.1572265625, 12.400390625, 13.6435546875, 14.88671875, 16.1298828125, 17.373046875, 18.6162109375, 19.859375, 21.1025390625, 22.345703125, 23.5888671875, 24.83203125, 26.0751953125, 27.318359375, 28.5615234375, 29.8046875, 31.0478515625, 32.291015625, 33.5341796875, 34.77734375, 36.0205078125, 37.263671875, 38.5068359375, 39.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 9.0, 16.0, 15.0, 13.0, 18.0, 13.0, 25.0, 21.0, 21.0, 18.0, 24.0, 34.0, 34.0, 27.0, 41.0, 31.0, 44.0, 48.0, 47.0, 33.0, 31.0, 46.0, 40.0, 33.0, 36.0, 37.0, 25.0, 27.0, 36.0, 19.0, 20.0, 17.0, 19.0, 14.0, 12.0, 12.0, 10.0, 10.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.0625, -40.6494140625, -39.236328125, -37.8232421875, -36.41015625, -34.9970703125, -33.583984375, -32.1708984375, -30.7578125, -29.3447265625, -27.931640625, -26.5185546875, -25.10546875, -23.6923828125, -22.279296875, -20.8662109375, -19.453125, -18.0400390625, -16.626953125, -15.2138671875, -13.80078125, -12.3876953125, -10.974609375, -9.5615234375, -8.1484375, -6.7353515625, -5.322265625, -3.9091796875, -2.49609375, -1.0830078125, 0.330078125, 1.7431640625, 3.15625, 4.5693359375, 5.982421875, 7.3955078125, 8.80859375, 10.2216796875, 11.634765625, 13.0478515625, 14.4609375, 15.8740234375, 17.287109375, 18.7001953125, 20.11328125, 21.5263671875, 22.939453125, 24.3525390625, 25.765625, 27.1787109375, 28.591796875, 30.0048828125, 31.41796875, 32.8310546875, 34.244140625, 35.6572265625, 37.0703125, 38.4833984375, 39.896484375, 41.3095703125, 42.72265625, 44.1357421875, 45.548828125, 46.9619140625, 48.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 17.0, 14.0, 19.0, 32.0, 29.0, 33.0, 44.0, 48.0, 91.0, 120.0, 160.0, 216.0, 316.0, 437.0, 650.0, 988.0, 1579.0, 2695.0, 4965.0, 10595.0, 28452.0, 122287.0, 634093.0, 178301.0, 36153.0, 12626.0, 5656.0, 2950.0, 1755.0, 980.0, 621.0, 438.0, 304.0, 233.0, 174.0, 101.0, 108.0, 63.0, 39.0, 42.0, 38.0, 23.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.03125, -35.859375, -34.6875, -33.515625, -32.34375, -31.171875, -30.0, -28.828125, -27.65625, -26.484375, -25.3125, -24.140625, -22.96875, -21.796875, -20.625, -19.453125, -18.28125, -17.109375, -15.9375, -14.765625, -13.59375, -12.421875, -11.25, -10.078125, -8.90625, -7.734375, -6.5625, -5.390625, -4.21875, -3.046875, -1.875, -0.703125, 0.46875, 1.640625, 2.8125, 3.984375, 5.15625, 6.328125, 7.5, 8.671875, 9.84375, 11.015625, 12.1875, 13.359375, 14.53125, 15.703125, 16.875, 18.046875, 19.21875, 20.390625, 21.5625, 22.734375, 23.90625, 25.078125, 26.25, 27.421875, 28.59375, 29.765625, 30.9375, 32.109375, 33.28125, 34.453125, 35.625, 36.796875, 37.96875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 14.0, 10.0, 13.0, 12.0, 12.0, 28.0, 28.0, 25.0, 32.0, 41.0, 32.0, 34.0, 53.0, 32.0, 39.0, 43.0, 43.0, 59.0, 43.0, 40.0, 41.0, 39.0, 37.0, 34.0, 35.0, 26.0, 28.0, 34.0, 16.0, 15.0, 14.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.42041015625, -35.3408203125, -34.26123046875, -33.181640625, -32.10205078125, -31.0224609375, -29.94287109375, -28.86328125, -27.78369140625, -26.7041015625, -25.62451171875, -24.544921875, -23.46533203125, -22.3857421875, -21.30615234375, -20.2265625, -19.14697265625, -18.0673828125, -16.98779296875, -15.908203125, -14.82861328125, -13.7490234375, -12.66943359375, -11.58984375, -10.51025390625, -9.4306640625, -8.35107421875, -7.271484375, -6.19189453125, -5.1123046875, -4.03271484375, -2.953125, -1.87353515625, -0.7939453125, 0.28564453125, 1.365234375, 2.44482421875, 3.5244140625, 4.60400390625, 5.68359375, 6.76318359375, 7.8427734375, 8.92236328125, 10.001953125, 11.08154296875, 12.1611328125, 13.24072265625, 14.3203125, 15.39990234375, 16.4794921875, 17.55908203125, 18.638671875, 19.71826171875, 20.7978515625, 21.87744140625, 22.95703125, 24.03662109375, 25.1162109375, 26.19580078125, 27.275390625, 28.35498046875, 29.4345703125, 30.51416015625, 31.59375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 11.0, 7.0, 8.0, 17.0, 24.0, 25.0, 42.0, 35.0, 64.0, 76.0, 74.0, 141.0, 202.0, 273.0, 436.0, 643.0, 962.0, 1547.0, 2714.0, 4787.0, 9583.0, 22268.0, 75823.0, 632027.0, 225906.0, 40170.0, 14689.0, 6732.0, 3588.0, 2061.0, 1246.0, 776.0, 536.0, 271.0, 197.0, 161.0, 121.0, 76.0, 87.0, 24.0, 32.0, 24.0, 19.0, 15.0, 16.0, 11.0, 2.0, 8.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.140625, -15.6480712890625, -15.155517578125, -14.6629638671875, -14.17041015625, -13.6778564453125, -13.185302734375, -12.6927490234375, -12.2001953125, -11.7076416015625, -11.215087890625, -10.7225341796875, -10.22998046875, -9.7374267578125, -9.244873046875, -8.7523193359375, -8.259765625, -7.7672119140625, -7.274658203125, -6.7821044921875, -6.28955078125, -5.7969970703125, -5.304443359375, -4.8118896484375, -4.3193359375, -3.8267822265625, -3.334228515625, -2.8416748046875, -2.34912109375, -1.8565673828125, -1.364013671875, -0.8714599609375, -0.37890625, 0.1136474609375, 0.606201171875, 1.0987548828125, 1.59130859375, 2.0838623046875, 2.576416015625, 3.0689697265625, 3.5615234375, 4.0540771484375, 4.546630859375, 5.0391845703125, 5.53173828125, 6.0242919921875, 6.516845703125, 7.0093994140625, 7.501953125, 7.9945068359375, 8.487060546875, 8.9796142578125, 9.47216796875, 9.9647216796875, 10.457275390625, 10.9498291015625, 11.4423828125, 11.9349365234375, 12.427490234375, 12.9200439453125, 13.41259765625, 13.9051513671875, 14.397705078125, 14.8902587890625, 15.3828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 15.0, 10.0, 22.0, 27.0, 54.0, 91.0, 159.0, 213.0, 164.0, 88.0, 56.0, 22.0, 22.0, 21.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002490997314453125, -0.0024187564849853516, -0.002346515655517578, -0.0022742748260498047, -0.0022020339965820312, -0.002129793167114258, -0.0020575523376464844, -0.001985311508178711, -0.0019130706787109375, -0.001840829849243164, -0.0017685890197753906, -0.0016963481903076172, -0.0016241073608398438, -0.0015518665313720703, -0.0014796257019042969, -0.0014073848724365234, -0.00133514404296875, -0.0012629032135009766, -0.0011906623840332031, -0.0011184215545654297, -0.0010461807250976562, -0.0009739398956298828, -0.0009016990661621094, -0.0008294582366943359, -0.0007572174072265625, -0.0006849765777587891, -0.0006127357482910156, -0.0005404949188232422, -0.00046825408935546875, -0.0003960132598876953, -0.0003237724304199219, -0.00025153160095214844, -0.000179290771484375, -0.00010704994201660156, -3.4809112548828125e-05, 3.743171691894531e-05, 0.00010967254638671875, 0.0001819133758544922, 0.0002541542053222656, 0.00032639503479003906, 0.0003986358642578125, 0.00047087669372558594, 0.0005431175231933594, 0.0006153583526611328, 0.0006875991821289062, 0.0007598400115966797, 0.0008320808410644531, 0.0009043216705322266, 0.0009765625, 0.0010488033294677734, 0.0011210441589355469, 0.0011932849884033203, 0.0012655258178710938, 0.0013377666473388672, 0.0014100074768066406, 0.001482248306274414, 0.0015544891357421875, 0.001626729965209961, 0.0016989707946777344, 0.0017712116241455078, 0.0018434524536132812, 0.0019156932830810547, 0.001987934112548828, 0.0020601749420166016, 0.002132415771484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 8.0, 11.0, 10.0, 9.0, 23.0, 25.0, 52.0, 58.0, 112.0, 169.0, 276.0, 403.0, 658.0, 1174.0, 1897.0, 3123.0, 5325.0, 9759.0, 18208.0, 35023.0, 73823.0, 163263.0, 309577.0, 223327.0, 102018.0, 47250.0, 23696.0, 12426.0, 7011.0, 3897.0, 2314.0, 1426.0, 849.0, 482.0, 322.0, 189.0, 122.0, 88.0, 52.0, 29.0, 28.0, 12.0, 14.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.2066650390625, -9.874267578125, -9.5418701171875, -9.20947265625, -8.8770751953125, -8.544677734375, -8.2122802734375, -7.8798828125, -7.5474853515625, -7.215087890625, -6.8826904296875, -6.55029296875, -6.2178955078125, -5.885498046875, -5.5531005859375, -5.220703125, -4.8883056640625, -4.555908203125, -4.2235107421875, -3.89111328125, -3.5587158203125, -3.226318359375, -2.8939208984375, -2.5615234375, -2.2291259765625, -1.896728515625, -1.5643310546875, -1.23193359375, -0.8995361328125, -0.567138671875, -0.2347412109375, 0.09765625, 0.4300537109375, 0.762451171875, 1.0948486328125, 1.42724609375, 1.7596435546875, 2.092041015625, 2.4244384765625, 2.7568359375, 3.0892333984375, 3.421630859375, 3.7540283203125, 4.08642578125, 4.4188232421875, 4.751220703125, 5.0836181640625, 5.416015625, 5.7484130859375, 6.080810546875, 6.4132080078125, 6.74560546875, 7.0780029296875, 7.410400390625, 7.7427978515625, 8.0751953125, 8.4075927734375, 8.739990234375, 9.0723876953125, 9.40478515625, 9.7371826171875, 10.069580078125, 10.4019775390625, 10.734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 5.0, 6.0, 9.0, 11.0, 11.0, 12.0, 14.0, 19.0, 31.0, 39.0, 76.0, 87.0, 84.0, 79.0, 90.0, 82.0, 80.0, 63.0, 31.0, 23.0, 23.0, 24.0, 13.0, 16.0, 11.0, 10.0, 7.0, 8.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4921875, -4.35150146484375, -4.2108154296875, -4.07012939453125, -3.929443359375, -3.78875732421875, -3.6480712890625, -3.50738525390625, -3.36669921875, -3.22601318359375, -3.0853271484375, -2.94464111328125, -2.803955078125, -2.66326904296875, -2.5225830078125, -2.38189697265625, -2.2412109375, -2.10052490234375, -1.9598388671875, -1.81915283203125, -1.678466796875, -1.53778076171875, -1.3970947265625, -1.25640869140625, -1.11572265625, -0.97503662109375, -0.8343505859375, -0.69366455078125, -0.552978515625, -0.41229248046875, -0.2716064453125, -0.13092041015625, 0.009765625, 0.15045166015625, 0.2911376953125, 0.43182373046875, 0.572509765625, 0.71319580078125, 0.8538818359375, 0.99456787109375, 1.13525390625, 1.27593994140625, 1.4166259765625, 1.55731201171875, 1.697998046875, 1.83868408203125, 1.9793701171875, 2.12005615234375, 2.2607421875, 2.40142822265625, 2.5421142578125, 2.68280029296875, 2.823486328125, 2.96417236328125, 3.1048583984375, 3.24554443359375, 3.38623046875, 3.52691650390625, 3.6676025390625, 3.80828857421875, 3.948974609375, 4.08966064453125, 4.2303466796875, 4.37103271484375, 4.51171875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 2.0, 8.0, 15.0, 16.0, 15.0, 20.0, 16.0, 24.0, 26.0, 26.0, 43.0, 29.0, 38.0, 47.0, 35.0, 40.0, 42.0, 46.0, 51.0, 37.0, 42.0, 30.0, 42.0, 33.0, 40.0, 15.0, 29.0, 25.0, 21.0, 24.0, 19.0, 18.0, 12.0, 10.0, 7.0, 13.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.258750915527344, -43.90234375, -42.545936584472656, -41.18952560424805, -39.8331184387207, -38.47671127319336, -37.120304107666016, -35.763893127441406, -34.40748596191406, -33.05107879638672, -31.694669723510742, -30.3382625579834, -28.981853485107422, -27.625446319580078, -26.269039154052734, -24.912630081176758, -23.556222915649414, -22.19981575012207, -20.843406677246094, -19.48699951171875, -18.130590438842773, -16.77418327331543, -15.41777515411377, -14.06136703491211, -12.70495891571045, -11.348550796508789, -9.992142677307129, -8.635734558105469, -7.279326915740967, -5.922918796539307, -4.566511154174805, -3.2101030349731445, -1.8536949157714844, -0.49728691577911377, 0.8591210842132568, 2.215528964996338, 3.571937084197998, 4.928345203399658, 6.28475284576416, 7.64116096496582, 8.99756908416748, 10.35397720336914, 11.7103853225708, 13.066793441772461, 14.423200607299805, 15.779609680175781, 17.136016845703125, 18.49242401123047, 19.848833084106445, 21.20524024963379, 22.561649322509766, 23.91805648803711, 25.274465560913086, 26.63087272644043, 27.987281799316406, 29.34368896484375, 30.700096130371094, 32.05650329589844, 33.41291046142578, 34.76932144165039, 36.125728607177734, 37.48213577270508, 38.83854293823242, 40.19495391845703, 41.551361083984375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 7.0, 6.0, 23.0, 11.0, 18.0, 19.0, 18.0, 19.0, 19.0, 23.0, 20.0, 27.0, 44.0, 27.0, 28.0, 42.0, 39.0, 37.0, 47.0, 38.0, 45.0, 36.0, 33.0, 45.0, 30.0, 36.0, 35.0, 26.0, 20.0, 38.0, 19.0, 15.0, 24.0, 14.0, 9.0, 19.0, 7.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.987335205078125, -40.55349349975586, -39.119651794433594, -37.68581008911133, -36.25196838378906, -34.8181266784668, -33.38428497314453, -31.950443267822266, -30.5166015625, -29.082759857177734, -27.64891815185547, -26.215076446533203, -24.781234741210938, -23.347393035888672, -21.913551330566406, -20.47970962524414, -19.045866012573242, -17.612024307250977, -16.17818260192871, -14.744340896606445, -13.31049919128418, -11.876657485961914, -10.442814826965332, -9.008973121643066, -7.575131416320801, -6.141289710998535, -4.7074480056762695, -3.2736058235168457, -1.83976411819458, -0.40592241287231445, 1.0279197692871094, 2.461761474609375, 3.8956031799316406, 5.329444885253906, 6.763286590576172, 8.197128295898438, 9.630970001220703, 11.064811706542969, 12.49865436553955, 13.932496070861816, 15.366337776184082, 16.800180435180664, 18.23402214050293, 19.667863845825195, 21.10170555114746, 22.535547256469727, 23.969388961791992, 25.403230667114258, 26.837072372436523, 28.27091407775879, 29.704755783081055, 31.13859748840332, 32.57244110107422, 34.006282806396484, 35.44012451171875, 36.873966217041016, 38.30780792236328, 39.74164962768555, 41.17549133300781, 42.60933303833008, 44.043174743652344, 45.47701644897461, 46.910858154296875, 48.34469985961914, 49.778541564941406]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 12.0, 19.0, 20.0, 40.0, 48.0, 98.0, 145.0, 208.0, 344.0, 512.0, 820.0, 1223.0, 1984.0, 3030.0, 4924.0, 7483.0, 11477.0, 17409.0, 25219.0, 36729.0, 49683.0, 66324.0, 81787.0, 96290.0, 104496.0, 105671.0, 99201.0, 86217.0, 70340.0, 54166.0, 39634.0, 27784.0, 19171.0, 12593.0, 8319.0, 5506.0, 3435.0, 2246.0, 1454.0, 858.0, 562.0, 393.0, 221.0, 166.0, 97.0, 66.0, 31.0, 32.0, 19.0, 20.0, 6.0, 7.0, 6.0, 7.0, 0.0, 1.0, 2.0], "bins": [-31.421875, -30.44384765625, -29.4658203125, -28.48779296875, -27.509765625, -26.53173828125, -25.5537109375, -24.57568359375, -23.59765625, -22.61962890625, -21.6416015625, -20.66357421875, -19.685546875, -18.70751953125, -17.7294921875, -16.75146484375, -15.7734375, -14.79541015625, -13.8173828125, -12.83935546875, -11.861328125, -10.88330078125, -9.9052734375, -8.92724609375, -7.94921875, -6.97119140625, -5.9931640625, -5.01513671875, -4.037109375, -3.05908203125, -2.0810546875, -1.10302734375, -0.125, 0.85302734375, 1.8310546875, 2.80908203125, 3.787109375, 4.76513671875, 5.7431640625, 6.72119140625, 7.69921875, 8.67724609375, 9.6552734375, 10.63330078125, 11.611328125, 12.58935546875, 13.5673828125, 14.54541015625, 15.5234375, 16.50146484375, 17.4794921875, 18.45751953125, 19.435546875, 20.41357421875, 21.3916015625, 22.36962890625, 23.34765625, 24.32568359375, 25.3037109375, 26.28173828125, 27.259765625, 28.23779296875, 29.2158203125, 30.19384765625, 31.171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 6.0, 9.0, 6.0, 23.0, 11.0, 15.0, 22.0, 17.0, 21.0, 16.0, 27.0, 19.0, 27.0, 41.0, 27.0, 34.0, 35.0, 42.0, 44.0, 39.0, 38.0, 41.0, 41.0, 33.0, 40.0, 35.0, 30.0, 36.0, 27.0, 21.0, 37.0, 20.0, 12.0, 22.0, 19.0, 11.0, 17.0, 7.0, 10.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.125, -38.75390625, -37.3828125, -36.01171875, -34.640625, -33.26953125, -31.8984375, -30.52734375, -29.15625, -27.78515625, -26.4140625, -25.04296875, -23.671875, -22.30078125, -20.9296875, -19.55859375, -18.1875, -16.81640625, -15.4453125, -14.07421875, -12.703125, -11.33203125, -9.9609375, -8.58984375, -7.21875, -5.84765625, -4.4765625, -3.10546875, -1.734375, -0.36328125, 1.0078125, 2.37890625, 3.75, 5.12109375, 6.4921875, 7.86328125, 9.234375, 10.60546875, 11.9765625, 13.34765625, 14.71875, 16.08984375, 17.4609375, 18.83203125, 20.203125, 21.57421875, 22.9453125, 24.31640625, 25.6875, 27.05859375, 28.4296875, 29.80078125, 31.171875, 32.54296875, 33.9140625, 35.28515625, 36.65625, 38.02734375, 39.3984375, 40.76953125, 42.140625, 43.51171875, 44.8828125, 46.25390625, 47.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 16.0, 23.0, 27.0, 45.0, 67.0, 111.0, 177.0, 258.0, 426.0, 612.0, 1105.0, 1711.0, 2703.0, 4543.0, 7073.0, 11077.0, 17523.0, 27024.0, 39790.0, 57137.0, 77125.0, 96573.0, 112370.0, 119149.0, 114114.0, 99679.0, 79163.0, 59059.0, 41509.0, 28101.0, 18427.0, 11731.0, 7526.0, 4708.0, 2873.0, 1901.0, 1135.0, 755.0, 448.0, 291.0, 163.0, 127.0, 70.0, 34.0, 25.0, 20.0, 9.0, 8.0, 6.0, 5.0, 2.0, 0.0, 2.0], "bins": [-40.53125, -39.3583984375, -38.185546875, -37.0126953125, -35.83984375, -34.6669921875, -33.494140625, -32.3212890625, -31.1484375, -29.9755859375, -28.802734375, -27.6298828125, -26.45703125, -25.2841796875, -24.111328125, -22.9384765625, -21.765625, -20.5927734375, -19.419921875, -18.2470703125, -17.07421875, -15.9013671875, -14.728515625, -13.5556640625, -12.3828125, -11.2099609375, -10.037109375, -8.8642578125, -7.69140625, -6.5185546875, -5.345703125, -4.1728515625, -3.0, -1.8271484375, -0.654296875, 0.5185546875, 1.69140625, 2.8642578125, 4.037109375, 5.2099609375, 6.3828125, 7.5556640625, 8.728515625, 9.9013671875, 11.07421875, 12.2470703125, 13.419921875, 14.5927734375, 15.765625, 16.9384765625, 18.111328125, 19.2841796875, 20.45703125, 21.6298828125, 22.802734375, 23.9755859375, 25.1484375, 26.3212890625, 27.494140625, 28.6669921875, 29.83984375, 31.0126953125, 32.185546875, 33.3583984375, 34.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 2.0, 10.0, 8.0, 13.0, 12.0, 16.0, 20.0, 26.0, 22.0, 26.0, 27.0, 25.0, 45.0, 41.0, 43.0, 45.0, 45.0, 41.0, 60.0, 49.0, 48.0, 31.0, 44.0, 43.0, 49.0, 45.0, 31.0, 26.0, 19.0, 19.0, 14.0, 12.0, 6.0, 11.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.676513671875, -29.61865234375, -28.560791015625, -27.5029296875, -26.445068359375, -25.38720703125, -24.329345703125, -23.271484375, -22.213623046875, -21.15576171875, -20.097900390625, -19.0400390625, -17.982177734375, -16.92431640625, -15.866455078125, -14.80859375, -13.750732421875, -12.69287109375, -11.635009765625, -10.5771484375, -9.519287109375, -8.46142578125, -7.403564453125, -6.345703125, -5.287841796875, -4.22998046875, -3.172119140625, -2.1142578125, -1.056396484375, 0.00146484375, 1.059326171875, 2.1171875, 3.175048828125, 4.23291015625, 5.290771484375, 6.3486328125, 7.406494140625, 8.46435546875, 9.522216796875, 10.580078125, 11.637939453125, 12.69580078125, 13.753662109375, 14.8115234375, 15.869384765625, 16.92724609375, 17.985107421875, 19.04296875, 20.100830078125, 21.15869140625, 22.216552734375, 23.2744140625, 24.332275390625, 25.39013671875, 26.447998046875, 27.505859375, 28.563720703125, 29.62158203125, 30.679443359375, 31.7373046875, 32.795166015625, 33.85302734375, 34.910888671875, 35.96875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 10.0, 5.0, 12.0, 25.0, 22.0, 44.0, 50.0, 72.0, 95.0, 164.0, 219.0, 337.0, 532.0, 848.0, 1328.0, 2340.0, 3910.0, 6792.0, 11745.0, 21013.0, 35302.0, 57818.0, 88285.0, 120213.0, 143762.0, 149197.0, 130991.0, 100568.0, 69035.0, 43182.0, 25563.0, 14634.0, 8423.0, 4709.0, 2696.0, 1649.0, 1056.0, 670.0, 402.0, 262.0, 180.0, 131.0, 93.0, 55.0, 36.0, 27.0, 16.0, 14.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.8984375, -11.4908447265625, -11.083251953125, -10.6756591796875, -10.26806640625, -9.8604736328125, -9.452880859375, -9.0452880859375, -8.6376953125, -8.2301025390625, -7.822509765625, -7.4149169921875, -7.00732421875, -6.5997314453125, -6.192138671875, -5.7845458984375, -5.376953125, -4.9693603515625, -4.561767578125, -4.1541748046875, -3.74658203125, -3.3389892578125, -2.931396484375, -2.5238037109375, -2.1162109375, -1.7086181640625, -1.301025390625, -0.8934326171875, -0.48583984375, -0.0782470703125, 0.329345703125, 0.7369384765625, 1.14453125, 1.5521240234375, 1.959716796875, 2.3673095703125, 2.77490234375, 3.1824951171875, 3.590087890625, 3.9976806640625, 4.4052734375, 4.8128662109375, 5.220458984375, 5.6280517578125, 6.03564453125, 6.4432373046875, 6.850830078125, 7.2584228515625, 7.666015625, 8.0736083984375, 8.481201171875, 8.8887939453125, 9.29638671875, 9.7039794921875, 10.111572265625, 10.5191650390625, 10.9267578125, 11.3343505859375, 11.741943359375, 12.1495361328125, 12.55712890625, 12.9647216796875, 13.372314453125, 13.7799072265625, 14.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 7.0, 11.0, 18.0, 19.0, 29.0, 31.0, 32.0, 43.0, 42.0, 46.0, 45.0, 55.0, 62.0, 61.0, 58.0, 46.0, 58.0, 54.0, 47.0, 52.0, 40.0, 20.0, 22.0, 11.0, 15.0, 6.0, 11.0, 10.0, 7.0, 5.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.001167595386505127, -0.001122117042541504, -0.0010766386985778809, -0.0010311603546142578, -0.0009856820106506348, -0.0009402036666870117, -0.0008947253227233887, -0.0008492469787597656, -0.0008037686347961426, -0.0007582902908325195, -0.0007128119468688965, -0.0006673336029052734, -0.0006218552589416504, -0.0005763769149780273, -0.0005308985710144043, -0.00048542022705078125, -0.0004399418830871582, -0.00039446353912353516, -0.0003489851951599121, -0.00030350685119628906, -0.000258028507232666, -0.00021255016326904297, -0.00016707181930541992, -0.00012159347534179688, -7.611513137817383e-05, -3.063678741455078e-05, 1.4841556549072266e-05, 6.031990051269531e-05, 0.00010579824447631836, 0.0001512765884399414, 0.00019675493240356445, 0.0002422332763671875, 0.00028771162033081055, 0.0003331899642944336, 0.00037866830825805664, 0.0004241466522216797, 0.00046962499618530273, 0.0005151033401489258, 0.0005605816841125488, 0.0006060600280761719, 0.0006515383720397949, 0.000697016716003418, 0.000742495059967041, 0.0007879734039306641, 0.0008334517478942871, 0.0008789300918579102, 0.0009244084358215332, 0.0009698867797851562, 0.0010153651237487793, 0.0010608434677124023, 0.0011063218116760254, 0.0011518001556396484, 0.0011972784996032715, 0.0012427568435668945, 0.0012882351875305176, 0.0013337135314941406, 0.0013791918754577637, 0.0014246702194213867, 0.0014701485633850098, 0.0015156269073486328, 0.0015611052513122559, 0.001606583595275879, 0.001652061939239502, 0.001697540283203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 14.0, 14.0, 15.0, 41.0, 58.0, 97.0, 143.0, 236.0, 369.0, 556.0, 1012.0, 1554.0, 2434.0, 4047.0, 6848.0, 11157.0, 18315.0, 28627.0, 43411.0, 63394.0, 85308.0, 107491.0, 121933.0, 124740.0, 115042.0, 95653.0, 72457.0, 51526.0, 34394.0, 22262.0, 13952.0, 8322.0, 5123.0, 3009.0, 1863.0, 1165.0, 768.0, 434.0, 270.0, 186.0, 101.0, 69.0, 46.0, 32.0, 13.0, 15.0, 11.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.6539306640625, -9.323486328125, -8.9930419921875, -8.66259765625, -8.3321533203125, -8.001708984375, -7.6712646484375, -7.3408203125, -7.0103759765625, -6.679931640625, -6.3494873046875, -6.01904296875, -5.6885986328125, -5.358154296875, -5.0277099609375, -4.697265625, -4.3668212890625, -4.036376953125, -3.7059326171875, -3.37548828125, -3.0450439453125, -2.714599609375, -2.3841552734375, -2.0537109375, -1.7232666015625, -1.392822265625, -1.0623779296875, -0.73193359375, -0.4014892578125, -0.071044921875, 0.2593994140625, 0.58984375, 0.9202880859375, 1.250732421875, 1.5811767578125, 1.91162109375, 2.2420654296875, 2.572509765625, 2.9029541015625, 3.2333984375, 3.5638427734375, 3.894287109375, 4.2247314453125, 4.55517578125, 4.8856201171875, 5.216064453125, 5.5465087890625, 5.876953125, 6.2073974609375, 6.537841796875, 6.8682861328125, 7.19873046875, 7.5291748046875, 7.859619140625, 8.1900634765625, 8.5205078125, 8.8509521484375, 9.181396484375, 9.5118408203125, 9.84228515625, 10.1727294921875, 10.503173828125, 10.8336181640625, 11.1640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 2.0, 8.0, 8.0, 4.0, 10.0, 12.0, 14.0, 19.0, 30.0, 24.0, 26.0, 41.0, 30.0, 50.0, 45.0, 42.0, 49.0, 60.0, 52.0, 61.0, 50.0, 58.0, 45.0, 38.0, 32.0, 26.0, 30.0, 29.0, 22.0, 20.0, 16.0, 10.0, 11.0, 7.0, 6.0, 3.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2109375, -5.0458984375, -4.880859375, -4.7158203125, -4.55078125, -4.3857421875, -4.220703125, -4.0556640625, -3.890625, -3.7255859375, -3.560546875, -3.3955078125, -3.23046875, -3.0654296875, -2.900390625, -2.7353515625, -2.5703125, -2.4052734375, -2.240234375, -2.0751953125, -1.91015625, -1.7451171875, -1.580078125, -1.4150390625, -1.25, -1.0849609375, -0.919921875, -0.7548828125, -0.58984375, -0.4248046875, -0.259765625, -0.0947265625, 0.0703125, 0.2353515625, 0.400390625, 0.5654296875, 0.73046875, 0.8955078125, 1.060546875, 1.2255859375, 1.390625, 1.5556640625, 1.720703125, 1.8857421875, 2.05078125, 2.2158203125, 2.380859375, 2.5458984375, 2.7109375, 2.8759765625, 3.041015625, 3.2060546875, 3.37109375, 3.5361328125, 3.701171875, 3.8662109375, 4.03125, 4.1962890625, 4.361328125, 4.5263671875, 4.69140625, 4.8564453125, 5.021484375, 5.1865234375, 5.3515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 13.0, 13.0, 13.0, 18.0, 11.0, 18.0, 22.0, 17.0, 34.0, 25.0, 26.0, 28.0, 40.0, 37.0, 40.0, 42.0, 46.0, 38.0, 56.0, 31.0, 46.0, 33.0, 33.0, 31.0, 35.0, 25.0, 27.0, 22.0, 23.0, 30.0, 17.0, 12.0, 17.0, 9.0, 8.0, 11.0, 7.0, 11.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.608489990234375, -37.349952697753906, -36.09141540527344, -34.832881927490234, -33.574344635009766, -32.3158073425293, -31.05727195739746, -29.798736572265625, -28.540199279785156, -27.281661987304688, -26.02312660217285, -24.764591217041016, -23.506053924560547, -22.247516632080078, -20.988981246948242, -19.730445861816406, -18.471908569335938, -17.21337127685547, -15.954835891723633, -14.69629955291748, -13.437763214111328, -12.179226875305176, -10.920690536499023, -9.662154197692871, -8.403617858886719, -7.145081520080566, -5.886545181274414, -4.628008842468262, -3.3694725036621094, -2.110936164855957, -0.8523998260498047, 0.40613651275634766, 1.6646728515625, 2.9232091903686523, 4.181745529174805, 5.440281867980957, 6.698818206787109, 7.957354545593262, 9.215890884399414, 10.474427223205566, 11.732963562011719, 12.991499900817871, 14.250036239624023, 15.508572578430176, 16.767108917236328, 18.025646209716797, 19.284181594848633, 20.54271697998047, 21.801254272460938, 23.059791564941406, 24.318326950073242, 25.576862335205078, 26.835399627685547, 28.093936920166016, 29.35247230529785, 30.611007690429688, 31.869544982910156, 33.128082275390625, 34.386619567871094, 35.6451530456543, 36.903690338134766, 38.162227630615234, 39.42076110839844, 40.679298400878906, 41.937835693359375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 9.0, 14.0, 21.0, 14.0, 19.0, 15.0, 21.0, 21.0, 18.0, 32.0, 36.0, 38.0, 31.0, 40.0, 51.0, 46.0, 51.0, 42.0, 44.0, 41.0, 32.0, 47.0, 36.0, 38.0, 33.0, 36.0, 26.0, 26.0, 21.0, 20.0, 18.0, 16.0, 8.0, 7.0, 4.0, 7.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.99409103393555, -54.31796646118164, -52.641841888427734, -50.96571350097656, -49.289588928222656, -47.61346435546875, -45.937339782714844, -44.26121520996094, -42.58509063720703, -40.908966064453125, -39.23284149169922, -37.55671691894531, -35.88058853149414, -34.204463958740234, -32.52833938598633, -30.852214813232422, -29.176088333129883, -27.499963760375977, -25.823837280273438, -24.14771270751953, -22.471588134765625, -20.79546356201172, -19.11933708190918, -17.443212509155273, -15.76708698272705, -14.090961456298828, -12.414836883544922, -10.7387113571167, -9.062585830688477, -7.38646125793457, -5.710335731506348, -4.034211158752441, -2.3580856323242188, -0.6819604635238647, 0.9941647052764893, 2.670289993286133, 4.346415042877197, 6.022540092468262, 7.698665618896484, 9.37479019165039, 11.050915718078613, 12.727041244506836, 14.403165817260742, 16.07929229736328, 17.755416870117188, 19.431541442871094, 21.107666015625, 22.783790588378906, 24.459917068481445, 26.13604164123535, 27.81216812133789, 29.488292694091797, 31.164417266845703, 32.84054183959961, 34.51667022705078, 36.19279479980469, 37.868919372558594, 39.5450439453125, 41.221168518066406, 42.89729309082031, 44.573421478271484, 46.24954605102539, 47.9256706237793, 49.6017951965332, 51.27791976928711]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 20.0, 37.0, 54.0, 82.0, 151.0, 228.0, 398.0, 681.0, 1052.0, 1840.0, 2973.0, 4885.0, 8117.0, 12997.0, 21678.0, 34543.0, 54488.0, 86549.0, 132764.0, 196283.0, 276324.0, 364784.0, 442632.0, 488274.0, 485465.0, 434685.0, 351596.0, 264082.0, 186289.0, 125232.0, 80528.0, 51267.0, 31967.0, 19890.0, 12171.0, 7383.0, 4449.0, 2949.0, 1690.0, 1084.0, 668.0, 395.0, 229.0, 165.0, 106.0, 59.0, 27.0, 18.0, 26.0, 7.0, 12.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.84228515625, -30.7783203125, -29.71435546875, -28.650390625, -27.58642578125, -26.5224609375, -25.45849609375, -24.39453125, -23.33056640625, -22.2666015625, -21.20263671875, -20.138671875, -19.07470703125, -18.0107421875, -16.94677734375, -15.8828125, -14.81884765625, -13.7548828125, -12.69091796875, -11.626953125, -10.56298828125, -9.4990234375, -8.43505859375, -7.37109375, -6.30712890625, -5.2431640625, -4.17919921875, -3.115234375, -2.05126953125, -0.9873046875, 0.07666015625, 1.140625, 2.20458984375, 3.2685546875, 4.33251953125, 5.396484375, 6.46044921875, 7.5244140625, 8.58837890625, 9.65234375, 10.71630859375, 11.7802734375, 12.84423828125, 13.908203125, 14.97216796875, 16.0361328125, 17.10009765625, 18.1640625, 19.22802734375, 20.2919921875, 21.35595703125, 22.419921875, 23.48388671875, 24.5478515625, 25.61181640625, 26.67578125, 27.73974609375, 28.8037109375, 29.86767578125, 30.931640625, 31.99560546875, 33.0595703125, 34.12353515625, 35.1875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 6.0, 5.0, 16.0, 19.0, 19.0, 19.0, 18.0, 17.0, 18.0, 20.0, 31.0, 33.0, 40.0, 39.0, 36.0, 46.0, 54.0, 53.0, 43.0, 34.0, 48.0, 36.0, 40.0, 45.0, 36.0, 28.0, 30.0, 32.0, 27.0, 21.0, 19.0, 19.0, 12.0, 12.0, 6.0, 5.0, 2.0, 2.0, 8.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.25, -42.91748046875, -41.5849609375, -40.25244140625, -38.919921875, -37.58740234375, -36.2548828125, -34.92236328125, -33.58984375, -32.25732421875, -30.9248046875, -29.59228515625, -28.259765625, -26.92724609375, -25.5947265625, -24.26220703125, -22.9296875, -21.59716796875, -20.2646484375, -18.93212890625, -17.599609375, -16.26708984375, -14.9345703125, -13.60205078125, -12.26953125, -10.93701171875, -9.6044921875, -8.27197265625, -6.939453125, -5.60693359375, -4.2744140625, -2.94189453125, -1.609375, -0.27685546875, 1.0556640625, 2.38818359375, 3.720703125, 5.05322265625, 6.3857421875, 7.71826171875, 9.05078125, 10.38330078125, 11.7158203125, 13.04833984375, 14.380859375, 15.71337890625, 17.0458984375, 18.37841796875, 19.7109375, 21.04345703125, 22.3759765625, 23.70849609375, 25.041015625, 26.37353515625, 27.7060546875, 29.03857421875, 30.37109375, 31.70361328125, 33.0361328125, 34.36865234375, 35.701171875, 37.03369140625, 38.3662109375, 39.69873046875, 41.03125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 9.0, 18.0, 44.0, 55.0, 109.0, 227.0, 308.0, 556.0, 906.0, 1501.0, 2557.0, 4419.0, 6853.0, 11374.0, 18239.0, 29189.0, 44178.0, 65951.0, 96971.0, 137357.0, 187970.0, 242351.0, 302102.0, 353983.0, 390819.0, 403746.0, 390208.0, 353688.0, 301148.0, 242371.0, 186301.0, 137074.0, 96375.0, 66356.0, 43836.0, 28439.0, 18193.0, 11163.0, 6873.0, 4223.0, 2510.0, 1526.0, 944.0, 540.0, 305.0, 165.0, 104.0, 60.0, 37.0, 13.0, 23.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -28.15478515625, -27.2314453125, -26.30810546875, -25.384765625, -24.46142578125, -23.5380859375, -22.61474609375, -21.69140625, -20.76806640625, -19.8447265625, -18.92138671875, -17.998046875, -17.07470703125, -16.1513671875, -15.22802734375, -14.3046875, -13.38134765625, -12.4580078125, -11.53466796875, -10.611328125, -9.68798828125, -8.7646484375, -7.84130859375, -6.91796875, -5.99462890625, -5.0712890625, -4.14794921875, -3.224609375, -2.30126953125, -1.3779296875, -0.45458984375, 0.46875, 1.39208984375, 2.3154296875, 3.23876953125, 4.162109375, 5.08544921875, 6.0087890625, 6.93212890625, 7.85546875, 8.77880859375, 9.7021484375, 10.62548828125, 11.548828125, 12.47216796875, 13.3955078125, 14.31884765625, 15.2421875, 16.16552734375, 17.0888671875, 18.01220703125, 18.935546875, 19.85888671875, 20.7822265625, 21.70556640625, 22.62890625, 23.55224609375, 24.4755859375, 25.39892578125, 26.322265625, 27.24560546875, 28.1689453125, 29.09228515625, 30.015625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 12.0, 12.0, 13.0, 18.0, 28.0, 22.0, 44.0, 54.0, 53.0, 67.0, 73.0, 101.0, 109.0, 126.0, 153.0, 172.0, 177.0, 167.0, 205.0, 205.0, 198.0, 196.0, 199.0, 199.0, 200.0, 176.0, 165.0, 141.0, 131.0, 105.0, 96.0, 81.0, 76.0, 60.0, 59.0, 46.0, 34.0, 17.0, 26.0, 26.0, 7.0, 8.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.1475830078125, -13.615478515625, -13.0833740234375, -12.55126953125, -12.0191650390625, -11.487060546875, -10.9549560546875, -10.4228515625, -9.8907470703125, -9.358642578125, -8.8265380859375, -8.29443359375, -7.7623291015625, -7.230224609375, -6.6981201171875, -6.166015625, -5.6339111328125, -5.101806640625, -4.5697021484375, -4.03759765625, -3.5054931640625, -2.973388671875, -2.4412841796875, -1.9091796875, -1.3770751953125, -0.844970703125, -0.3128662109375, 0.21923828125, 0.7513427734375, 1.283447265625, 1.8155517578125, 2.34765625, 2.8797607421875, 3.411865234375, 3.9439697265625, 4.47607421875, 5.0081787109375, 5.540283203125, 6.0723876953125, 6.6044921875, 7.1365966796875, 7.668701171875, 8.2008056640625, 8.73291015625, 9.2650146484375, 9.797119140625, 10.3292236328125, 10.861328125, 11.3934326171875, 11.925537109375, 12.4576416015625, 12.98974609375, 13.5218505859375, 14.053955078125, 14.5860595703125, 15.1181640625, 15.6502685546875, 16.182373046875, 16.7144775390625, 17.24658203125, 17.7786865234375, 18.310791015625, 18.8428955078125, 19.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 12.0, 9.0, 10.0, 13.0, 10.0, 24.0, 23.0, 27.0, 30.0, 20.0, 41.0, 24.0, 34.0, 32.0, 37.0, 49.0, 40.0, 35.0, 48.0, 36.0, 49.0, 41.0, 40.0, 38.0, 44.0, 22.0, 23.0, 26.0, 18.0, 14.0, 24.0, 17.0, 15.0, 10.0, 16.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-42.14974594116211, -40.93879318237305, -39.72784423828125, -38.51689147949219, -37.305938720703125, -36.09498596191406, -34.884037017822266, -33.6730842590332, -32.462135314941406, -31.251184463500977, -30.040231704711914, -28.829280853271484, -27.618328094482422, -26.407377243041992, -25.196426391601562, -23.9854736328125, -22.774520874023438, -21.563570022583008, -20.352617263793945, -19.141666412353516, -17.930713653564453, -16.719762802124023, -15.508811950683594, -14.297860145568848, -13.086908340454102, -11.875956535339355, -10.66500473022461, -9.45405387878418, -8.243102073669434, -7.0321502685546875, -5.8211989402771, -4.610247611999512, -3.3992996215820312, -2.1883480548858643, -0.9773964881896973, 0.23355507850646973, 1.4445066452026367, 2.655458450317383, 3.8664097785949707, 5.077361106872559, 6.288312911987305, 7.499264717102051, 8.710216522216797, 9.921167373657227, 11.132119178771973, 12.343070983886719, 13.554021835327148, 14.764973640441895, 15.97592544555664, 17.18687629699707, 18.397829055786133, 19.608779907226562, 20.819732666015625, 22.030683517456055, 23.241634368896484, 24.452587127685547, 25.663537979125977, 26.874488830566406, 28.08544158935547, 29.2963924407959, 30.507343292236328, 31.71829605102539, 32.92924880981445, 34.14019775390625, 35.35115051269531]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 9.0, 8.0, 9.0, 12.0, 18.0, 26.0, 16.0, 27.0, 35.0, 26.0, 38.0, 35.0, 48.0, 50.0, 47.0, 47.0, 53.0, 46.0, 32.0, 42.0, 57.0, 39.0, 38.0, 49.0, 45.0, 33.0, 24.0, 23.0, 16.0, 9.0, 12.0, 7.0, 4.0, 6.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.21111297607422, -58.52910614013672, -56.84709548950195, -55.16508865356445, -53.48307800292969, -51.80107116699219, -50.11906433105469, -48.43705368041992, -46.755043029785156, -45.073036193847656, -43.39102554321289, -41.70901870727539, -40.027008056640625, -38.345001220703125, -36.662994384765625, -34.98098373413086, -33.29897689819336, -31.616968154907227, -29.934959411621094, -28.252952575683594, -26.570941925048828, -24.888935089111328, -23.206926345825195, -21.524917602539062, -19.84290885925293, -18.160900115966797, -16.478891372680664, -14.796883583068848, -13.114874839782715, -11.432866096496582, -9.750858306884766, -8.068849563598633, -6.3868408203125, -4.704832077026367, -3.0228238105773926, -1.340815544128418, 0.34119319915771484, 2.0232019424438477, 3.705209732055664, 5.387218475341797, 7.06922721862793, 8.751235961914062, 10.433244705200195, 12.115252494812012, 13.797261238098145, 15.479269981384277, 17.161277770996094, 18.843286514282227, 20.52529525756836, 22.207304000854492, 23.889312744140625, 25.571319580078125, 27.25333023071289, 28.93533706665039, 30.617345809936523, 32.299354553222656, 33.981361389160156, 35.663368225097656, 37.34537887573242, 39.02738571166992, 40.70939636230469, 42.39140319824219, 44.07341003417969, 45.75542068481445, 47.43743133544922]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 20.0, 24.0, 28.0, 49.0, 59.0, 102.0, 135.0, 203.0, 322.0, 490.0, 810.0, 1272.0, 2293.0, 4062.0, 7862.0, 17288.0, 43039.0, 118936.0, 335344.0, 325287.0, 115154.0, 41665.0, 16703.0, 7679.0, 3979.0, 2200.0, 1318.0, 778.0, 506.0, 306.0, 216.0, 124.0, 98.0, 65.0, 41.0, 34.0, 26.0, 12.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.515625, -28.56298828125, -27.6103515625, -26.65771484375, -25.705078125, -24.75244140625, -23.7998046875, -22.84716796875, -21.89453125, -20.94189453125, -19.9892578125, -19.03662109375, -18.083984375, -17.13134765625, -16.1787109375, -15.22607421875, -14.2734375, -13.32080078125, -12.3681640625, -11.41552734375, -10.462890625, -9.51025390625, -8.5576171875, -7.60498046875, -6.65234375, -5.69970703125, -4.7470703125, -3.79443359375, -2.841796875, -1.88916015625, -0.9365234375, 0.01611328125, 0.96875, 1.92138671875, 2.8740234375, 3.82666015625, 4.779296875, 5.73193359375, 6.6845703125, 7.63720703125, 8.58984375, 9.54248046875, 10.4951171875, 11.44775390625, 12.400390625, 13.35302734375, 14.3056640625, 15.25830078125, 16.2109375, 17.16357421875, 18.1162109375, 19.06884765625, 20.021484375, 20.97412109375, 21.9267578125, 22.87939453125, 23.83203125, 24.78466796875, 25.7373046875, 26.68994140625, 27.642578125, 28.59521484375, 29.5478515625, 30.50048828125, 31.453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 9.0, 10.0, 21.0, 27.0, 17.0, 26.0, 36.0, 28.0, 36.0, 40.0, 49.0, 48.0, 50.0, 46.0, 46.0, 48.0, 35.0, 40.0, 61.0, 37.0, 36.0, 51.0, 40.0, 32.0, 24.0, 21.0, 16.0, 11.0, 11.0, 6.0, 4.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.75, -58.0771484375, -56.404296875, -54.7314453125, -53.05859375, -51.3857421875, -49.712890625, -48.0400390625, -46.3671875, -44.6943359375, -43.021484375, -41.3486328125, -39.67578125, -38.0029296875, -36.330078125, -34.6572265625, -32.984375, -31.3115234375, -29.638671875, -27.9658203125, -26.29296875, -24.6201171875, -22.947265625, -21.2744140625, -19.6015625, -17.9287109375, -16.255859375, -14.5830078125, -12.91015625, -11.2373046875, -9.564453125, -7.8916015625, -6.21875, -4.5458984375, -2.873046875, -1.2001953125, 0.47265625, 2.1455078125, 3.818359375, 5.4912109375, 7.1640625, 8.8369140625, 10.509765625, 12.1826171875, 13.85546875, 15.5283203125, 17.201171875, 18.8740234375, 20.546875, 22.2197265625, 23.892578125, 25.5654296875, 27.23828125, 28.9111328125, 30.583984375, 32.2568359375, 33.9296875, 35.6025390625, 37.275390625, 38.9482421875, 40.62109375, 42.2939453125, 43.966796875, 45.6396484375, 47.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 7.0, 7.0, 8.0, 14.0, 22.0, 21.0, 32.0, 52.0, 68.0, 106.0, 167.0, 275.0, 456.0, 765.0, 1444.0, 2979.0, 6986.0, 20105.0, 78206.0, 404778.0, 416723.0, 80848.0, 20952.0, 7024.0, 2953.0, 1541.0, 766.0, 421.0, 254.0, 190.0, 110.0, 84.0, 44.0, 36.0, 21.0, 17.0, 12.0, 12.0, 10.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.40625, -25.5546875, -24.703125, -23.8515625, -23.0, -22.1484375, -21.296875, -20.4453125, -19.59375, -18.7421875, -17.890625, -17.0390625, -16.1875, -15.3359375, -14.484375, -13.6328125, -12.78125, -11.9296875, -11.078125, -10.2265625, -9.375, -8.5234375, -7.671875, -6.8203125, -5.96875, -5.1171875, -4.265625, -3.4140625, -2.5625, -1.7109375, -0.859375, -0.0078125, 0.84375, 1.6953125, 2.546875, 3.3984375, 4.25, 5.1015625, 5.953125, 6.8046875, 7.65625, 8.5078125, 9.359375, 10.2109375, 11.0625, 11.9140625, 12.765625, 13.6171875, 14.46875, 15.3203125, 16.171875, 17.0234375, 17.875, 18.7265625, 19.578125, 20.4296875, 21.28125, 22.1328125, 22.984375, 23.8359375, 24.6875, 25.5390625, 26.390625, 27.2421875, 28.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 12.0, 12.0, 12.0, 23.0, 12.0, 18.0, 16.0, 25.0, 29.0, 24.0, 24.0, 32.0, 29.0, 40.0, 30.0, 41.0, 39.0, 37.0, 33.0, 38.0, 37.0, 41.0, 31.0, 42.0, 32.0, 25.0, 37.0, 32.0, 19.0, 23.0, 15.0, 15.0, 18.0, 14.0, 12.0, 17.0, 5.0, 8.0, 1.0, 7.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.84375, -24.95703125, -24.0703125, -23.18359375, -22.296875, -21.41015625, -20.5234375, -19.63671875, -18.75, -17.86328125, -16.9765625, -16.08984375, -15.203125, -14.31640625, -13.4296875, -12.54296875, -11.65625, -10.76953125, -9.8828125, -8.99609375, -8.109375, -7.22265625, -6.3359375, -5.44921875, -4.5625, -3.67578125, -2.7890625, -1.90234375, -1.015625, -0.12890625, 0.7578125, 1.64453125, 2.53125, 3.41796875, 4.3046875, 5.19140625, 6.078125, 6.96484375, 7.8515625, 8.73828125, 9.625, 10.51171875, 11.3984375, 12.28515625, 13.171875, 14.05859375, 14.9453125, 15.83203125, 16.71875, 17.60546875, 18.4921875, 19.37890625, 20.265625, 21.15234375, 22.0390625, 22.92578125, 23.8125, 24.69921875, 25.5859375, 26.47265625, 27.359375, 28.24609375, 29.1328125, 30.01953125, 30.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 8.0, 8.0, 13.0, 27.0, 33.0, 51.0, 60.0, 57.0, 97.0, 131.0, 181.0, 248.0, 373.0, 490.0, 753.0, 1100.0, 1808.0, 3126.0, 5342.0, 10295.0, 24237.0, 80400.0, 587570.0, 250351.0, 45972.0, 16714.0, 7972.0, 4270.0, 2479.0, 1461.0, 938.0, 601.0, 431.0, 282.0, 187.0, 133.0, 106.0, 53.0, 44.0, 40.0, 20.0, 13.0, 10.0, 12.0, 10.0, 6.0, 9.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-15.828125, -15.330322265625, -14.83251953125, -14.334716796875, -13.8369140625, -13.339111328125, -12.84130859375, -12.343505859375, -11.845703125, -11.347900390625, -10.85009765625, -10.352294921875, -9.8544921875, -9.356689453125, -8.85888671875, -8.361083984375, -7.86328125, -7.365478515625, -6.86767578125, -6.369873046875, -5.8720703125, -5.374267578125, -4.87646484375, -4.378662109375, -3.880859375, -3.383056640625, -2.88525390625, -2.387451171875, -1.8896484375, -1.391845703125, -0.89404296875, -0.396240234375, 0.1015625, 0.599365234375, 1.09716796875, 1.594970703125, 2.0927734375, 2.590576171875, 3.08837890625, 3.586181640625, 4.083984375, 4.581787109375, 5.07958984375, 5.577392578125, 6.0751953125, 6.572998046875, 7.07080078125, 7.568603515625, 8.06640625, 8.564208984375, 9.06201171875, 9.559814453125, 10.0576171875, 10.555419921875, 11.05322265625, 11.551025390625, 12.048828125, 12.546630859375, 13.04443359375, 13.542236328125, 14.0400390625, 14.537841796875, 15.03564453125, 15.533447265625, 16.03125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 4.0, 6.0, 11.0, 8.0, 11.0, 11.0, 31.0, 36.0, 37.0, 53.0, 82.0, 132.0, 171.0, 101.0, 58.0, 57.0, 31.0, 35.0, 21.0, 19.0, 13.0, 7.0, 4.0, 8.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014352798461914062, -0.001380637288093567, -0.0013259947299957275, -0.0012713521718978882, -0.0012167096138000488, -0.0011620670557022095, -0.0011074244976043701, -0.0010527819395065308, -0.0009981393814086914, -0.000943496823310852, -0.0008888542652130127, -0.0008342117071151733, -0.000779569149017334, -0.0007249265909194946, -0.0006702840328216553, -0.0006156414747238159, -0.0005609989166259766, -0.0005063563585281372, -0.00045171380043029785, -0.0003970712423324585, -0.00034242868423461914, -0.0002877861261367798, -0.00023314356803894043, -0.00017850100994110107, -0.00012385845184326172, -6.921589374542236e-05, -1.4573335647583008e-05, 4.006922245025635e-05, 9.47117805480957e-05, 0.00014935433864593506, 0.00020399689674377441, 0.00025863945484161377, 0.0003132820129394531, 0.0003679245710372925, 0.00042256712913513184, 0.0004772096872329712, 0.0005318522453308105, 0.0005864948034286499, 0.0006411373615264893, 0.0006957799196243286, 0.000750422477722168, 0.0008050650358200073, 0.0008597075939178467, 0.000914350152015686, 0.0009689927101135254, 0.0010236352682113647, 0.001078277826309204, 0.0011329203844070435, 0.0011875629425048828, 0.0012422055006027222, 0.0012968480587005615, 0.0013514906167984009, 0.0014061331748962402, 0.0014607757329940796, 0.001515418291091919, 0.0015700608491897583, 0.0016247034072875977, 0.001679345965385437, 0.0017339885234832764, 0.0017886310815811157, 0.001843273639678955, 0.0018979161977767944, 0.0019525587558746338, 0.002007201313972473, 0.0020618438720703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 17.0, 35.0, 43.0, 49.0, 84.0, 110.0, 141.0, 202.0, 277.0, 403.0, 537.0, 850.0, 1154.0, 1699.0, 2582.0, 4130.0, 6767.0, 11311.0, 21190.0, 42046.0, 86863.0, 177593.0, 282809.0, 201771.0, 100227.0, 48229.0, 23776.0, 12822.0, 7417.0, 4406.0, 2874.0, 1912.0, 1187.0, 883.0, 583.0, 468.0, 318.0, 217.0, 168.0, 121.0, 88.0, 60.0, 40.0, 17.0, 16.0, 13.0, 12.0, 2.0, 9.0, 5.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.9503173828125, -10.580322265625, -10.2103271484375, -9.84033203125, -9.4703369140625, -9.100341796875, -8.7303466796875, -8.3603515625, -7.9903564453125, -7.620361328125, -7.2503662109375, -6.88037109375, -6.5103759765625, -6.140380859375, -5.7703857421875, -5.400390625, -5.0303955078125, -4.660400390625, -4.2904052734375, -3.92041015625, -3.5504150390625, -3.180419921875, -2.8104248046875, -2.4404296875, -2.0704345703125, -1.700439453125, -1.3304443359375, -0.96044921875, -0.5904541015625, -0.220458984375, 0.1495361328125, 0.51953125, 0.8895263671875, 1.259521484375, 1.6295166015625, 1.99951171875, 2.3695068359375, 2.739501953125, 3.1094970703125, 3.4794921875, 3.8494873046875, 4.219482421875, 4.5894775390625, 4.95947265625, 5.3294677734375, 5.699462890625, 6.0694580078125, 6.439453125, 6.8094482421875, 7.179443359375, 7.5494384765625, 7.91943359375, 8.2894287109375, 8.659423828125, 9.0294189453125, 9.3994140625, 9.7694091796875, 10.139404296875, 10.5093994140625, 10.87939453125, 11.2493896484375, 11.619384765625, 11.9893798828125, 12.359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 4.0, 15.0, 8.0, 12.0, 14.0, 14.0, 8.0, 15.0, 19.0, 29.0, 22.0, 32.0, 26.0, 31.0, 28.0, 42.0, 38.0, 33.0, 34.0, 46.0, 33.0, 38.0, 39.0, 43.0, 26.0, 30.0, 28.0, 33.0, 26.0, 31.0, 23.0, 31.0, 22.0, 14.0, 12.0, 14.0, 13.0, 8.0, 10.0, 15.0, 8.0, 5.0, 6.0, 9.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.513397216796875, -2.42913818359375, -2.344879150390625, -2.2606201171875, -2.176361083984375, -2.09210205078125, -2.007843017578125, -1.923583984375, -1.839324951171875, -1.75506591796875, -1.670806884765625, -1.5865478515625, -1.502288818359375, -1.41802978515625, -1.333770751953125, -1.24951171875, -1.165252685546875, -1.08099365234375, -0.996734619140625, -0.9124755859375, -0.828216552734375, -0.74395751953125, -0.659698486328125, -0.575439453125, -0.491180419921875, -0.40692138671875, -0.322662353515625, -0.2384033203125, -0.154144287109375, -0.06988525390625, 0.014373779296875, 0.0986328125, 0.182891845703125, 0.26715087890625, 0.351409912109375, 0.4356689453125, 0.519927978515625, 0.60418701171875, 0.688446044921875, 0.772705078125, 0.856964111328125, 0.94122314453125, 1.025482177734375, 1.1097412109375, 1.194000244140625, 1.27825927734375, 1.362518310546875, 1.44677734375, 1.531036376953125, 1.61529541015625, 1.699554443359375, 1.7838134765625, 1.868072509765625, 1.95233154296875, 2.036590576171875, 2.120849609375, 2.205108642578125, 2.28936767578125, 2.373626708984375, 2.4578857421875, 2.542144775390625, 2.62640380859375, 2.710662841796875, 2.794921875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 3.0, 14.0, 9.0, 15.0, 16.0, 18.0, 18.0, 23.0, 24.0, 31.0, 42.0, 21.0, 33.0, 33.0, 34.0, 39.0, 45.0, 47.0, 44.0, 53.0, 37.0, 42.0, 53.0, 33.0, 44.0, 27.0, 28.0, 25.0, 20.0, 16.0, 16.0, 19.0, 14.0, 14.0, 15.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.33330154418945, -43.064884185791016, -41.79646301269531, -40.528045654296875, -39.25962829589844, -37.991207122802734, -36.7227897644043, -35.454368591308594, -34.185951232910156, -32.91753387451172, -31.649112701416016, -30.380695343017578, -29.112276077270508, -27.843856811523438, -26.575439453125, -25.30702018737793, -24.03860092163086, -22.77018165588379, -21.50176239013672, -20.23334503173828, -18.96492576599121, -17.69650650024414, -16.428089141845703, -15.159669876098633, -13.891250610351562, -12.622831344604492, -11.354413032531738, -10.085994720458984, -8.817575454711914, -7.549156665802002, -6.28073787689209, -5.012319564819336, -3.743896484375, -2.475477695465088, -1.2070589065551758, 0.06135988235473633, 1.3297786712646484, 2.5981974601745605, 3.8666162490844727, 5.135034561157227, 6.403453826904297, 7.671872615814209, 8.940291404724121, 10.208709716796875, 11.477128982543945, 12.745548248291016, 14.01396656036377, 15.282384872436523, 16.550804138183594, 17.819223403930664, 19.087642669677734, 20.356060028076172, 21.624479293823242, 22.892898559570312, 24.16131591796875, 25.42973518371582, 26.69815444946289, 27.96657371520996, 29.23499298095703, 30.50341033935547, 31.77182960510254, 33.04024887084961, 34.30866622924805, 35.57708740234375, 36.84550476074219]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 6.0, 9.0, 16.0, 16.0, 25.0, 20.0, 26.0, 31.0, 33.0, 35.0, 43.0, 45.0, 46.0, 49.0, 46.0, 43.0, 57.0, 35.0, 49.0, 43.0, 45.0, 36.0, 49.0, 41.0, 28.0, 30.0, 22.0, 15.0, 13.0, 12.0, 4.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.892276763916016, -59.191890716552734, -57.49150466918945, -55.79111862182617, -54.09073257446289, -52.39034652709961, -50.68995666503906, -48.98957061767578, -47.2891845703125, -45.58879852294922, -43.88841247558594, -42.188026428222656, -40.487640380859375, -38.787254333496094, -37.08686828613281, -35.38648223876953, -33.68609619140625, -31.98571014404297, -30.285324096679688, -28.584938049316406, -26.884552001953125, -25.184165954589844, -23.48377799987793, -21.78339195251465, -20.083005905151367, -18.382619857788086, -16.682233810424805, -14.981846809387207, -13.281460762023926, -11.581074714660645, -9.880687713623047, -8.180301666259766, -6.479911804199219, -4.7795257568359375, -3.079139232635498, -1.3787527084350586, 0.32163333892822266, 2.022019386291504, 3.7224063873291016, 5.422792434692383, 7.123178482055664, 8.823564529418945, 10.523950576782227, 12.224337577819824, 13.924723625183105, 15.625109672546387, 17.325496673583984, 19.025882720947266, 20.726268768310547, 22.426654815673828, 24.12704086303711, 25.82742691040039, 27.527812957763672, 29.228199005126953, 30.928586959838867, 32.62897491455078, 34.32936096191406, 36.029747009277344, 37.730133056640625, 39.430519104003906, 41.13090515136719, 42.83129119873047, 44.53167724609375, 46.23206329345703, 47.93244934082031]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 12.0, 16.0, 22.0, 47.0, 75.0, 136.0, 228.0, 330.0, 589.0, 941.0, 1517.0, 2446.0, 3788.0, 5839.0, 9405.0, 14560.0, 21495.0, 30965.0, 43751.0, 58473.0, 74680.0, 90144.0, 101880.0, 106551.0, 103237.0, 92245.0, 78090.0, 61494.0, 46102.0, 32935.0, 23103.0, 15610.0, 10028.0, 6771.0, 4236.0, 2633.0, 1636.0, 1003.0, 619.0, 384.0, 220.0, 116.0, 79.0, 60.0, 31.0, 13.0, 11.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-31.3125, -30.38037109375, -29.4482421875, -28.51611328125, -27.583984375, -26.65185546875, -25.7197265625, -24.78759765625, -23.85546875, -22.92333984375, -21.9912109375, -21.05908203125, -20.126953125, -19.19482421875, -18.2626953125, -17.33056640625, -16.3984375, -15.46630859375, -14.5341796875, -13.60205078125, -12.669921875, -11.73779296875, -10.8056640625, -9.87353515625, -8.94140625, -8.00927734375, -7.0771484375, -6.14501953125, -5.212890625, -4.28076171875, -3.3486328125, -2.41650390625, -1.484375, -0.55224609375, 0.3798828125, 1.31201171875, 2.244140625, 3.17626953125, 4.1083984375, 5.04052734375, 5.97265625, 6.90478515625, 7.8369140625, 8.76904296875, 9.701171875, 10.63330078125, 11.5654296875, 12.49755859375, 13.4296875, 14.36181640625, 15.2939453125, 16.22607421875, 17.158203125, 18.09033203125, 19.0224609375, 19.95458984375, 20.88671875, 21.81884765625, 22.7509765625, 23.68310546875, 24.615234375, 25.54736328125, 26.4794921875, 27.41162109375, 28.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 8.0, 17.0, 14.0, 26.0, 21.0, 25.0, 34.0, 31.0, 37.0, 37.0, 45.0, 51.0, 45.0, 45.0, 49.0, 52.0, 41.0, 46.0, 45.0, 38.0, 44.0, 44.0, 45.0, 26.0, 30.0, 23.0, 14.0, 14.0, 11.0, 5.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.34375, -57.6875, -56.03125, -54.375, -52.71875, -51.0625, -49.40625, -47.75, -46.09375, -44.4375, -42.78125, -41.125, -39.46875, -37.8125, -36.15625, -34.5, -32.84375, -31.1875, -29.53125, -27.875, -26.21875, -24.5625, -22.90625, -21.25, -19.59375, -17.9375, -16.28125, -14.625, -12.96875, -11.3125, -9.65625, -8.0, -6.34375, -4.6875, -3.03125, -1.375, 0.28125, 1.9375, 3.59375, 5.25, 6.90625, 8.5625, 10.21875, 11.875, 13.53125, 15.1875, 16.84375, 18.5, 20.15625, 21.8125, 23.46875, 25.125, 26.78125, 28.4375, 30.09375, 31.75, 33.40625, 35.0625, 36.71875, 38.375, 40.03125, 41.6875, 43.34375, 45.0, 46.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 8.0, 11.0, 15.0, 22.0, 30.0, 57.0, 77.0, 158.0, 186.0, 310.0, 484.0, 790.0, 1225.0, 1920.0, 2965.0, 4453.0, 6915.0, 10390.0, 15728.0, 23565.0, 33259.0, 46859.0, 62840.0, 79771.0, 94534.0, 105606.0, 108024.0, 101675.0, 89148.0, 72779.0, 56138.0, 40843.0, 29121.0, 20110.0, 13231.0, 8807.0, 5819.0, 3836.0, 2499.0, 1517.0, 979.0, 681.0, 419.0, 229.0, 187.0, 105.0, 75.0, 50.0, 33.0, 25.0, 17.0, 12.0, 12.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-32.375, -31.37255859375, -30.3701171875, -29.36767578125, -28.365234375, -27.36279296875, -26.3603515625, -25.35791015625, -24.35546875, -23.35302734375, -22.3505859375, -21.34814453125, -20.345703125, -19.34326171875, -18.3408203125, -17.33837890625, -16.3359375, -15.33349609375, -14.3310546875, -13.32861328125, -12.326171875, -11.32373046875, -10.3212890625, -9.31884765625, -8.31640625, -7.31396484375, -6.3115234375, -5.30908203125, -4.306640625, -3.30419921875, -2.3017578125, -1.29931640625, -0.296875, 0.70556640625, 1.7080078125, 2.71044921875, 3.712890625, 4.71533203125, 5.7177734375, 6.72021484375, 7.72265625, 8.72509765625, 9.7275390625, 10.72998046875, 11.732421875, 12.73486328125, 13.7373046875, 14.73974609375, 15.7421875, 16.74462890625, 17.7470703125, 18.74951171875, 19.751953125, 20.75439453125, 21.7568359375, 22.75927734375, 23.76171875, 24.76416015625, 25.7666015625, 26.76904296875, 27.771484375, 28.77392578125, 29.7763671875, 30.77880859375, 31.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 8.0, 11.0, 7.0, 14.0, 14.0, 15.0, 23.0, 21.0, 21.0, 21.0, 30.0, 21.0, 30.0, 28.0, 40.0, 34.0, 32.0, 44.0, 43.0, 39.0, 44.0, 45.0, 39.0, 33.0, 41.0, 37.0, 31.0, 30.0, 31.0, 21.0, 19.0, 24.0, 17.0, 17.0, 19.0, 10.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.625, -26.75146484375, -25.8779296875, -25.00439453125, -24.130859375, -23.25732421875, -22.3837890625, -21.51025390625, -20.63671875, -19.76318359375, -18.8896484375, -18.01611328125, -17.142578125, -16.26904296875, -15.3955078125, -14.52197265625, -13.6484375, -12.77490234375, -11.9013671875, -11.02783203125, -10.154296875, -9.28076171875, -8.4072265625, -7.53369140625, -6.66015625, -5.78662109375, -4.9130859375, -4.03955078125, -3.166015625, -2.29248046875, -1.4189453125, -0.54541015625, 0.328125, 1.20166015625, 2.0751953125, 2.94873046875, 3.822265625, 4.69580078125, 5.5693359375, 6.44287109375, 7.31640625, 8.18994140625, 9.0634765625, 9.93701171875, 10.810546875, 11.68408203125, 12.5576171875, 13.43115234375, 14.3046875, 15.17822265625, 16.0517578125, 16.92529296875, 17.798828125, 18.67236328125, 19.5458984375, 20.41943359375, 21.29296875, 22.16650390625, 23.0400390625, 23.91357421875, 24.787109375, 25.66064453125, 26.5341796875, 27.40771484375, 28.28125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 12.0, 5.0, 6.0, 6.0, 18.0, 16.0, 20.0, 35.0, 44.0, 56.0, 80.0, 132.0, 180.0, 297.0, 450.0, 713.0, 1108.0, 1863.0, 3127.0, 5356.0, 10053.0, 18674.0, 37007.0, 72206.0, 127047.0, 184902.0, 202398.0, 163363.0, 102445.0, 55082.0, 28352.0, 14619.0, 7862.0, 4329.0, 2620.0, 1484.0, 887.0, 548.0, 356.0, 243.0, 135.0, 115.0, 82.0, 58.0, 45.0, 28.0, 30.0, 17.0, 13.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-20.453125, -19.8388671875, -19.224609375, -18.6103515625, -17.99609375, -17.3818359375, -16.767578125, -16.1533203125, -15.5390625, -14.9248046875, -14.310546875, -13.6962890625, -13.08203125, -12.4677734375, -11.853515625, -11.2392578125, -10.625, -10.0107421875, -9.396484375, -8.7822265625, -8.16796875, -7.5537109375, -6.939453125, -6.3251953125, -5.7109375, -5.0966796875, -4.482421875, -3.8681640625, -3.25390625, -2.6396484375, -2.025390625, -1.4111328125, -0.796875, -0.1826171875, 0.431640625, 1.0458984375, 1.66015625, 2.2744140625, 2.888671875, 3.5029296875, 4.1171875, 4.7314453125, 5.345703125, 5.9599609375, 6.57421875, 7.1884765625, 7.802734375, 8.4169921875, 9.03125, 9.6455078125, 10.259765625, 10.8740234375, 11.48828125, 12.1025390625, 12.716796875, 13.3310546875, 13.9453125, 14.5595703125, 15.173828125, 15.7880859375, 16.40234375, 17.0166015625, 17.630859375, 18.2451171875, 18.859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 15.0, 7.0, 20.0, 18.0, 23.0, 28.0, 29.0, 33.0, 43.0, 58.0, 67.0, 49.0, 76.0, 67.0, 62.0, 61.0, 63.0, 60.0, 28.0, 37.0, 29.0, 18.0, 17.0, 12.0, 12.0, 12.0, 12.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0020046234130859375, -0.0019434690475463867, -0.001882314682006836, -0.0018211603164672852, -0.0017600059509277344, -0.0016988515853881836, -0.0016376972198486328, -0.001576542854309082, -0.0015153884887695312, -0.0014542341232299805, -0.0013930797576904297, -0.001331925392150879, -0.0012707710266113281, -0.0012096166610717773, -0.0011484622955322266, -0.0010873079299926758, -0.001026153564453125, -0.0009649991989135742, -0.0009038448333740234, -0.0008426904678344727, -0.0007815361022949219, -0.0007203817367553711, -0.0006592273712158203, -0.0005980730056762695, -0.0005369186401367188, -0.00047576427459716797, -0.0004146099090576172, -0.0003534555435180664, -0.0002923011779785156, -0.00023114681243896484, -0.00016999244689941406, -0.00010883808135986328, -4.76837158203125e-05, 1.3470649719238281e-05, 7.462501525878906e-05, 0.00013577938079833984, 0.00019693374633789062, 0.0002580881118774414, 0.0003192424774169922, 0.00038039684295654297, 0.00044155120849609375, 0.0005027055740356445, 0.0005638599395751953, 0.0006250143051147461, 0.0006861686706542969, 0.0007473230361938477, 0.0008084774017333984, 0.0008696317672729492, 0.0009307861328125, 0.0009919404983520508, 0.0010530948638916016, 0.0011142492294311523, 0.0011754035949707031, 0.001236557960510254, 0.0012977123260498047, 0.0013588666915893555, 0.0014200210571289062, 0.001481175422668457, 0.0015423297882080078, 0.0016034841537475586, 0.0016646385192871094, 0.0017257928848266602, 0.001786947250366211, 0.0018481016159057617, 0.0019092559814453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 12.0, 17.0, 22.0, 30.0, 63.0, 75.0, 103.0, 158.0, 238.0, 319.0, 574.0, 877.0, 1432.0, 2473.0, 4301.0, 7669.0, 13781.0, 25507.0, 46547.0, 80000.0, 123813.0, 162759.0, 174285.0, 149141.0, 106145.0, 65501.0, 36810.0, 20235.0, 10872.0, 6074.0, 3429.0, 1949.0, 1268.0, 720.0, 452.0, 313.0, 194.0, 120.0, 81.0, 64.0, 33.0, 35.0, 17.0, 18.0, 12.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.359375, -16.838134765625, -16.31689453125, -15.795654296875, -15.2744140625, -14.753173828125, -14.23193359375, -13.710693359375, -13.189453125, -12.668212890625, -12.14697265625, -11.625732421875, -11.1044921875, -10.583251953125, -10.06201171875, -9.540771484375, -9.01953125, -8.498291015625, -7.97705078125, -7.455810546875, -6.9345703125, -6.413330078125, -5.89208984375, -5.370849609375, -4.849609375, -4.328369140625, -3.80712890625, -3.285888671875, -2.7646484375, -2.243408203125, -1.72216796875, -1.200927734375, -0.6796875, -0.158447265625, 0.36279296875, 0.884033203125, 1.4052734375, 1.926513671875, 2.44775390625, 2.968994140625, 3.490234375, 4.011474609375, 4.53271484375, 5.053955078125, 5.5751953125, 6.096435546875, 6.61767578125, 7.138916015625, 7.66015625, 8.181396484375, 8.70263671875, 9.223876953125, 9.7451171875, 10.266357421875, 10.78759765625, 11.308837890625, 11.830078125, 12.351318359375, 12.87255859375, 13.393798828125, 13.9150390625, 14.436279296875, 14.95751953125, 15.478759765625, 16.0]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 3.0, 11.0, 16.0, 31.0, 34.0, 44.0, 42.0, 34.0, 56.0, 57.0, 59.0, 64.0, 60.0, 68.0, 57.0, 55.0, 37.0, 44.0, 48.0, 34.0, 30.0, 22.0, 13.0, 16.0, 20.0, 7.0, 3.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.9066162109375, -5.696044921875, -5.4854736328125, -5.27490234375, -5.0643310546875, -4.853759765625, -4.6431884765625, -4.4326171875, -4.2220458984375, -4.011474609375, -3.8009033203125, -3.59033203125, -3.3797607421875, -3.169189453125, -2.9586181640625, -2.748046875, -2.5374755859375, -2.326904296875, -2.1163330078125, -1.90576171875, -1.6951904296875, -1.484619140625, -1.2740478515625, -1.0634765625, -0.8529052734375, -0.642333984375, -0.4317626953125, -0.22119140625, -0.0106201171875, 0.199951171875, 0.4105224609375, 0.62109375, 0.8316650390625, 1.042236328125, 1.2528076171875, 1.46337890625, 1.6739501953125, 1.884521484375, 2.0950927734375, 2.3056640625, 2.5162353515625, 2.726806640625, 2.9373779296875, 3.14794921875, 3.3585205078125, 3.569091796875, 3.7796630859375, 3.990234375, 4.2008056640625, 4.411376953125, 4.6219482421875, 4.83251953125, 5.0430908203125, 5.253662109375, 5.4642333984375, 5.6748046875, 5.8853759765625, 6.095947265625, 6.3065185546875, 6.51708984375, 6.7276611328125, 6.938232421875, 7.1488037109375, 7.359375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 8.0, 8.0, 4.0, 9.0, 15.0, 10.0, 14.0, 20.0, 18.0, 33.0, 15.0, 26.0, 31.0, 47.0, 28.0, 29.0, 39.0, 41.0, 54.0, 43.0, 49.0, 57.0, 44.0, 35.0, 39.0, 39.0, 45.0, 21.0, 30.0, 21.0, 21.0, 25.0, 15.0, 14.0, 18.0, 10.0, 14.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-45.150146484375, -43.81840133666992, -42.48665237426758, -41.1549072265625, -39.82316207885742, -38.491416931152344, -37.15966796875, -35.82792282104492, -34.496177673339844, -33.164432525634766, -31.832685470581055, -30.500938415527344, -29.169193267822266, -27.837446212768555, -26.505699157714844, -25.173954010009766, -23.842205047607422, -22.51045799255371, -21.178712844848633, -19.846965789794922, -18.515220642089844, -17.183473587036133, -15.851726531982422, -14.519980430603027, -13.188234329223633, -11.856488227844238, -10.524742126464844, -9.192995071411133, -7.861248970031738, -6.529502868652344, -5.197756290435791, -3.8660097122192383, -2.5342636108398438, -1.2025172710418701, 0.12922906875610352, 1.4609754085540771, 2.792721748352051, 4.124467849731445, 5.456214427947998, 6.787961006164551, 8.119707107543945, 9.45145320892334, 10.783199310302734, 12.114946365356445, 13.44669246673584, 14.778438568115234, 16.110185623168945, 17.441932678222656, 18.773677825927734, 20.105424880981445, 21.437170028686523, 22.768917083740234, 24.100662231445312, 25.432409286499023, 26.764156341552734, 28.095901489257812, 29.427648544311523, 30.759395599365234, 32.09114074707031, 33.42288589477539, 34.754634857177734, 36.08638000488281, 37.41812515258789, 38.749874114990234, 40.08161926269531]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 10.0, 14.0, 22.0, 17.0, 16.0, 25.0, 31.0, 40.0, 36.0, 43.0, 35.0, 50.0, 44.0, 46.0, 48.0, 49.0, 49.0, 63.0, 40.0, 46.0, 51.0, 42.0, 33.0, 25.0, 20.0, 22.0, 18.0, 12.0, 9.0, 14.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.722686767578125, -60.859710693359375, -58.99673080444336, -57.13375473022461, -55.270774841308594, -53.407798767089844, -51.544822692871094, -49.68184280395508, -47.81886291503906, -45.95588684082031, -44.0929069519043, -42.22993087768555, -40.36695098876953, -38.50397491455078, -36.64099884033203, -34.778018951416016, -32.915042877197266, -31.052064895629883, -29.1890869140625, -27.32611083984375, -25.463130950927734, -23.600154876708984, -21.7371768951416, -19.87419891357422, -18.011220932006836, -16.148242950439453, -14.28526496887207, -12.422287940979004, -10.559309959411621, -8.696331977844238, -6.833354949951172, -4.970376968383789, -3.107402801513672, -1.2444250583648682, 0.6185526847839355, 2.48153018951416, 4.344508171081543, 6.207486152648926, 8.070463180541992, 9.933441162109375, 11.796419143676758, 13.65939712524414, 15.522375106811523, 17.385353088378906, 19.248329162597656, 21.111309051513672, 22.974285125732422, 24.837263107299805, 26.700241088867188, 28.56321907043457, 30.426197052001953, 32.2891731262207, 34.15215301513672, 36.01512908935547, 37.87810516357422, 39.741085052490234, 41.60406494140625, 43.467041015625, 45.330020904541016, 47.192996978759766, 49.05597686767578, 50.91895294189453, 52.78192901611328, 54.6449089050293, 56.50788497924805]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 15.0, 33.0, 55.0, 73.0, 103.0, 177.0, 348.0, 601.0, 1094.0, 1856.0, 3393.0, 5870.0, 10244.0, 18058.0, 30596.0, 52258.0, 86718.0, 139877.0, 214634.0, 308968.0, 413144.0, 498442.0, 534493.0, 507938.0, 429167.0, 327348.0, 229498.0, 150039.0, 94571.0, 56818.0, 33247.0, 19367.0, 10887.0, 6230.0, 3547.0, 1997.0, 1103.0, 602.0, 367.0, 196.0, 108.0, 74.0, 46.0, 37.0, 24.0, 12.0, 6.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.75, -37.62939453125, -36.5087890625, -35.38818359375, -34.267578125, -33.14697265625, -32.0263671875, -30.90576171875, -29.78515625, -28.66455078125, -27.5439453125, -26.42333984375, -25.302734375, -24.18212890625, -23.0615234375, -21.94091796875, -20.8203125, -19.69970703125, -18.5791015625, -17.45849609375, -16.337890625, -15.21728515625, -14.0966796875, -12.97607421875, -11.85546875, -10.73486328125, -9.6142578125, -8.49365234375, -7.373046875, -6.25244140625, -5.1318359375, -4.01123046875, -2.890625, -1.77001953125, -0.6494140625, 0.47119140625, 1.591796875, 2.71240234375, 3.8330078125, 4.95361328125, 6.07421875, 7.19482421875, 8.3154296875, 9.43603515625, 10.556640625, 11.67724609375, 12.7978515625, 13.91845703125, 15.0390625, 16.15966796875, 17.2802734375, 18.40087890625, 19.521484375, 20.64208984375, 21.7626953125, 22.88330078125, 24.00390625, 25.12451171875, 26.2451171875, 27.36572265625, 28.486328125, 29.60693359375, 30.7275390625, 31.84814453125, 32.96875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 9.0, 13.0, 14.0, 17.0, 17.0, 21.0, 22.0, 32.0, 44.0, 37.0, 38.0, 35.0, 42.0, 53.0, 41.0, 52.0, 48.0, 51.0, 59.0, 44.0, 38.0, 55.0, 38.0, 30.0, 27.0, 22.0, 22.0, 17.0, 14.0, 9.0, 14.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.9375, -48.45361328125, -46.9697265625, -45.48583984375, -44.001953125, -42.51806640625, -41.0341796875, -39.55029296875, -38.06640625, -36.58251953125, -35.0986328125, -33.61474609375, -32.130859375, -30.64697265625, -29.1630859375, -27.67919921875, -26.1953125, -24.71142578125, -23.2275390625, -21.74365234375, -20.259765625, -18.77587890625, -17.2919921875, -15.80810546875, -14.32421875, -12.84033203125, -11.3564453125, -9.87255859375, -8.388671875, -6.90478515625, -5.4208984375, -3.93701171875, -2.453125, -0.96923828125, 0.5146484375, 1.99853515625, 3.482421875, 4.96630859375, 6.4501953125, 7.93408203125, 9.41796875, 10.90185546875, 12.3857421875, 13.86962890625, 15.353515625, 16.83740234375, 18.3212890625, 19.80517578125, 21.2890625, 22.77294921875, 24.2568359375, 25.74072265625, 27.224609375, 28.70849609375, 30.1923828125, 31.67626953125, 33.16015625, 34.64404296875, 36.1279296875, 37.61181640625, 39.095703125, 40.57958984375, 42.0634765625, 43.54736328125, 45.03125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 19.0, 29.0, 65.0, 97.0, 186.0, 293.0, 490.0, 903.0, 1343.0, 2292.0, 3717.0, 6049.0, 9462.0, 14979.0, 23349.0, 35343.0, 52758.0, 77022.0, 107884.0, 148219.0, 192646.0, 243321.0, 292539.0, 334477.0, 364633.0, 373412.0, 363563.0, 335390.0, 291388.0, 242452.0, 192961.0, 147058.0, 108002.0, 76766.0, 52869.0, 35695.0, 23126.0, 14667.0, 9617.0, 5934.0, 3704.0, 2146.0, 1357.0, 808.0, 511.0, 326.0, 185.0, 81.0, 53.0, 45.0, 24.0, 12.0, 3.0, 6.0, 0.0, 1.0, 3.0], "bins": [-27.125, -26.290283203125, -25.45556640625, -24.620849609375, -23.7861328125, -22.951416015625, -22.11669921875, -21.281982421875, -20.447265625, -19.612548828125, -18.77783203125, -17.943115234375, -17.1083984375, -16.273681640625, -15.43896484375, -14.604248046875, -13.76953125, -12.934814453125, -12.10009765625, -11.265380859375, -10.4306640625, -9.595947265625, -8.76123046875, -7.926513671875, -7.091796875, -6.257080078125, -5.42236328125, -4.587646484375, -3.7529296875, -2.918212890625, -2.08349609375, -1.248779296875, -0.4140625, 0.420654296875, 1.25537109375, 2.090087890625, 2.9248046875, 3.759521484375, 4.59423828125, 5.428955078125, 6.263671875, 7.098388671875, 7.93310546875, 8.767822265625, 9.6025390625, 10.437255859375, 11.27197265625, 12.106689453125, 12.94140625, 13.776123046875, 14.61083984375, 15.445556640625, 16.2802734375, 17.114990234375, 17.94970703125, 18.784423828125, 19.619140625, 20.453857421875, 21.28857421875, 22.123291015625, 22.9580078125, 23.792724609375, 24.62744140625, 25.462158203125, 26.296875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 13.0, 13.0, 21.0, 44.0, 45.0, 40.0, 65.0, 72.0, 80.0, 93.0, 121.0, 139.0, 160.0, 158.0, 201.0, 166.0, 202.0, 215.0, 217.0, 220.0, 212.0, 210.0, 192.0, 163.0, 161.0, 145.0, 120.0, 101.0, 81.0, 70.0, 60.0, 58.0, 49.0, 30.0, 30.0, 22.0, 14.0, 18.0, 9.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.953125, -17.3994140625, -16.845703125, -16.2919921875, -15.73828125, -15.1845703125, -14.630859375, -14.0771484375, -13.5234375, -12.9697265625, -12.416015625, -11.8623046875, -11.30859375, -10.7548828125, -10.201171875, -9.6474609375, -9.09375, -8.5400390625, -7.986328125, -7.4326171875, -6.87890625, -6.3251953125, -5.771484375, -5.2177734375, -4.6640625, -4.1103515625, -3.556640625, -3.0029296875, -2.44921875, -1.8955078125, -1.341796875, -0.7880859375, -0.234375, 0.3193359375, 0.873046875, 1.4267578125, 1.98046875, 2.5341796875, 3.087890625, 3.6416015625, 4.1953125, 4.7490234375, 5.302734375, 5.8564453125, 6.41015625, 6.9638671875, 7.517578125, 8.0712890625, 8.625, 9.1787109375, 9.732421875, 10.2861328125, 10.83984375, 11.3935546875, 11.947265625, 12.5009765625, 13.0546875, 13.6083984375, 14.162109375, 14.7158203125, 15.26953125, 15.8232421875, 16.376953125, 16.9306640625, 17.484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 11.0, 7.0, 8.0, 11.0, 15.0, 8.0, 18.0, 18.0, 18.0, 18.0, 35.0, 21.0, 50.0, 34.0, 42.0, 35.0, 46.0, 38.0, 39.0, 49.0, 43.0, 50.0, 50.0, 40.0, 36.0, 20.0, 34.0, 29.0, 28.0, 14.0, 19.0, 16.0, 12.0, 10.0, 13.0, 12.0, 11.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.42414474487305, -37.19244384765625, -35.96074676513672, -34.72904586791992, -33.497344970703125, -32.265647888183594, -31.033946990966797, -29.80224609375, -28.570547103881836, -27.338848114013672, -26.107147216796875, -24.87544822692871, -23.643749237060547, -22.41204833984375, -21.180349349975586, -19.948650360107422, -18.716949462890625, -17.48525047302246, -16.253549575805664, -15.0218505859375, -13.79015064239502, -12.558450698852539, -11.326751708984375, -10.095051765441895, -8.863351821899414, -7.631651878356934, -6.399952411651611, -5.168252944946289, -3.9365530014038086, -2.704853057861328, -1.4731535911560059, -0.2414541244506836, 0.9902458190917969, 2.2219455242156982, 3.4536452293395996, 4.685344696044922, 5.917044639587402, 7.148744583129883, 8.380443572998047, 9.612143516540527, 10.843843460083008, 12.075543403625488, 13.307243347167969, 14.538942337036133, 15.770642280578613, 17.002342224121094, 18.234041213989258, 19.465740203857422, 20.69744110107422, 21.929140090942383, 23.16084098815918, 24.392539978027344, 25.62424087524414, 26.855939865112305, 28.08763885498047, 29.319339752197266, 30.55103874206543, 31.782737731933594, 33.01443862915039, 34.24613952636719, 35.47783660888672, 36.709537506103516, 37.94123840332031, 39.172935485839844, 40.40463638305664]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 4.0, 10.0, 10.0, 13.0, 11.0, 22.0, 20.0, 26.0, 36.0, 34.0, 41.0, 38.0, 41.0, 35.0, 37.0, 44.0, 57.0, 48.0, 47.0, 55.0, 50.0, 51.0, 50.0, 38.0, 32.0, 30.0, 24.0, 16.0, 16.0, 14.0, 9.0, 13.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75094985961914, -52.07831573486328, -50.40568161010742, -48.73304748535156, -47.0604133605957, -45.387779235839844, -43.71514892578125, -42.042510986328125, -40.36988067626953, -38.69724655151367, -37.02461242675781, -35.35197830200195, -33.679344177246094, -32.006710052490234, -30.334077835083008, -28.66144371032715, -26.988807678222656, -25.316173553466797, -23.643539428710938, -21.970905303955078, -20.29827117919922, -18.62563705444336, -16.953004837036133, -15.280370712280273, -13.607736587524414, -11.935102462768555, -10.262468338012695, -8.589835166931152, -6.917201042175293, -5.244566917419434, -3.5719337463378906, -1.8992996215820312, -0.2266693115234375, 1.4459645748138428, 3.118598461151123, 4.791232109069824, 6.463866233825684, 8.136500358581543, 9.809133529663086, 11.481767654418945, 13.154401779174805, 14.827035903930664, 16.499670028686523, 18.17230224609375, 19.84493637084961, 21.51757049560547, 23.190204620361328, 24.862838745117188, 26.535472869873047, 28.208106994628906, 29.880741119384766, 31.553375244140625, 33.226009368896484, 34.898643493652344, 36.57127380371094, 38.24391174316406, 39.916542053222656, 41.589176177978516, 43.261810302734375, 44.934444427490234, 46.607078552246094, 48.27971267700195, 49.95234680175781, 51.624977111816406, 53.29761505126953]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 15.0, 15.0, 16.0, 23.0, 41.0, 51.0, 64.0, 118.0, 144.0, 229.0, 311.0, 460.0, 683.0, 987.0, 1438.0, 2201.0, 3665.0, 6216.0, 11011.0, 21680.0, 43672.0, 94420.0, 205677.0, 298613.0, 186076.0, 85013.0, 39955.0, 19748.0, 10314.0, 5748.0, 3442.0, 2196.0, 1414.0, 947.0, 590.0, 429.0, 276.0, 207.0, 130.0, 91.0, 65.0, 50.0, 39.0, 16.0, 16.0, 18.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.3671875, -14.8450927734375, -14.322998046875, -13.8009033203125, -13.27880859375, -12.7567138671875, -12.234619140625, -11.7125244140625, -11.1904296875, -10.6683349609375, -10.146240234375, -9.6241455078125, -9.10205078125, -8.5799560546875, -8.057861328125, -7.5357666015625, -7.013671875, -6.4915771484375, -5.969482421875, -5.4473876953125, -4.92529296875, -4.4031982421875, -3.881103515625, -3.3590087890625, -2.8369140625, -2.3148193359375, -1.792724609375, -1.2706298828125, -0.74853515625, -0.2264404296875, 0.295654296875, 0.8177490234375, 1.33984375, 1.8619384765625, 2.384033203125, 2.9061279296875, 3.42822265625, 3.9503173828125, 4.472412109375, 4.9945068359375, 5.5166015625, 6.0386962890625, 6.560791015625, 7.0828857421875, 7.60498046875, 8.1270751953125, 8.649169921875, 9.1712646484375, 9.693359375, 10.2154541015625, 10.737548828125, 11.2596435546875, 11.78173828125, 12.3038330078125, 12.825927734375, 13.3480224609375, 13.8701171875, 14.3922119140625, 14.914306640625, 15.4364013671875, 15.95849609375, 16.4805908203125, 17.002685546875, 17.5247802734375, 18.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 7.0, 3.0, 10.0, 10.0, 15.0, 10.0, 21.0, 21.0, 26.0, 37.0, 31.0, 40.0, 40.0, 43.0, 32.0, 41.0, 41.0, 55.0, 53.0, 47.0, 55.0, 50.0, 51.0, 47.0, 40.0, 32.0, 31.0, 21.0, 16.0, 18.0, 12.0, 11.0, 11.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.64404296875, -49.9755859375, -48.30712890625, -46.638671875, -44.97021484375, -43.3017578125, -41.63330078125, -39.96484375, -38.29638671875, -36.6279296875, -34.95947265625, -33.291015625, -31.62255859375, -29.9541015625, -28.28564453125, -26.6171875, -24.94873046875, -23.2802734375, -21.61181640625, -19.943359375, -18.27490234375, -16.6064453125, -14.93798828125, -13.26953125, -11.60107421875, -9.9326171875, -8.26416015625, -6.595703125, -4.92724609375, -3.2587890625, -1.59033203125, 0.078125, 1.74658203125, 3.4150390625, 5.08349609375, 6.751953125, 8.42041015625, 10.0888671875, 11.75732421875, 13.42578125, 15.09423828125, 16.7626953125, 18.43115234375, 20.099609375, 21.76806640625, 23.4365234375, 25.10498046875, 26.7734375, 28.44189453125, 30.1103515625, 31.77880859375, 33.447265625, 35.11572265625, 36.7841796875, 38.45263671875, 40.12109375, 41.78955078125, 43.4580078125, 45.12646484375, 46.794921875, 48.46337890625, 50.1318359375, 51.80029296875, 53.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 16.0, 13.0, 10.0, 28.0, 22.0, 30.0, 31.0, 42.0, 65.0, 75.0, 91.0, 164.0, 244.0, 366.0, 554.0, 921.0, 1582.0, 2724.0, 5061.0, 10309.0, 23648.0, 63848.0, 215301.0, 461378.0, 169449.0, 52633.0, 20097.0, 9046.0, 4476.0, 2478.0, 1381.0, 901.0, 492.0, 319.0, 195.0, 150.0, 103.0, 86.0, 65.0, 44.0, 28.0, 17.0, 15.0, 9.0, 14.0, 10.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-15.34375, -14.855224609375, -14.36669921875, -13.878173828125, -13.3896484375, -12.901123046875, -12.41259765625, -11.924072265625, -11.435546875, -10.947021484375, -10.45849609375, -9.969970703125, -9.4814453125, -8.992919921875, -8.50439453125, -8.015869140625, -7.52734375, -7.038818359375, -6.55029296875, -6.061767578125, -5.5732421875, -5.084716796875, -4.59619140625, -4.107666015625, -3.619140625, -3.130615234375, -2.64208984375, -2.153564453125, -1.6650390625, -1.176513671875, -0.68798828125, -0.199462890625, 0.2890625, 0.777587890625, 1.26611328125, 1.754638671875, 2.2431640625, 2.731689453125, 3.22021484375, 3.708740234375, 4.197265625, 4.685791015625, 5.17431640625, 5.662841796875, 6.1513671875, 6.639892578125, 7.12841796875, 7.616943359375, 8.10546875, 8.593994140625, 9.08251953125, 9.571044921875, 10.0595703125, 10.548095703125, 11.03662109375, 11.525146484375, 12.013671875, 12.502197265625, 12.99072265625, 13.479248046875, 13.9677734375, 14.456298828125, 14.94482421875, 15.433349609375, 15.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 4.0, 4.0, 5.0, 10.0, 4.0, 8.0, 7.0, 6.0, 12.0, 11.0, 20.0, 24.0, 17.0, 23.0, 25.0, 29.0, 29.0, 40.0, 27.0, 31.0, 37.0, 39.0, 35.0, 34.0, 42.0, 39.0, 35.0, 33.0, 38.0, 33.0, 35.0, 31.0, 24.0, 33.0, 23.0, 22.0, 20.0, 20.0, 16.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 7.0, 3.0, 5.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-31.375, -30.460205078125, -29.54541015625, -28.630615234375, -27.7158203125, -26.801025390625, -25.88623046875, -24.971435546875, -24.056640625, -23.141845703125, -22.22705078125, -21.312255859375, -20.3974609375, -19.482666015625, -18.56787109375, -17.653076171875, -16.73828125, -15.823486328125, -14.90869140625, -13.993896484375, -13.0791015625, -12.164306640625, -11.24951171875, -10.334716796875, -9.419921875, -8.505126953125, -7.59033203125, -6.675537109375, -5.7607421875, -4.845947265625, -3.93115234375, -3.016357421875, -2.1015625, -1.186767578125, -0.27197265625, 0.642822265625, 1.5576171875, 2.472412109375, 3.38720703125, 4.302001953125, 5.216796875, 6.131591796875, 7.04638671875, 7.961181640625, 8.8759765625, 9.790771484375, 10.70556640625, 11.620361328125, 12.53515625, 13.449951171875, 14.36474609375, 15.279541015625, 16.1943359375, 17.109130859375, 18.02392578125, 18.938720703125, 19.853515625, 20.768310546875, 21.68310546875, 22.597900390625, 23.5126953125, 24.427490234375, 25.34228515625, 26.257080078125, 27.171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 10.0, 14.0, 18.0, 31.0, 46.0, 47.0, 72.0, 100.0, 179.0, 254.0, 392.0, 673.0, 1071.0, 1837.0, 3315.0, 6760.0, 16777.0, 56323.0, 395150.0, 467963.0, 63449.0, 18241.0, 7243.0, 3605.0, 1844.0, 1084.0, 686.0, 435.0, 288.0, 201.0, 149.0, 75.0, 57.0, 38.0, 34.0, 15.0, 11.0, 17.0, 6.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5390625, -11.1898193359375, -10.840576171875, -10.4913330078125, -10.14208984375, -9.7928466796875, -9.443603515625, -9.0943603515625, -8.7451171875, -8.3958740234375, -8.046630859375, -7.6973876953125, -7.34814453125, -6.9989013671875, -6.649658203125, -6.3004150390625, -5.951171875, -5.6019287109375, -5.252685546875, -4.9034423828125, -4.55419921875, -4.2049560546875, -3.855712890625, -3.5064697265625, -3.1572265625, -2.8079833984375, -2.458740234375, -2.1094970703125, -1.76025390625, -1.4110107421875, -1.061767578125, -0.7125244140625, -0.36328125, -0.0140380859375, 0.335205078125, 0.6844482421875, 1.03369140625, 1.3829345703125, 1.732177734375, 2.0814208984375, 2.4306640625, 2.7799072265625, 3.129150390625, 3.4783935546875, 3.82763671875, 4.1768798828125, 4.526123046875, 4.8753662109375, 5.224609375, 5.5738525390625, 5.923095703125, 6.2723388671875, 6.62158203125, 6.9708251953125, 7.320068359375, 7.6693115234375, 8.0185546875, 8.3677978515625, 8.717041015625, 9.0662841796875, 9.41552734375, 9.7647705078125, 10.114013671875, 10.4632568359375, 10.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 14.0, 20.0, 21.0, 39.0, 59.0, 111.0, 184.0, 171.0, 140.0, 82.0, 47.0, 27.0, 22.0, 10.0, 9.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015878677368164062, -0.001539960503578186, -0.0014920532703399658, -0.0014441460371017456, -0.0013962388038635254, -0.0013483315706253052, -0.001300424337387085, -0.0012525171041488647, -0.0012046098709106445, -0.0011567026376724243, -0.001108795404434204, -0.0010608881711959839, -0.0010129809379577637, -0.0009650737047195435, -0.0009171664714813232, -0.000869259238243103, -0.0008213520050048828, -0.0007734447717666626, -0.0007255375385284424, -0.0006776303052902222, -0.000629723072052002, -0.0005818158388137817, -0.0005339086055755615, -0.0004860013723373413, -0.0004380941390991211, -0.0003901869058609009, -0.00034227967262268066, -0.00029437243938446045, -0.00024646520614624023, -0.00019855797290802002, -0.0001506507396697998, -0.00010274350643157959, -5.4836273193359375e-05, -6.92903995513916e-06, 4.0978193283081055e-05, 8.888542652130127e-05, 0.00013679265975952148, 0.0001846998929977417, 0.00023260712623596191, 0.00028051435947418213, 0.00032842159271240234, 0.00037632882595062256, 0.0004242360591888428, 0.000472143292427063, 0.0005200505256652832, 0.0005679577589035034, 0.0006158649921417236, 0.0006637722253799438, 0.0007116794586181641, 0.0007595866918563843, 0.0008074939250946045, 0.0008554011583328247, 0.0009033083915710449, 0.0009512156248092651, 0.0009991228580474854, 0.0010470300912857056, 0.0010949373245239258, 0.001142844557762146, 0.0011907517910003662, 0.0012386590242385864, 0.0012865662574768066, 0.0013344734907150269, 0.001382380723953247, 0.0014302879571914673, 0.0014781951904296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 10.0, 7.0, 16.0, 15.0, 24.0, 31.0, 52.0, 77.0, 108.0, 153.0, 195.0, 239.0, 373.0, 450.0, 620.0, 825.0, 1077.0, 1540.0, 2190.0, 2870.0, 4128.0, 5716.0, 8484.0, 12727.0, 20797.0, 36984.0, 73961.0, 160047.0, 289424.0, 209327.0, 96323.0, 46372.0, 25069.0, 15023.0, 9670.0, 6714.0, 4686.0, 3317.0, 2362.0, 1763.0, 1227.0, 928.0, 678.0, 528.0, 353.0, 273.0, 228.0, 156.0, 131.0, 90.0, 71.0, 46.0, 30.0, 14.0, 19.0, 12.0, 6.0, 4.0, 5.0, 1.0], "bins": [-9.4296875, -9.14111328125, -8.8525390625, -8.56396484375, -8.275390625, -7.98681640625, -7.6982421875, -7.40966796875, -7.12109375, -6.83251953125, -6.5439453125, -6.25537109375, -5.966796875, -5.67822265625, -5.3896484375, -5.10107421875, -4.8125, -4.52392578125, -4.2353515625, -3.94677734375, -3.658203125, -3.36962890625, -3.0810546875, -2.79248046875, -2.50390625, -2.21533203125, -1.9267578125, -1.63818359375, -1.349609375, -1.06103515625, -0.7724609375, -0.48388671875, -0.1953125, 0.09326171875, 0.3818359375, 0.67041015625, 0.958984375, 1.24755859375, 1.5361328125, 1.82470703125, 2.11328125, 2.40185546875, 2.6904296875, 2.97900390625, 3.267578125, 3.55615234375, 3.8447265625, 4.13330078125, 4.421875, 4.71044921875, 4.9990234375, 5.28759765625, 5.576171875, 5.86474609375, 6.1533203125, 6.44189453125, 6.73046875, 7.01904296875, 7.3076171875, 7.59619140625, 7.884765625, 8.17333984375, 8.4619140625, 8.75048828125, 9.0390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 4.0, 7.0, 2.0, 11.0, 12.0, 15.0, 22.0, 46.0, 63.0, 85.0, 93.0, 93.0, 98.0, 82.0, 74.0, 60.0, 55.0, 29.0, 25.0, 17.0, 9.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-6.18359375, -5.9857177734375, -5.787841796875, -5.5899658203125, -5.39208984375, -5.1942138671875, -4.996337890625, -4.7984619140625, -4.6005859375, -4.4027099609375, -4.204833984375, -4.0069580078125, -3.80908203125, -3.6112060546875, -3.413330078125, -3.2154541015625, -3.017578125, -2.8197021484375, -2.621826171875, -2.4239501953125, -2.22607421875, -2.0281982421875, -1.830322265625, -1.6324462890625, -1.4345703125, -1.2366943359375, -1.038818359375, -0.8409423828125, -0.64306640625, -0.4451904296875, -0.247314453125, -0.0494384765625, 0.1484375, 0.3463134765625, 0.544189453125, 0.7420654296875, 0.93994140625, 1.1378173828125, 1.335693359375, 1.5335693359375, 1.7314453125, 1.9293212890625, 2.127197265625, 2.3250732421875, 2.52294921875, 2.7208251953125, 2.918701171875, 3.1165771484375, 3.314453125, 3.5123291015625, 3.710205078125, 3.9080810546875, 4.10595703125, 4.3038330078125, 4.501708984375, 4.6995849609375, 4.8974609375, 5.0953369140625, 5.293212890625, 5.4910888671875, 5.68896484375, 5.8868408203125, 6.084716796875, 6.2825927734375, 6.48046875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 8.0, 9.0, 12.0, 10.0, 11.0, 14.0, 14.0, 18.0, 21.0, 29.0, 36.0, 35.0, 35.0, 43.0, 38.0, 40.0, 46.0, 42.0, 40.0, 54.0, 46.0, 51.0, 41.0, 30.0, 35.0, 34.0, 35.0, 21.0, 23.0, 14.0, 16.0, 15.0, 12.0, 9.0, 13.0, 11.0, 10.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.810516357421875, -38.53291702270508, -37.25532150268555, -35.97772216796875, -34.70012664794922, -33.42252731323242, -32.144927978515625, -30.86733055114746, -29.589733123779297, -28.312135696411133, -27.03453826904297, -25.756938934326172, -24.479341506958008, -23.201744079589844, -21.924144744873047, -20.646547317504883, -19.36894989013672, -18.091352462768555, -16.81375503540039, -15.536155700683594, -14.25855827331543, -12.980960845947266, -11.703362464904785, -10.425764083862305, -9.14816665649414, -7.870568752288818, -6.592970848083496, -5.315372943878174, -4.037775039672852, -2.7601771354675293, -1.482579231262207, -0.20498085021972656, 1.0726203918457031, 2.3502182960510254, 3.6278162002563477, 4.90541410446167, 6.183012008666992, 7.4606099128723145, 8.738207817077637, 10.015806198120117, 11.293403625488281, 12.571001052856445, 13.848599433898926, 15.126197814941406, 16.40379524230957, 17.681392669677734, 18.95899200439453, 20.236589431762695, 21.51418685913086, 22.791784286499023, 24.069381713867188, 25.346981048583984, 26.62457847595215, 27.902175903320312, 29.17977523803711, 30.457372665405273, 31.734970092773438, 33.012569427490234, 34.290164947509766, 35.56776428222656, 36.845359802246094, 38.12295913696289, 39.40055847167969, 40.67815399169922, 41.955753326416016]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 5.0, 13.0, 12.0, 7.0, 16.0, 17.0, 23.0, 23.0, 33.0, 34.0, 37.0, 37.0, 37.0, 37.0, 32.0, 41.0, 42.0, 55.0, 40.0, 51.0, 52.0, 48.0, 47.0, 46.0, 37.0, 31.0, 28.0, 23.0, 18.0, 10.0, 16.0, 7.0, 12.0, 11.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.9063606262207, -50.256919860839844, -48.607479095458984, -46.958038330078125, -45.30859375, -43.65915298461914, -42.00971221923828, -40.36027145385742, -38.71083068847656, -37.0613899230957, -35.411949157714844, -33.76250457763672, -32.11306381225586, -30.463623046875, -28.81418228149414, -27.16474151611328, -25.515296936035156, -23.865856170654297, -22.216413497924805, -20.566972732543945, -18.917530059814453, -17.268089294433594, -15.618648529052734, -13.969206809997559, -12.319765090942383, -10.670323371887207, -9.020881652832031, -7.371440887451172, -5.721999168395996, -4.07255744934082, -2.423116683959961, -0.7736749649047852, 0.8757667541503906, 2.5252082347869873, 4.174649715423584, 5.824090957641602, 7.473532676696777, 9.122974395751953, 10.772415161132812, 12.421856880187988, 14.071298599243164, 15.72074031829834, 17.370182037353516, 19.019622802734375, 20.669063568115234, 22.318506240844727, 23.967947006225586, 25.617389678955078, 27.266830444335938, 28.916271209716797, 30.56571388244629, 32.21515655517578, 33.86459732055664, 35.5140380859375, 37.16347885131836, 38.81291961669922, 40.462364196777344, 42.1118049621582, 43.76124572753906, 45.41069030761719, 47.06013107299805, 48.709571838378906, 50.359012603759766, 52.008453369140625, 53.657894134521484]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 9.0, 8.0, 18.0, 18.0, 23.0, 42.0, 64.0, 104.0, 139.0, 236.0, 339.0, 548.0, 891.0, 1347.0, 2051.0, 3440.0, 5138.0, 8228.0, 12404.0, 19038.0, 27997.0, 40400.0, 55774.0, 73526.0, 90061.0, 103682.0, 110104.0, 107041.0, 96813.0, 81432.0, 63275.0, 46753.0, 33089.0, 22525.0, 15068.0, 9688.0, 6181.0, 3986.0, 2578.0, 1673.0, 989.0, 629.0, 437.0, 276.0, 174.0, 119.0, 67.0, 47.0, 35.0, 29.0, 14.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.53125, -26.604736328125, -25.67822265625, -24.751708984375, -23.8251953125, -22.898681640625, -21.97216796875, -21.045654296875, -20.119140625, -19.192626953125, -18.26611328125, -17.339599609375, -16.4130859375, -15.486572265625, -14.56005859375, -13.633544921875, -12.70703125, -11.780517578125, -10.85400390625, -9.927490234375, -9.0009765625, -8.074462890625, -7.14794921875, -6.221435546875, -5.294921875, -4.368408203125, -3.44189453125, -2.515380859375, -1.5888671875, -0.662353515625, 0.26416015625, 1.190673828125, 2.1171875, 3.043701171875, 3.97021484375, 4.896728515625, 5.8232421875, 6.749755859375, 7.67626953125, 8.602783203125, 9.529296875, 10.455810546875, 11.38232421875, 12.308837890625, 13.2353515625, 14.161865234375, 15.08837890625, 16.014892578125, 16.94140625, 17.867919921875, 18.79443359375, 19.720947265625, 20.6474609375, 21.573974609375, 22.50048828125, 23.427001953125, 24.353515625, 25.280029296875, 26.20654296875, 27.133056640625, 28.0595703125, 28.986083984375, 29.91259765625, 30.839111328125, 31.765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 12.0, 13.0, 5.0, 15.0, 16.0, 25.0, 24.0, 32.0, 36.0, 32.0, 45.0, 32.0, 41.0, 28.0, 45.0, 39.0, 56.0, 39.0, 49.0, 55.0, 39.0, 57.0, 44.0, 36.0, 31.0, 28.0, 23.0, 18.0, 10.0, 15.0, 6.0, 14.0, 10.0, 12.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.712890625, -47.11328125, -45.513671875, -43.9140625, -42.314453125, -40.71484375, -39.115234375, -37.515625, -35.916015625, -34.31640625, -32.716796875, -31.1171875, -29.517578125, -27.91796875, -26.318359375, -24.71875, -23.119140625, -21.51953125, -19.919921875, -18.3203125, -16.720703125, -15.12109375, -13.521484375, -11.921875, -10.322265625, -8.72265625, -7.123046875, -5.5234375, -3.923828125, -2.32421875, -0.724609375, 0.875, 2.474609375, 4.07421875, 5.673828125, 7.2734375, 8.873046875, 10.47265625, 12.072265625, 13.671875, 15.271484375, 16.87109375, 18.470703125, 20.0703125, 21.669921875, 23.26953125, 24.869140625, 26.46875, 28.068359375, 29.66796875, 31.267578125, 32.8671875, 34.466796875, 36.06640625, 37.666015625, 39.265625, 40.865234375, 42.46484375, 44.064453125, 45.6640625, 47.263671875, 48.86328125, 50.462890625, 52.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 16.0, 25.0, 33.0, 38.0, 83.0, 131.0, 205.0, 387.0, 538.0, 881.0, 1374.0, 2205.0, 3594.0, 5814.0, 9143.0, 14201.0, 21988.0, 32402.0, 46739.0, 65241.0, 83859.0, 101596.0, 112724.0, 114552.0, 106282.0, 90469.0, 71968.0, 53434.0, 37347.0, 25328.0, 16750.0, 10790.0, 6893.0, 4365.0, 2719.0, 1722.0, 1015.0, 640.0, 405.0, 265.0, 135.0, 100.0, 70.0, 33.0, 26.0, 15.0, 9.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-34.34375, -33.339111328125, -32.33447265625, -31.329833984375, -30.3251953125, -29.320556640625, -28.31591796875, -27.311279296875, -26.306640625, -25.302001953125, -24.29736328125, -23.292724609375, -22.2880859375, -21.283447265625, -20.27880859375, -19.274169921875, -18.26953125, -17.264892578125, -16.26025390625, -15.255615234375, -14.2509765625, -13.246337890625, -12.24169921875, -11.237060546875, -10.232421875, -9.227783203125, -8.22314453125, -7.218505859375, -6.2138671875, -5.209228515625, -4.20458984375, -3.199951171875, -2.1953125, -1.190673828125, -0.18603515625, 0.818603515625, 1.8232421875, 2.827880859375, 3.83251953125, 4.837158203125, 5.841796875, 6.846435546875, 7.85107421875, 8.855712890625, 9.8603515625, 10.864990234375, 11.86962890625, 12.874267578125, 13.87890625, 14.883544921875, 15.88818359375, 16.892822265625, 17.8974609375, 18.902099609375, 19.90673828125, 20.911376953125, 21.916015625, 22.920654296875, 23.92529296875, 24.929931640625, 25.9345703125, 26.939208984375, 27.94384765625, 28.948486328125, 29.953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 9.0, 7.0, 10.0, 7.0, 11.0, 11.0, 19.0, 18.0, 19.0, 16.0, 19.0, 30.0, 27.0, 25.0, 26.0, 32.0, 31.0, 31.0, 38.0, 20.0, 35.0, 31.0, 32.0, 49.0, 35.0, 38.0, 36.0, 29.0, 25.0, 36.0, 17.0, 25.0, 14.0, 20.0, 18.0, 24.0, 16.0, 11.0, 14.0, 15.0, 15.0, 5.0, 5.0, 8.0, 4.0, 8.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0], "bins": [-26.125, -25.323974609375, -24.52294921875, -23.721923828125, -22.9208984375, -22.119873046875, -21.31884765625, -20.517822265625, -19.716796875, -18.915771484375, -18.11474609375, -17.313720703125, -16.5126953125, -15.711669921875, -14.91064453125, -14.109619140625, -13.30859375, -12.507568359375, -11.70654296875, -10.905517578125, -10.1044921875, -9.303466796875, -8.50244140625, -7.701416015625, -6.900390625, -6.099365234375, -5.29833984375, -4.497314453125, -3.6962890625, -2.895263671875, -2.09423828125, -1.293212890625, -0.4921875, 0.308837890625, 1.10986328125, 1.910888671875, 2.7119140625, 3.512939453125, 4.31396484375, 5.114990234375, 5.916015625, 6.717041015625, 7.51806640625, 8.319091796875, 9.1201171875, 9.921142578125, 10.72216796875, 11.523193359375, 12.32421875, 13.125244140625, 13.92626953125, 14.727294921875, 15.5283203125, 16.329345703125, 17.13037109375, 17.931396484375, 18.732421875, 19.533447265625, 20.33447265625, 21.135498046875, 21.9365234375, 22.737548828125, 23.53857421875, 24.339599609375, 25.140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 12.0, 10.0, 14.0, 24.0, 38.0, 45.0, 60.0, 76.0, 137.0, 205.0, 334.0, 556.0, 863.0, 1515.0, 2992.0, 7515.0, 25894.0, 119686.0, 384505.0, 362283.0, 105371.0, 23100.0, 6781.0, 2851.0, 1417.0, 797.0, 546.0, 309.0, 196.0, 140.0, 89.0, 57.0, 39.0, 28.0, 14.0, 16.0, 7.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.84375, -46.39208984375, -44.9404296875, -43.48876953125, -42.037109375, -40.58544921875, -39.1337890625, -37.68212890625, -36.23046875, -34.77880859375, -33.3271484375, -31.87548828125, -30.423828125, -28.97216796875, -27.5205078125, -26.06884765625, -24.6171875, -23.16552734375, -21.7138671875, -20.26220703125, -18.810546875, -17.35888671875, -15.9072265625, -14.45556640625, -13.00390625, -11.55224609375, -10.1005859375, -8.64892578125, -7.197265625, -5.74560546875, -4.2939453125, -2.84228515625, -1.390625, 0.06103515625, 1.5126953125, 2.96435546875, 4.416015625, 5.86767578125, 7.3193359375, 8.77099609375, 10.22265625, 11.67431640625, 13.1259765625, 14.57763671875, 16.029296875, 17.48095703125, 18.9326171875, 20.38427734375, 21.8359375, 23.28759765625, 24.7392578125, 26.19091796875, 27.642578125, 29.09423828125, 30.5458984375, 31.99755859375, 33.44921875, 34.90087890625, 36.3525390625, 37.80419921875, 39.255859375, 40.70751953125, 42.1591796875, 43.61083984375, 45.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 10.0, 12.0, 17.0, 19.0, 19.0, 48.0, 66.0, 82.0, 94.0, 100.0, 110.0, 104.0, 80.0, 69.0, 60.0, 40.0, 23.0, 23.0, 16.0, 6.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034389495849609375, -0.00334891676902771, -0.0032588839530944824, -0.003168851137161255, -0.0030788183212280273, -0.0029887855052948, -0.0028987526893615723, -0.0028087198734283447, -0.002718687057495117, -0.0026286542415618896, -0.002538621425628662, -0.0024485886096954346, -0.002358555793762207, -0.0022685229778289795, -0.002178490161895752, -0.0020884573459625244, -0.001998424530029297, -0.0019083917140960693, -0.0018183588981628418, -0.0017283260822296143, -0.0016382932662963867, -0.0015482604503631592, -0.0014582276344299316, -0.001368194818496704, -0.0012781620025634766, -0.001188129186630249, -0.0010980963706970215, -0.001008063554763794, -0.0009180307388305664, -0.0008279979228973389, -0.0007379651069641113, -0.0006479322910308838, -0.0005578994750976562, -0.0004678666591644287, -0.00037783384323120117, -0.00028780102729797363, -0.0001977682113647461, -0.00010773539543151855, -1.7702579498291016e-05, 7.233023643493652e-05, 0.00016236305236816406, 0.0002523958683013916, 0.00034242868423461914, 0.0004324615001678467, 0.0005224943161010742, 0.0006125271320343018, 0.0007025599479675293, 0.0007925927639007568, 0.0008826255798339844, 0.0009726583957672119, 0.0010626912117004395, 0.001152724027633667, 0.0012427568435668945, 0.001332789659500122, 0.0014228224754333496, 0.0015128552913665771, 0.0016028881072998047, 0.0016929209232330322, 0.0017829537391662598, 0.0018729865550994873, 0.001963019371032715, 0.0020530521869659424, 0.00214308500289917, 0.0022331178188323975, 0.002323150634765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 12.0, 16.0, 23.0, 25.0, 38.0, 49.0, 61.0, 112.0, 146.0, 205.0, 300.0, 493.0, 738.0, 1188.0, 1937.0, 3303.0, 5747.0, 11063.0, 21988.0, 46836.0, 95317.0, 165796.0, 220174.0, 202028.0, 132307.0, 69364.0, 33532.0, 16448.0, 8011.0, 4479.0, 2475.0, 1534.0, 965.0, 579.0, 405.0, 274.0, 192.0, 112.0, 74.0, 58.0, 34.0, 35.0, 22.0, 14.0, 15.0, 8.0, 7.0, 1.0, 3.0, 3.0, 3.0], "bins": [-26.0, -25.273193359375, -24.54638671875, -23.819580078125, -23.0927734375, -22.365966796875, -21.63916015625, -20.912353515625, -20.185546875, -19.458740234375, -18.73193359375, -18.005126953125, -17.2783203125, -16.551513671875, -15.82470703125, -15.097900390625, -14.37109375, -13.644287109375, -12.91748046875, -12.190673828125, -11.4638671875, -10.737060546875, -10.01025390625, -9.283447265625, -8.556640625, -7.829833984375, -7.10302734375, -6.376220703125, -5.6494140625, -4.922607421875, -4.19580078125, -3.468994140625, -2.7421875, -2.015380859375, -1.28857421875, -0.561767578125, 0.1650390625, 0.891845703125, 1.61865234375, 2.345458984375, 3.072265625, 3.799072265625, 4.52587890625, 5.252685546875, 5.9794921875, 6.706298828125, 7.43310546875, 8.159912109375, 8.88671875, 9.613525390625, 10.34033203125, 11.067138671875, 11.7939453125, 12.520751953125, 13.24755859375, 13.974365234375, 14.701171875, 15.427978515625, 16.15478515625, 16.881591796875, 17.6083984375, 18.335205078125, 19.06201171875, 19.788818359375, 20.515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 14.0, 14.0, 17.0, 20.0, 30.0, 36.0, 47.0, 41.0, 71.0, 81.0, 87.0, 88.0, 71.0, 66.0, 55.0, 49.0, 47.0, 39.0, 26.0, 20.0, 23.0, 8.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.675537109375, -9.33544921875, -8.995361328125, -8.6552734375, -8.315185546875, -7.97509765625, -7.635009765625, -7.294921875, -6.954833984375, -6.61474609375, -6.274658203125, -5.9345703125, -5.594482421875, -5.25439453125, -4.914306640625, -4.57421875, -4.234130859375, -3.89404296875, -3.553955078125, -3.2138671875, -2.873779296875, -2.53369140625, -2.193603515625, -1.853515625, -1.513427734375, -1.17333984375, -0.833251953125, -0.4931640625, -0.153076171875, 0.18701171875, 0.527099609375, 0.8671875, 1.207275390625, 1.54736328125, 1.887451171875, 2.2275390625, 2.567626953125, 2.90771484375, 3.247802734375, 3.587890625, 3.927978515625, 4.26806640625, 4.608154296875, 4.9482421875, 5.288330078125, 5.62841796875, 5.968505859375, 6.30859375, 6.648681640625, 6.98876953125, 7.328857421875, 7.6689453125, 8.009033203125, 8.34912109375, 8.689208984375, 9.029296875, 9.369384765625, 9.70947265625, 10.049560546875, 10.3896484375, 10.729736328125, 11.06982421875, 11.409912109375, 11.75]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 13.0, 10.0, 5.0, 8.0, 12.0, 13.0, 19.0, 17.0, 25.0, 24.0, 36.0, 30.0, 36.0, 39.0, 34.0, 45.0, 62.0, 58.0, 45.0, 36.0, 41.0, 51.0, 49.0, 33.0, 34.0, 30.0, 31.0, 24.0, 19.0, 22.0, 17.0, 19.0, 16.0, 10.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.9792366027832, -44.65081787109375, -43.32240295410156, -41.99398422241211, -40.66556930541992, -39.33715057373047, -38.00873565673828, -36.68031692504883, -35.351898193359375, -34.02347946166992, -32.695064544677734, -31.366647720336914, -30.038230895996094, -28.70981216430664, -27.38139533996582, -26.052978515625, -24.724563598632812, -23.396146774291992, -22.067729949951172, -20.73931312561035, -19.41089630126953, -18.082477569580078, -16.754060745239258, -15.425643920898438, -14.097227096557617, -12.768810272216797, -11.440393447875977, -10.11197566986084, -8.78355884552002, -7.455142021179199, -6.126724720001221, -4.798307418823242, -3.4698944091796875, -2.141477346420288, -0.8130602836608887, 0.5153567790985107, 1.8437738418579102, 3.1721906661987305, 4.500607967376709, 5.8290252685546875, 7.157442092895508, 8.485858917236328, 9.814275741577148, 11.142693519592285, 12.471110343933105, 13.799527168273926, 15.127944946289062, 16.456361770629883, 17.784778594970703, 19.113195419311523, 20.441612243652344, 21.770029067993164, 23.098445892333984, 24.426864624023438, 25.755281448364258, 27.083698272705078, 28.4121150970459, 29.74053192138672, 31.06894874572754, 32.39736557006836, 33.72578430175781, 35.05419921875, 36.38261795043945, 37.711036682128906, 39.039451599121094]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 8.0, 14.0, 17.0, 18.0, 24.0, 25.0, 21.0, 30.0, 26.0, 38.0, 33.0, 36.0, 49.0, 42.0, 39.0, 48.0, 52.0, 55.0, 52.0, 34.0, 51.0, 48.0, 29.0, 28.0, 27.0, 24.0, 24.0, 11.0, 22.0, 19.0, 9.0, 9.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.95375061035156, -50.256561279296875, -48.55937576293945, -46.862186431884766, -45.165000915527344, -43.467811584472656, -41.77062225341797, -40.07343673706055, -38.376251220703125, -36.67906188964844, -34.981876373291016, -33.28468704223633, -31.587501525878906, -29.89031219482422, -28.193124771118164, -26.49593734741211, -24.798748016357422, -23.101560592651367, -21.404373168945312, -19.707183837890625, -18.009998321533203, -16.312808990478516, -14.615621566772461, -12.918434143066406, -11.221246719360352, -9.524059295654297, -7.826871395111084, -6.129683494567871, -4.432496070861816, -2.7353086471557617, -1.0381202697753906, 0.6590671539306641, 2.356250762939453, 4.053438186645508, 5.750626087188721, 7.447813987731934, 9.145001411437988, 10.842188835144043, 12.539377212524414, 14.236564636230469, 15.933752059936523, 17.630939483642578, 19.328126907348633, 21.025314331054688, 22.722503662109375, 24.419689178466797, 26.116878509521484, 27.81406593322754, 29.511253356933594, 31.20844078063965, 32.9056282043457, 34.60281753540039, 36.30000305175781, 37.9971923828125, 39.69438171386719, 41.39156723022461, 43.08875274658203, 44.78594207763672, 46.48312759399414, 48.18031692504883, 49.87750244140625, 51.57469177246094, 53.271881103515625, 54.96906661987305, 56.666255950927734]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 13.0, 21.0, 33.0, 50.0, 89.0, 166.0, 283.0, 465.0, 796.0, 1311.0, 2245.0, 3533.0, 5959.0, 9611.0, 15625.0, 25184.0, 39332.0, 61390.0, 92810.0, 135670.0, 193367.0, 262675.0, 334221.0, 399983.0, 439590.0, 446128.0, 415585.0, 357659.0, 286493.0, 215427.0, 153287.0, 105299.0, 69983.0, 45314.0, 28710.0, 17785.0, 11075.0, 6764.0, 4078.0, 2504.0, 1462.0, 902.0, 544.0, 342.0, 195.0, 130.0, 61.0, 53.0, 30.0, 19.0, 13.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-30.125, -29.188232421875, -28.25146484375, -27.314697265625, -26.3779296875, -25.441162109375, -24.50439453125, -23.567626953125, -22.630859375, -21.694091796875, -20.75732421875, -19.820556640625, -18.8837890625, -17.947021484375, -17.01025390625, -16.073486328125, -15.13671875, -14.199951171875, -13.26318359375, -12.326416015625, -11.3896484375, -10.452880859375, -9.51611328125, -8.579345703125, -7.642578125, -6.705810546875, -5.76904296875, -4.832275390625, -3.8955078125, -2.958740234375, -2.02197265625, -1.085205078125, -0.1484375, 0.788330078125, 1.72509765625, 2.661865234375, 3.5986328125, 4.535400390625, 5.47216796875, 6.408935546875, 7.345703125, 8.282470703125, 9.21923828125, 10.156005859375, 11.0927734375, 12.029541015625, 12.96630859375, 13.903076171875, 14.83984375, 15.776611328125, 16.71337890625, 17.650146484375, 18.5869140625, 19.523681640625, 20.46044921875, 21.397216796875, 22.333984375, 23.270751953125, 24.20751953125, 25.144287109375, 26.0810546875, 27.017822265625, 27.95458984375, 28.891357421875, 29.828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 9.0, 11.0, 12.0, 21.0, 17.0, 25.0, 23.0, 19.0, 30.0, 29.0, 39.0, 35.0, 45.0, 40.0, 42.0, 43.0, 47.0, 52.0, 56.0, 48.0, 36.0, 57.0, 38.0, 28.0, 26.0, 28.0, 21.0, 27.0, 16.0, 16.0, 17.0, 11.0, 8.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.28125, -40.89892578125, -39.5166015625, -38.13427734375, -36.751953125, -35.36962890625, -33.9873046875, -32.60498046875, -31.22265625, -29.84033203125, -28.4580078125, -27.07568359375, -25.693359375, -24.31103515625, -22.9287109375, -21.54638671875, -20.1640625, -18.78173828125, -17.3994140625, -16.01708984375, -14.634765625, -13.25244140625, -11.8701171875, -10.48779296875, -9.10546875, -7.72314453125, -6.3408203125, -4.95849609375, -3.576171875, -2.19384765625, -0.8115234375, 0.57080078125, 1.953125, 3.33544921875, 4.7177734375, 6.10009765625, 7.482421875, 8.86474609375, 10.2470703125, 11.62939453125, 13.01171875, 14.39404296875, 15.7763671875, 17.15869140625, 18.541015625, 19.92333984375, 21.3056640625, 22.68798828125, 24.0703125, 25.45263671875, 26.8349609375, 28.21728515625, 29.599609375, 30.98193359375, 32.3642578125, 33.74658203125, 35.12890625, 36.51123046875, 37.8935546875, 39.27587890625, 40.658203125, 42.04052734375, 43.4228515625, 44.80517578125, 46.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 11.0, 11.0, 22.0, 24.0, 57.0, 75.0, 125.0, 224.0, 347.0, 613.0, 1028.0, 1535.0, 2481.0, 4099.0, 6431.0, 10164.0, 15605.0, 24024.0, 35712.0, 52023.0, 73745.0, 102152.0, 137007.0, 178057.0, 220889.0, 267006.0, 305556.0, 335389.0, 350608.0, 349591.0, 330822.0, 301239.0, 257975.0, 215179.0, 171446.0, 130779.0, 97196.0, 70228.0, 48879.0, 33312.0, 22475.0, 14519.0, 9602.0, 6185.0, 3802.0, 2449.0, 1417.0, 877.0, 512.0, 340.0, 191.0, 97.0, 66.0, 38.0, 25.0, 11.0, 11.0, 6.0, 5.0, 1.0, 2.0], "bins": [-25.109375, -24.32275390625, -23.5361328125, -22.74951171875, -21.962890625, -21.17626953125, -20.3896484375, -19.60302734375, -18.81640625, -18.02978515625, -17.2431640625, -16.45654296875, -15.669921875, -14.88330078125, -14.0966796875, -13.31005859375, -12.5234375, -11.73681640625, -10.9501953125, -10.16357421875, -9.376953125, -8.59033203125, -7.8037109375, -7.01708984375, -6.23046875, -5.44384765625, -4.6572265625, -3.87060546875, -3.083984375, -2.29736328125, -1.5107421875, -0.72412109375, 0.0625, 0.84912109375, 1.6357421875, 2.42236328125, 3.208984375, 3.99560546875, 4.7822265625, 5.56884765625, 6.35546875, 7.14208984375, 7.9287109375, 8.71533203125, 9.501953125, 10.28857421875, 11.0751953125, 11.86181640625, 12.6484375, 13.43505859375, 14.2216796875, 15.00830078125, 15.794921875, 16.58154296875, 17.3681640625, 18.15478515625, 18.94140625, 19.72802734375, 20.5146484375, 21.30126953125, 22.087890625, 22.87451171875, 23.6611328125, 24.44775390625, 25.234375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 9.0, 17.0, 9.0, 20.0, 19.0, 39.0, 42.0, 59.0, 56.0, 76.0, 99.0, 114.0, 131.0, 143.0, 140.0, 178.0, 186.0, 181.0, 200.0, 193.0, 200.0, 210.0, 185.0, 191.0, 177.0, 172.0, 124.0, 151.0, 110.0, 101.0, 114.0, 65.0, 66.0, 54.0, 55.0, 44.0, 27.0, 19.0, 18.0, 22.0, 18.0, 8.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-17.4375, -16.90185546875, -16.3662109375, -15.83056640625, -15.294921875, -14.75927734375, -14.2236328125, -13.68798828125, -13.15234375, -12.61669921875, -12.0810546875, -11.54541015625, -11.009765625, -10.47412109375, -9.9384765625, -9.40283203125, -8.8671875, -8.33154296875, -7.7958984375, -7.26025390625, -6.724609375, -6.18896484375, -5.6533203125, -5.11767578125, -4.58203125, -4.04638671875, -3.5107421875, -2.97509765625, -2.439453125, -1.90380859375, -1.3681640625, -0.83251953125, -0.296875, 0.23876953125, 0.7744140625, 1.31005859375, 1.845703125, 2.38134765625, 2.9169921875, 3.45263671875, 3.98828125, 4.52392578125, 5.0595703125, 5.59521484375, 6.130859375, 6.66650390625, 7.2021484375, 7.73779296875, 8.2734375, 8.80908203125, 9.3447265625, 9.88037109375, 10.416015625, 10.95166015625, 11.4873046875, 12.02294921875, 12.55859375, 13.09423828125, 13.6298828125, 14.16552734375, 14.701171875, 15.23681640625, 15.7724609375, 16.30810546875, 16.84375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 6.0, 7.0, 13.0, 7.0, 6.0, 12.0, 12.0, 19.0, 27.0, 22.0, 18.0, 26.0, 24.0, 30.0, 31.0, 52.0, 41.0, 38.0, 37.0, 36.0, 48.0, 44.0, 52.0, 45.0, 43.0, 40.0, 48.0, 34.0, 16.0, 26.0, 27.0, 16.0, 11.0, 21.0, 10.0, 17.0, 2.0, 3.0, 11.0, 3.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.246639251708984, -41.012481689453125, -39.778324127197266, -38.544166564941406, -37.31000900268555, -36.07585144042969, -34.84169387817383, -33.60753631591797, -32.373382568359375, -31.139225006103516, -29.905067443847656, -28.670909881591797, -27.436752319335938, -26.202594757080078, -24.96843910217285, -23.734281539916992, -22.5001220703125, -21.26596450805664, -20.03180694580078, -18.797649383544922, -17.563491821289062, -16.329334259033203, -15.095178604125977, -13.861021041870117, -12.626863479614258, -11.392705917358398, -10.158548355102539, -8.924391746520996, -7.690234184265137, -6.456076622009277, -5.221919536590576, -3.987762451171875, -2.7536087036132812, -1.519451379776001, -0.2852940559387207, 0.9488632678985596, 2.18302059173584, 3.417178153991699, 4.6513352394104, 5.885492324829102, 7.119649887084961, 8.35380744934082, 9.58796501159668, 10.822121620178223, 12.056279182434082, 13.290436744689941, 14.524593353271484, 15.758750915527344, 16.992908477783203, 18.227066040039062, 19.461223602294922, 20.69538116455078, 21.92953872680664, 23.1636962890625, 24.397851943969727, 25.632009506225586, 26.866167068481445, 28.100324630737305, 29.334482192993164, 30.568639755249023, 31.80279541015625, 33.03695297241211, 34.27111053466797, 35.50526809692383, 36.73942565917969]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 3.0, 0.0, 1.0, 11.0, 3.0, 6.0, 8.0, 4.0, 19.0, 23.0, 12.0, 18.0, 22.0, 27.0, 23.0, 32.0, 39.0, 40.0, 40.0, 37.0, 42.0, 44.0, 35.0, 46.0, 49.0, 43.0, 48.0, 33.0, 48.0, 35.0, 32.0, 34.0, 27.0, 17.0, 19.0, 21.0, 11.0, 14.0, 11.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.74911880493164, -44.217613220214844, -42.68610763549805, -41.15460205078125, -39.62309646606445, -38.091590881347656, -36.560081481933594, -35.02857971191406, -33.4970703125, -31.965564727783203, -30.434059143066406, -28.90255355834961, -27.371047973632812, -25.839542388916016, -24.308034896850586, -22.77652931213379, -21.245025634765625, -19.713520050048828, -18.18201446533203, -16.650508880615234, -15.119002342224121, -13.587496757507324, -12.055990219116211, -10.524484634399414, -8.992979049682617, -7.46147346496582, -5.929967403411865, -4.39846134185791, -2.8669557571411133, -1.3354501724243164, 0.19605636596679688, 1.7275619506835938, 3.2590675354003906, 4.7905731201171875, 6.322079181671143, 7.853585243225098, 9.385090827941895, 10.916596412658691, 12.448102951049805, 13.979608535766602, 15.511114120483398, 17.042619705200195, 18.574125289916992, 20.105632781982422, 21.63713836669922, 23.168643951416016, 24.700149536132812, 26.23165512084961, 27.763160705566406, 29.294666290283203, 30.826171875, 32.3576774597168, 33.889183044433594, 35.42068862915039, 36.95219421386719, 38.48370361328125, 40.01520538330078, 41.54671096801758, 43.078216552734375, 44.60972213745117, 46.14122772216797, 47.672733306884766, 49.20423889160156, 50.735748291015625, 52.26725387573242]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 5.0, 7.0, 11.0, 11.0, 23.0, 26.0, 39.0, 41.0, 72.0, 84.0, 120.0, 172.0, 203.0, 298.0, 464.0, 718.0, 971.0, 1577.0, 2670.0, 5070.0, 10146.0, 21356.0, 48075.0, 111286.0, 239890.0, 301392.0, 167901.0, 72329.0, 31865.0, 14732.0, 7168.0, 3717.0, 2165.0, 1242.0, 852.0, 530.0, 380.0, 270.0, 193.0, 136.0, 99.0, 61.0, 47.0, 44.0, 28.0, 16.0, 20.0, 10.0, 10.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.8046875, -15.2989501953125, -14.793212890625, -14.2874755859375, -13.78173828125, -13.2760009765625, -12.770263671875, -12.2645263671875, -11.7587890625, -11.2530517578125, -10.747314453125, -10.2415771484375, -9.73583984375, -9.2301025390625, -8.724365234375, -8.2186279296875, -7.712890625, -7.2071533203125, -6.701416015625, -6.1956787109375, -5.68994140625, -5.1842041015625, -4.678466796875, -4.1727294921875, -3.6669921875, -3.1612548828125, -2.655517578125, -2.1497802734375, -1.64404296875, -1.1383056640625, -0.632568359375, -0.1268310546875, 0.37890625, 0.8846435546875, 1.390380859375, 1.8961181640625, 2.40185546875, 2.9075927734375, 3.413330078125, 3.9190673828125, 4.4248046875, 4.9305419921875, 5.436279296875, 5.9420166015625, 6.44775390625, 6.9534912109375, 7.459228515625, 7.9649658203125, 8.470703125, 8.9764404296875, 9.482177734375, 9.9879150390625, 10.49365234375, 10.9993896484375, 11.505126953125, 12.0108642578125, 12.5166015625, 13.0223388671875, 13.528076171875, 14.0338134765625, 14.53955078125, 15.0452880859375, 15.551025390625, 16.0567626953125, 16.5625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 10.0, 3.0, 7.0, 6.0, 5.0, 18.0, 24.0, 11.0, 18.0, 24.0, 24.0, 24.0, 34.0, 35.0, 42.0, 40.0, 36.0, 45.0, 40.0, 38.0, 45.0, 50.0, 40.0, 51.0, 35.0, 41.0, 39.0, 31.0, 36.0, 27.0, 15.0, 21.0, 21.0, 11.0, 13.0, 9.0, 13.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.53125, -44.00634765625, -42.4814453125, -40.95654296875, -39.431640625, -37.90673828125, -36.3818359375, -34.85693359375, -33.33203125, -31.80712890625, -30.2822265625, -28.75732421875, -27.232421875, -25.70751953125, -24.1826171875, -22.65771484375, -21.1328125, -19.60791015625, -18.0830078125, -16.55810546875, -15.033203125, -13.50830078125, -11.9833984375, -10.45849609375, -8.93359375, -7.40869140625, -5.8837890625, -4.35888671875, -2.833984375, -1.30908203125, 0.2158203125, 1.74072265625, 3.265625, 4.79052734375, 6.3154296875, 7.84033203125, 9.365234375, 10.89013671875, 12.4150390625, 13.93994140625, 15.46484375, 16.98974609375, 18.5146484375, 20.03955078125, 21.564453125, 23.08935546875, 24.6142578125, 26.13916015625, 27.6640625, 29.18896484375, 30.7138671875, 32.23876953125, 33.763671875, 35.28857421875, 36.8134765625, 38.33837890625, 39.86328125, 41.38818359375, 42.9130859375, 44.43798828125, 45.962890625, 47.48779296875, 49.0126953125, 50.53759765625, 52.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 15.0, 19.0, 17.0, 33.0, 46.0, 62.0, 105.0, 158.0, 241.0, 390.0, 661.0, 1064.0, 1961.0, 3727.0, 7435.0, 17198.0, 44986.0, 138305.0, 424321.0, 275495.0, 80546.0, 28280.0, 11518.0, 5365.0, 2793.0, 1459.0, 901.0, 480.0, 294.0, 240.0, 131.0, 84.0, 47.0, 41.0, 27.0, 16.0, 20.0, 16.0, 5.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.0859375, -14.6256103515625, -14.165283203125, -13.7049560546875, -13.24462890625, -12.7843017578125, -12.323974609375, -11.8636474609375, -11.4033203125, -10.9429931640625, -10.482666015625, -10.0223388671875, -9.56201171875, -9.1016845703125, -8.641357421875, -8.1810302734375, -7.720703125, -7.2603759765625, -6.800048828125, -6.3397216796875, -5.87939453125, -5.4190673828125, -4.958740234375, -4.4984130859375, -4.0380859375, -3.5777587890625, -3.117431640625, -2.6571044921875, -2.19677734375, -1.7364501953125, -1.276123046875, -0.8157958984375, -0.35546875, 0.1048583984375, 0.565185546875, 1.0255126953125, 1.48583984375, 1.9461669921875, 2.406494140625, 2.8668212890625, 3.3271484375, 3.7874755859375, 4.247802734375, 4.7081298828125, 5.16845703125, 5.6287841796875, 6.089111328125, 6.5494384765625, 7.009765625, 7.4700927734375, 7.930419921875, 8.3907470703125, 8.85107421875, 9.3114013671875, 9.771728515625, 10.2320556640625, 10.6923828125, 11.1527099609375, 11.613037109375, 12.0733642578125, 12.53369140625, 12.9940185546875, 13.454345703125, 13.9146728515625, 14.375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 5.0, 3.0, 6.0, 11.0, 11.0, 23.0, 20.0, 13.0, 36.0, 29.0, 25.0, 40.0, 31.0, 35.0, 46.0, 60.0, 40.0, 34.0, 44.0, 45.0, 37.0, 43.0, 41.0, 46.0, 50.0, 39.0, 30.0, 30.0, 26.0, 12.0, 18.0, 13.0, 13.0, 10.0, 6.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.28125, -37.1875, -36.09375, -35.0, -33.90625, -32.8125, -31.71875, -30.625, -29.53125, -28.4375, -27.34375, -26.25, -25.15625, -24.0625, -22.96875, -21.875, -20.78125, -19.6875, -18.59375, -17.5, -16.40625, -15.3125, -14.21875, -13.125, -12.03125, -10.9375, -9.84375, -8.75, -7.65625, -6.5625, -5.46875, -4.375, -3.28125, -2.1875, -1.09375, 0.0, 1.09375, 2.1875, 3.28125, 4.375, 5.46875, 6.5625, 7.65625, 8.75, 9.84375, 10.9375, 12.03125, 13.125, 14.21875, 15.3125, 16.40625, 17.5, 18.59375, 19.6875, 20.78125, 21.875, 22.96875, 24.0625, 25.15625, 26.25, 27.34375, 28.4375, 29.53125, 30.625, 31.71875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 17.0, 13.0, 14.0, 24.0, 30.0, 51.0, 52.0, 72.0, 107.0, 168.0, 255.0, 391.0, 523.0, 799.0, 1355.0, 2160.0, 3726.0, 7277.0, 15582.0, 40628.0, 138518.0, 471642.0, 254629.0, 66031.0, 22688.0, 9712.0, 4845.0, 2763.0, 1610.0, 915.0, 646.0, 420.0, 258.0, 166.0, 117.0, 91.0, 80.0, 38.0, 28.0, 26.0, 21.0, 15.0, 10.0, 10.0, 3.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.06640625, -5.8751220703125, -5.683837890625, -5.4925537109375, -5.30126953125, -5.1099853515625, -4.918701171875, -4.7274169921875, -4.5361328125, -4.3448486328125, -4.153564453125, -3.9622802734375, -3.77099609375, -3.5797119140625, -3.388427734375, -3.1971435546875, -3.005859375, -2.8145751953125, -2.623291015625, -2.4320068359375, -2.24072265625, -2.0494384765625, -1.858154296875, -1.6668701171875, -1.4755859375, -1.2843017578125, -1.093017578125, -0.9017333984375, -0.71044921875, -0.5191650390625, -0.327880859375, -0.1365966796875, 0.0546875, 0.2459716796875, 0.437255859375, 0.6285400390625, 0.81982421875, 1.0111083984375, 1.202392578125, 1.3936767578125, 1.5849609375, 1.7762451171875, 1.967529296875, 2.1588134765625, 2.35009765625, 2.5413818359375, 2.732666015625, 2.9239501953125, 3.115234375, 3.3065185546875, 3.497802734375, 3.6890869140625, 3.88037109375, 4.0716552734375, 4.262939453125, 4.4542236328125, 4.6455078125, 4.8367919921875, 5.028076171875, 5.2193603515625, 5.41064453125, 5.6019287109375, 5.793212890625, 5.9844970703125, 6.17578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 19.0, 15.0, 13.0, 16.0, 24.0, 27.0, 34.0, 47.0, 57.0, 78.0, 78.0, 56.0, 66.0, 67.0, 65.0, 64.0, 43.0, 41.0, 26.0, 23.0, 23.0, 17.0, 14.0, 14.0, 9.0, 11.0, 9.0, 10.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004630088806152344, -0.0004467815160751343, -0.0004305541515350342, -0.0004143267869949341, -0.000398099422454834, -0.0003818720579147339, -0.0003656446933746338, -0.0003494173288345337, -0.0003331899642944336, -0.0003169625997543335, -0.0003007352352142334, -0.0002845078706741333, -0.0002682805061340332, -0.0002520531415939331, -0.000235825777053833, -0.0002195984125137329, -0.0002033710479736328, -0.00018714368343353271, -0.00017091631889343262, -0.00015468895435333252, -0.00013846158981323242, -0.00012223422527313232, -0.00010600686073303223, -8.977949619293213e-05, -7.355213165283203e-05, -5.7324767112731934e-05, -4.1097402572631836e-05, -2.4870038032531738e-05, -8.64267349243164e-06, 7.584691047668457e-06, 2.3812055587768555e-05, 4.003942012786865e-05, 5.626678466796875e-05, 7.249414920806885e-05, 8.872151374816895e-05, 0.00010494887828826904, 0.00012117624282836914, 0.00013740360736846924, 0.00015363097190856934, 0.00016985833644866943, 0.00018608570098876953, 0.00020231306552886963, 0.00021854043006896973, 0.00023476779460906982, 0.0002509951591491699, 0.00026722252368927, 0.0002834498882293701, 0.0002996772527694702, 0.0003159046173095703, 0.0003321319818496704, 0.0003483593463897705, 0.0003645867109298706, 0.0003808140754699707, 0.0003970414400100708, 0.0004132688045501709, 0.000429496169090271, 0.0004457235336303711, 0.0004619508981704712, 0.0004781782627105713, 0.0004944056272506714, 0.0005106329917907715, 0.0005268603563308716, 0.0005430877208709717, 0.0005593150854110718, 0.0005755424499511719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 29.0, 36.0, 48.0, 58.0, 90.0, 130.0, 154.0, 257.0, 351.0, 453.0, 608.0, 838.0, 1194.0, 1678.0, 2537.0, 3903.0, 6416.0, 12417.0, 27682.0, 74037.0, 225394.0, 406132.0, 175455.0, 58419.0, 22774.0, 10437.0, 5762.0, 3500.0, 2280.0, 1461.0, 1117.0, 798.0, 556.0, 439.0, 318.0, 223.0, 149.0, 128.0, 90.0, 70.0, 30.0, 31.0, 19.0, 10.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.7890625, -11.4134521484375, -11.037841796875, -10.6622314453125, -10.28662109375, -9.9110107421875, -9.535400390625, -9.1597900390625, -8.7841796875, -8.4085693359375, -8.032958984375, -7.6573486328125, -7.28173828125, -6.9061279296875, -6.530517578125, -6.1549072265625, -5.779296875, -5.4036865234375, -5.028076171875, -4.6524658203125, -4.27685546875, -3.9012451171875, -3.525634765625, -3.1500244140625, -2.7744140625, -2.3988037109375, -2.023193359375, -1.6475830078125, -1.27197265625, -0.8963623046875, -0.520751953125, -0.1451416015625, 0.23046875, 0.6060791015625, 0.981689453125, 1.3572998046875, 1.73291015625, 2.1085205078125, 2.484130859375, 2.8597412109375, 3.2353515625, 3.6109619140625, 3.986572265625, 4.3621826171875, 4.73779296875, 5.1134033203125, 5.489013671875, 5.8646240234375, 6.240234375, 6.6158447265625, 6.991455078125, 7.3670654296875, 7.74267578125, 8.1182861328125, 8.493896484375, 8.8695068359375, 9.2451171875, 9.6207275390625, 9.996337890625, 10.3719482421875, 10.74755859375, 11.1231689453125, 11.498779296875, 11.8743896484375, 12.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 19.0, 24.0, 31.0, 45.0, 116.0, 138.0, 153.0, 162.0, 110.0, 54.0, 26.0, 29.0, 14.0, 11.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.109375, -8.86016845703125, -8.6109619140625, -8.36175537109375, -8.112548828125, -7.86334228515625, -7.6141357421875, -7.36492919921875, -7.11572265625, -6.86651611328125, -6.6173095703125, -6.36810302734375, -6.118896484375, -5.86968994140625, -5.6204833984375, -5.37127685546875, -5.1220703125, -4.87286376953125, -4.6236572265625, -4.37445068359375, -4.125244140625, -3.87603759765625, -3.6268310546875, -3.37762451171875, -3.12841796875, -2.87921142578125, -2.6300048828125, -2.38079833984375, -2.131591796875, -1.88238525390625, -1.6331787109375, -1.38397216796875, -1.134765625, -0.88555908203125, -0.6363525390625, -0.38714599609375, -0.137939453125, 0.11126708984375, 0.3604736328125, 0.60968017578125, 0.85888671875, 1.10809326171875, 1.3572998046875, 1.60650634765625, 1.855712890625, 2.10491943359375, 2.3541259765625, 2.60333251953125, 2.8525390625, 3.10174560546875, 3.3509521484375, 3.60015869140625, 3.849365234375, 4.09857177734375, 4.3477783203125, 4.59698486328125, 4.84619140625, 5.09539794921875, 5.3446044921875, 5.59381103515625, 5.843017578125, 6.09222412109375, 6.3414306640625, 6.59063720703125, 6.83984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 12.0, 10.0, 10.0, 7.0, 6.0, 9.0, 11.0, 18.0, 21.0, 29.0, 18.0, 22.0, 35.0, 21.0, 40.0, 41.0, 43.0, 42.0, 39.0, 35.0, 39.0, 44.0, 49.0, 42.0, 46.0, 47.0, 40.0, 24.0, 34.0, 26.0, 16.0, 18.0, 19.0, 19.0, 14.0, 14.0, 9.0, 0.0, 9.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.517696380615234, -39.299461364746094, -38.08123016357422, -36.86299514770508, -35.64476013183594, -34.42652893066406, -33.20829391479492, -31.99005889892578, -30.771825790405273, -29.553592681884766, -28.335357666015625, -27.117124557495117, -25.89889144897461, -24.68065643310547, -23.46242332458496, -22.244190216064453, -21.025955200195312, -19.807722091674805, -18.589487075805664, -17.371253967285156, -16.153018951416016, -14.934785842895508, -13.716552734375, -12.498318672180176, -11.280084609985352, -10.061850547790527, -8.843616485595703, -7.625383377075195, -6.407149314880371, -5.188915252685547, -3.970681667327881, -2.752448081970215, -1.5342140197753906, -0.3159801959991455, 0.9022536277770996, 2.1204874515533447, 3.33872127532959, 4.556955337524414, 5.77518892288208, 6.993422508239746, 8.21165657043457, 9.429890632629395, 10.648124694824219, 11.866357803344727, 13.08459186553955, 14.302825927734375, 15.521059036254883, 16.73929214477539, 17.95752716064453, 19.17576026916504, 20.39399528503418, 21.612228393554688, 22.830463409423828, 24.048696517944336, 25.266929626464844, 26.485164642333984, 27.703397750854492, 28.921630859375, 30.13986587524414, 31.35809898376465, 32.576332092285156, 33.7945671081543, 35.01280212402344, 36.23103332519531, 37.44926834106445]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 0.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 6.0, 16.0, 20.0, 27.0, 16.0, 16.0, 26.0, 27.0, 34.0, 34.0, 40.0, 39.0, 40.0, 44.0, 31.0, 43.0, 41.0, 45.0, 43.0, 44.0, 31.0, 35.0, 49.0, 33.0, 29.0, 22.0, 29.0, 26.0, 18.0, 7.0, 15.0, 14.0, 6.0, 11.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.63716125488281, -46.09666061401367, -44.556156158447266, -43.015655517578125, -41.47515106201172, -39.93465042114258, -38.39414596557617, -36.85364532470703, -35.313140869140625, -33.772640228271484, -32.23213577270508, -30.691633224487305, -29.15113067626953, -27.610628128051758, -26.070125579833984, -24.529624938964844, -22.98912239074707, -21.448619842529297, -19.908117294311523, -18.36761474609375, -16.827112197875977, -15.286609649658203, -13.746108055114746, -12.205605506896973, -10.6651029586792, -9.124600410461426, -7.584097862243652, -6.043595790863037, -4.503093242645264, -2.9625906944274902, -1.422088623046875, 0.11841392517089844, 1.6589164733886719, 3.1994190216064453, 4.739921569824219, 6.280423641204834, 7.820926189422607, 9.361429214477539, 10.901930809020996, 12.44243335723877, 13.982935905456543, 15.523438453674316, 17.063940048217773, 18.604442596435547, 20.14494514465332, 21.685447692871094, 23.225950241088867, 24.76645278930664, 26.306955337524414, 27.847457885742188, 29.38796043395996, 30.928462982177734, 32.468963623046875, 34.00946807861328, 35.54996871948242, 37.09047317504883, 38.63097381591797, 40.17147445678711, 41.711978912353516, 43.252479553222656, 44.79298400878906, 46.3334846496582, 47.87398910522461, 49.41448974609375, 50.954994201660156]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 26.0, 37.0, 51.0, 100.0, 159.0, 247.0, 391.0, 634.0, 885.0, 1489.0, 2236.0, 3539.0, 5020.0, 7464.0, 11050.0, 15969.0, 22595.0, 30848.0, 40963.0, 52969.0, 66374.0, 77631.0, 87650.0, 93015.0, 93331.0, 87562.0, 78589.0, 66261.0, 53777.0, 42295.0, 31498.0, 22931.0, 16308.0, 11408.0, 7768.0, 5238.0, 3647.0, 2318.0, 1557.0, 1005.0, 614.0, 398.0, 275.0, 165.0, 102.0, 62.0, 37.0, 21.0, 15.0, 13.0, 5.0, 2.0, 1.0, 4.0], "bins": [-26.640625, -25.85791015625, -25.0751953125, -24.29248046875, -23.509765625, -22.72705078125, -21.9443359375, -21.16162109375, -20.37890625, -19.59619140625, -18.8134765625, -18.03076171875, -17.248046875, -16.46533203125, -15.6826171875, -14.89990234375, -14.1171875, -13.33447265625, -12.5517578125, -11.76904296875, -10.986328125, -10.20361328125, -9.4208984375, -8.63818359375, -7.85546875, -7.07275390625, -6.2900390625, -5.50732421875, -4.724609375, -3.94189453125, -3.1591796875, -2.37646484375, -1.59375, -0.81103515625, -0.0283203125, 0.75439453125, 1.537109375, 2.31982421875, 3.1025390625, 3.88525390625, 4.66796875, 5.45068359375, 6.2333984375, 7.01611328125, 7.798828125, 8.58154296875, 9.3642578125, 10.14697265625, 10.9296875, 11.71240234375, 12.4951171875, 13.27783203125, 14.060546875, 14.84326171875, 15.6259765625, 16.40869140625, 17.19140625, 17.97412109375, 18.7568359375, 19.53955078125, 20.322265625, 21.10498046875, 21.8876953125, 22.67041015625, 23.453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 17.0, 16.0, 32.0, 15.0, 17.0, 22.0, 32.0, 27.0, 35.0, 42.0, 34.0, 45.0, 42.0, 36.0, 37.0, 47.0, 40.0, 44.0, 45.0, 29.0, 39.0, 47.0, 34.0, 28.0, 24.0, 25.0, 27.0, 19.0, 7.0, 16.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.25, -44.7529296875, -43.255859375, -41.7587890625, -40.26171875, -38.7646484375, -37.267578125, -35.7705078125, -34.2734375, -32.7763671875, -31.279296875, -29.7822265625, -28.28515625, -26.7880859375, -25.291015625, -23.7939453125, -22.296875, -20.7998046875, -19.302734375, -17.8056640625, -16.30859375, -14.8115234375, -13.314453125, -11.8173828125, -10.3203125, -8.8232421875, -7.326171875, -5.8291015625, -4.33203125, -2.8349609375, -1.337890625, 0.1591796875, 1.65625, 3.1533203125, 4.650390625, 6.1474609375, 7.64453125, 9.1416015625, 10.638671875, 12.1357421875, 13.6328125, 15.1298828125, 16.626953125, 18.1240234375, 19.62109375, 21.1181640625, 22.615234375, 24.1123046875, 25.609375, 27.1064453125, 28.603515625, 30.1005859375, 31.59765625, 33.0947265625, 34.591796875, 36.0888671875, 37.5859375, 39.0830078125, 40.580078125, 42.0771484375, 43.57421875, 45.0712890625, 46.568359375, 48.0654296875, 49.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 10.0, 21.0, 27.0, 51.0, 80.0, 130.0, 181.0, 287.0, 468.0, 694.0, 956.0, 1470.0, 2278.0, 3376.0, 5008.0, 7390.0, 10921.0, 15667.0, 22298.0, 31158.0, 42104.0, 55528.0, 69005.0, 81596.0, 91381.0, 97895.0, 96095.0, 89009.0, 78364.0, 64266.0, 50785.0, 38369.0, 28203.0, 20009.0, 13888.0, 9616.0, 6637.0, 4481.0, 2967.0, 2010.0, 1311.0, 876.0, 578.0, 382.0, 286.0, 153.0, 109.0, 55.0, 47.0, 34.0, 18.0, 11.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-26.671875, -25.834228515625, -24.99658203125, -24.158935546875, -23.3212890625, -22.483642578125, -21.64599609375, -20.808349609375, -19.970703125, -19.133056640625, -18.29541015625, -17.457763671875, -16.6201171875, -15.782470703125, -14.94482421875, -14.107177734375, -13.26953125, -12.431884765625, -11.59423828125, -10.756591796875, -9.9189453125, -9.081298828125, -8.24365234375, -7.406005859375, -6.568359375, -5.730712890625, -4.89306640625, -4.055419921875, -3.2177734375, -2.380126953125, -1.54248046875, -0.704833984375, 0.1328125, 0.970458984375, 1.80810546875, 2.645751953125, 3.4833984375, 4.321044921875, 5.15869140625, 5.996337890625, 6.833984375, 7.671630859375, 8.50927734375, 9.346923828125, 10.1845703125, 11.022216796875, 11.85986328125, 12.697509765625, 13.53515625, 14.372802734375, 15.21044921875, 16.048095703125, 16.8857421875, 17.723388671875, 18.56103515625, 19.398681640625, 20.236328125, 21.073974609375, 21.91162109375, 22.749267578125, 23.5869140625, 24.424560546875, 25.26220703125, 26.099853515625, 26.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 2.0, 6.0, 16.0, 11.0, 18.0, 12.0, 17.0, 29.0, 19.0, 24.0, 36.0, 29.0, 37.0, 31.0, 38.0, 40.0, 42.0, 36.0, 37.0, 35.0, 36.0, 37.0, 41.0, 44.0, 37.0, 39.0, 37.0, 26.0, 25.0, 18.0, 18.0, 17.0, 22.0, 11.0, 8.0, 11.0, 9.0, 9.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.828125, -27.888916015625, -26.94970703125, -26.010498046875, -25.0712890625, -24.132080078125, -23.19287109375, -22.253662109375, -21.314453125, -20.375244140625, -19.43603515625, -18.496826171875, -17.5576171875, -16.618408203125, -15.67919921875, -14.739990234375, -13.80078125, -12.861572265625, -11.92236328125, -10.983154296875, -10.0439453125, -9.104736328125, -8.16552734375, -7.226318359375, -6.287109375, -5.347900390625, -4.40869140625, -3.469482421875, -2.5302734375, -1.591064453125, -0.65185546875, 0.287353515625, 1.2265625, 2.165771484375, 3.10498046875, 4.044189453125, 4.9833984375, 5.922607421875, 6.86181640625, 7.801025390625, 8.740234375, 9.679443359375, 10.61865234375, 11.557861328125, 12.4970703125, 13.436279296875, 14.37548828125, 15.314697265625, 16.25390625, 17.193115234375, 18.13232421875, 19.071533203125, 20.0107421875, 20.949951171875, 21.88916015625, 22.828369140625, 23.767578125, 24.706787109375, 25.64599609375, 26.585205078125, 27.5244140625, 28.463623046875, 29.40283203125, 30.342041015625, 31.28125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 9.0, 9.0, 15.0, 24.0, 29.0, 60.0, 59.0, 75.0, 145.0, 169.0, 300.0, 384.0, 568.0, 838.0, 1243.0, 1906.0, 2913.0, 4583.0, 6930.0, 11285.0, 17959.0, 28662.0, 44570.0, 67022.0, 95162.0, 121973.0, 138388.0, 134856.0, 114690.0, 86398.0, 59753.0, 39174.0, 25143.0, 15357.0, 9722.0, 6328.0, 3952.0, 2583.0, 1778.0, 1097.0, 746.0, 537.0, 369.0, 251.0, 171.0, 113.0, 85.0, 62.0, 28.0, 26.0, 23.0, 9.0, 13.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-15.1171875, -14.642578125, -14.16796875, -13.693359375, -13.21875, -12.744140625, -12.26953125, -11.794921875, -11.3203125, -10.845703125, -10.37109375, -9.896484375, -9.421875, -8.947265625, -8.47265625, -7.998046875, -7.5234375, -7.048828125, -6.57421875, -6.099609375, -5.625, -5.150390625, -4.67578125, -4.201171875, -3.7265625, -3.251953125, -2.77734375, -2.302734375, -1.828125, -1.353515625, -0.87890625, -0.404296875, 0.0703125, 0.544921875, 1.01953125, 1.494140625, 1.96875, 2.443359375, 2.91796875, 3.392578125, 3.8671875, 4.341796875, 4.81640625, 5.291015625, 5.765625, 6.240234375, 6.71484375, 7.189453125, 7.6640625, 8.138671875, 8.61328125, 9.087890625, 9.5625, 10.037109375, 10.51171875, 10.986328125, 11.4609375, 11.935546875, 12.41015625, 12.884765625, 13.359375, 13.833984375, 14.30859375, 14.783203125, 15.2578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 16.0, 18.0, 21.0, 21.0, 36.0, 63.0, 65.0, 71.0, 77.0, 91.0, 82.0, 93.0, 73.0, 52.0, 51.0, 38.0, 43.0, 16.0, 11.0, 13.0, 4.0, 10.0, 2.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030918121337890625, -0.003008037805557251, -0.0029242634773254395, -0.002840489149093628, -0.0027567148208618164, -0.002672940492630005, -0.0025891661643981934, -0.002505391836166382, -0.0024216175079345703, -0.002337843179702759, -0.0022540688514709473, -0.0021702945232391357, -0.0020865201950073242, -0.0020027458667755127, -0.0019189715385437012, -0.0018351972103118896, -0.0017514228820800781, -0.0016676485538482666, -0.001583874225616455, -0.0015000998973846436, -0.001416325569152832, -0.0013325512409210205, -0.001248776912689209, -0.0011650025844573975, -0.001081228256225586, -0.0009974539279937744, -0.0009136795997619629, -0.0008299052715301514, -0.0007461309432983398, -0.0006623566150665283, -0.0005785822868347168, -0.0004948079586029053, -0.00041103363037109375, -0.0003272593021392822, -0.0002434849739074707, -0.00015971064567565918, -7.593631744384766e-05, 7.838010787963867e-06, 9.161233901977539e-05, 0.00017538666725158691, 0.00025916099548339844, 0.00034293532371520996, 0.0004267096519470215, 0.000510483980178833, 0.0005942583084106445, 0.0006780326366424561, 0.0007618069648742676, 0.0008455812931060791, 0.0009293556213378906, 0.0010131299495697021, 0.0010969042778015137, 0.0011806786060333252, 0.0012644529342651367, 0.0013482272624969482, 0.0014320015907287598, 0.0015157759189605713, 0.0015995502471923828, 0.0016833245754241943, 0.0017670989036560059, 0.0018508732318878174, 0.001934647560119629, 0.0020184218883514404, 0.002102196216583252, 0.0021859705448150635, 0.002269744873046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 8.0, 15.0, 17.0, 28.0, 51.0, 79.0, 125.0, 179.0, 266.0, 368.0, 576.0, 924.0, 1413.0, 2278.0, 3571.0, 5474.0, 8923.0, 13689.0, 21859.0, 34427.0, 52616.0, 76285.0, 104757.0, 129095.0, 137573.0, 127849.0, 104513.0, 76678.0, 52080.0, 33790.0, 21640.0, 13529.0, 8721.0, 5490.0, 3475.0, 2182.0, 1401.0, 908.0, 582.0, 411.0, 222.0, 159.0, 116.0, 72.0, 47.0, 35.0, 21.0, 14.0, 13.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-16.640625, -16.12841796875, -15.6162109375, -15.10400390625, -14.591796875, -14.07958984375, -13.5673828125, -13.05517578125, -12.54296875, -12.03076171875, -11.5185546875, -11.00634765625, -10.494140625, -9.98193359375, -9.4697265625, -8.95751953125, -8.4453125, -7.93310546875, -7.4208984375, -6.90869140625, -6.396484375, -5.88427734375, -5.3720703125, -4.85986328125, -4.34765625, -3.83544921875, -3.3232421875, -2.81103515625, -2.298828125, -1.78662109375, -1.2744140625, -0.76220703125, -0.25, 0.26220703125, 0.7744140625, 1.28662109375, 1.798828125, 2.31103515625, 2.8232421875, 3.33544921875, 3.84765625, 4.35986328125, 4.8720703125, 5.38427734375, 5.896484375, 6.40869140625, 6.9208984375, 7.43310546875, 7.9453125, 8.45751953125, 8.9697265625, 9.48193359375, 9.994140625, 10.50634765625, 11.0185546875, 11.53076171875, 12.04296875, 12.55517578125, 13.0673828125, 13.57958984375, 14.091796875, 14.60400390625, 15.1162109375, 15.62841796875, 16.140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 8.0, 17.0, 23.0, 22.0, 21.0, 24.0, 37.0, 32.0, 38.0, 37.0, 33.0, 50.0, 46.0, 54.0, 46.0, 55.0, 47.0, 46.0, 42.0, 34.0, 48.0, 30.0, 22.0, 24.0, 16.0, 26.0, 15.0, 12.0, 12.0, 13.0, 8.0, 5.0, 10.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6796875, -7.414794921875, -7.14990234375, -6.885009765625, -6.6201171875, -6.355224609375, -6.09033203125, -5.825439453125, -5.560546875, -5.295654296875, -5.03076171875, -4.765869140625, -4.5009765625, -4.236083984375, -3.97119140625, -3.706298828125, -3.44140625, -3.176513671875, -2.91162109375, -2.646728515625, -2.3818359375, -2.116943359375, -1.85205078125, -1.587158203125, -1.322265625, -1.057373046875, -0.79248046875, -0.527587890625, -0.2626953125, 0.002197265625, 0.26708984375, 0.531982421875, 0.796875, 1.061767578125, 1.32666015625, 1.591552734375, 1.8564453125, 2.121337890625, 2.38623046875, 2.651123046875, 2.916015625, 3.180908203125, 3.44580078125, 3.710693359375, 3.9755859375, 4.240478515625, 4.50537109375, 4.770263671875, 5.03515625, 5.300048828125, 5.56494140625, 5.829833984375, 6.0947265625, 6.359619140625, 6.62451171875, 6.889404296875, 7.154296875, 7.419189453125, 7.68408203125, 7.948974609375, 8.2138671875, 8.478759765625, 8.74365234375, 9.008544921875, 9.2734375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 12.0, 4.0, 9.0, 7.0, 15.0, 13.0, 9.0, 18.0, 22.0, 21.0, 27.0, 27.0, 33.0, 38.0, 28.0, 45.0, 38.0, 47.0, 33.0, 50.0, 43.0, 40.0, 51.0, 41.0, 47.0, 39.0, 38.0, 26.0, 27.0, 22.0, 15.0, 22.0, 12.0, 11.0, 12.0, 12.0, 5.0, 9.0, 6.0, 8.0, 2.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-42.20340347290039, -40.9516716003418, -39.6999397277832, -38.44820785522461, -37.196475982666016, -35.94474411010742, -34.69301223754883, -33.4412841796875, -32.189552307128906, -30.937820434570312, -29.68608856201172, -28.434356689453125, -27.18262481689453, -25.930892944335938, -24.679162979125977, -23.427431106567383, -22.175697326660156, -20.923965454101562, -19.67223358154297, -18.420501708984375, -17.16876983642578, -15.917038917541504, -14.665307998657227, -13.413576126098633, -12.161844253540039, -10.910112380981445, -9.658380508422852, -8.406649589538574, -7.1549177169799805, -5.903185844421387, -4.651454448699951, -3.3997230529785156, -2.1479873657226562, -0.8962557315826416, 0.35547590255737305, 1.6072075366973877, 2.8589391708374023, 4.110671043395996, 5.362402439117432, 6.614133834838867, 7.865865707397461, 9.117597579956055, 10.369329452514648, 11.621060371398926, 12.87279224395752, 14.124524116516113, 15.37625503540039, 16.627986907958984, 17.879718780517578, 19.131450653076172, 20.383182525634766, 21.63491439819336, 22.886646270751953, 24.138378143310547, 25.390108108520508, 26.6418399810791, 27.893571853637695, 29.14530372619629, 30.397035598754883, 31.648767471313477, 32.90049743652344, 34.15222930908203, 35.403961181640625, 36.65569305419922, 37.90742492675781]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 16.0, 20.0, 19.0, 24.0, 25.0, 26.0, 25.0, 31.0, 42.0, 33.0, 38.0, 45.0, 44.0, 36.0, 48.0, 49.0, 40.0, 40.0, 48.0, 33.0, 38.0, 34.0, 34.0, 29.0, 20.0, 19.0, 20.0, 15.0, 17.0, 9.0, 5.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.726112365722656, -46.140419006347656, -44.55472183227539, -42.96902847290039, -41.38333511352539, -39.797637939453125, -38.211944580078125, -36.626251220703125, -35.04055404663086, -33.45486068725586, -31.869165420532227, -30.283470153808594, -28.69777488708496, -27.112079620361328, -25.526386260986328, -23.940690994262695, -22.354997634887695, -20.769302368164062, -19.183609008789062, -17.59791374206543, -16.012218475341797, -14.42652416229248, -12.840829849243164, -11.255134582519531, -9.669440269470215, -8.083745956420898, -6.498050689697266, -4.912356376647949, -3.3266615867614746, -1.740966796875, -0.1552724838256836, 1.4304227828979492, 3.0161170959472656, 4.60181188583374, 6.187506675720215, 7.773200988769531, 9.358896255493164, 10.94459056854248, 12.530284881591797, 14.11598014831543, 15.701674461364746, 17.287368774414062, 18.873064041137695, 20.458759307861328, 22.044452667236328, 23.63014793395996, 25.215843200683594, 26.801536560058594, 28.387231826782227, 29.97292709350586, 31.55862045288086, 33.144317626953125, 34.730010986328125, 36.315704345703125, 37.901397705078125, 39.48709487915039, 41.07278823852539, 42.65848159790039, 44.244178771972656, 45.829872131347656, 47.415565490722656, 49.00126266479492, 50.58695602416992, 52.17265319824219, 53.75834655761719]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 2.0, 8.0, 11.0, 12.0, 20.0, 36.0, 50.0, 89.0, 160.0, 288.0, 491.0, 695.0, 1217.0, 1915.0, 2950.0, 4973.0, 7965.0, 12317.0, 19448.0, 30433.0, 46344.0, 70098.0, 101839.0, 146094.0, 200477.0, 262486.0, 325376.0, 379431.0, 413498.0, 419343.0, 394934.0, 345552.0, 284679.0, 220164.0, 163129.0, 115632.0, 78681.0, 52334.0, 34295.0, 21737.0, 13209.0, 8419.0, 5289.0, 3236.0, 1877.0, 1197.0, 701.0, 447.0, 266.0, 181.0, 103.0, 60.0, 47.0, 25.0, 15.0, 16.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.84375, -25.953369140625, -25.06298828125, -24.172607421875, -23.2822265625, -22.391845703125, -21.50146484375, -20.611083984375, -19.720703125, -18.830322265625, -17.93994140625, -17.049560546875, -16.1591796875, -15.268798828125, -14.37841796875, -13.488037109375, -12.59765625, -11.707275390625, -10.81689453125, -9.926513671875, -9.0361328125, -8.145751953125, -7.25537109375, -6.364990234375, -5.474609375, -4.584228515625, -3.69384765625, -2.803466796875, -1.9130859375, -1.022705078125, -0.13232421875, 0.758056640625, 1.6484375, 2.538818359375, 3.42919921875, 4.319580078125, 5.2099609375, 6.100341796875, 6.99072265625, 7.881103515625, 8.771484375, 9.661865234375, 10.55224609375, 11.442626953125, 12.3330078125, 13.223388671875, 14.11376953125, 15.004150390625, 15.89453125, 16.784912109375, 17.67529296875, 18.565673828125, 19.4560546875, 20.346435546875, 21.23681640625, 22.127197265625, 23.017578125, 23.907958984375, 24.79833984375, 25.688720703125, 26.5791015625, 27.469482421875, 28.35986328125, 29.250244140625, 30.140625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 11.0, 17.0, 15.0, 21.0, 16.0, 38.0, 23.0, 23.0, 32.0, 38.0, 37.0, 41.0, 42.0, 43.0, 40.0, 43.0, 49.0, 39.0, 41.0, 39.0, 44.0, 37.0, 37.0, 29.0, 35.0, 21.0, 20.0, 18.0, 19.0, 10.0, 11.0, 7.0, 5.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.76513671875, -36.4677734375, -35.17041015625, -33.873046875, -32.57568359375, -31.2783203125, -29.98095703125, -28.68359375, -27.38623046875, -26.0888671875, -24.79150390625, -23.494140625, -22.19677734375, -20.8994140625, -19.60205078125, -18.3046875, -17.00732421875, -15.7099609375, -14.41259765625, -13.115234375, -11.81787109375, -10.5205078125, -9.22314453125, -7.92578125, -6.62841796875, -5.3310546875, -4.03369140625, -2.736328125, -1.43896484375, -0.1416015625, 1.15576171875, 2.453125, 3.75048828125, 5.0478515625, 6.34521484375, 7.642578125, 8.93994140625, 10.2373046875, 11.53466796875, 12.83203125, 14.12939453125, 15.4267578125, 16.72412109375, 18.021484375, 19.31884765625, 20.6162109375, 21.91357421875, 23.2109375, 24.50830078125, 25.8056640625, 27.10302734375, 28.400390625, 29.69775390625, 30.9951171875, 32.29248046875, 33.58984375, 34.88720703125, 36.1845703125, 37.48193359375, 38.779296875, 40.07666015625, 41.3740234375, 42.67138671875, 43.96875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 9.0, 11.0, 28.0, 52.0, 70.0, 131.0, 242.0, 393.0, 700.0, 1115.0, 1902.0, 3236.0, 5426.0, 8560.0, 13591.0, 21542.0, 32515.0, 48647.0, 70988.0, 99336.0, 136173.0, 177138.0, 224862.0, 270546.0, 313154.0, 344729.0, 361694.0, 358444.0, 340248.0, 304731.0, 260775.0, 213718.0, 167879.0, 127159.0, 93043.0, 65067.0, 44627.0, 29873.0, 19436.0, 12567.0, 7947.0, 4837.0, 2859.0, 1705.0, 1058.0, 624.0, 358.0, 257.0, 131.0, 64.0, 39.0, 28.0, 17.0, 7.0, 1.0, 6.0, 0.0, 2.0], "bins": [-26.796875, -25.982177734375, -25.16748046875, -24.352783203125, -23.5380859375, -22.723388671875, -21.90869140625, -21.093994140625, -20.279296875, -19.464599609375, -18.64990234375, -17.835205078125, -17.0205078125, -16.205810546875, -15.39111328125, -14.576416015625, -13.76171875, -12.947021484375, -12.13232421875, -11.317626953125, -10.5029296875, -9.688232421875, -8.87353515625, -8.058837890625, -7.244140625, -6.429443359375, -5.61474609375, -4.800048828125, -3.9853515625, -3.170654296875, -2.35595703125, -1.541259765625, -0.7265625, 0.088134765625, 0.90283203125, 1.717529296875, 2.5322265625, 3.346923828125, 4.16162109375, 4.976318359375, 5.791015625, 6.605712890625, 7.42041015625, 8.235107421875, 9.0498046875, 9.864501953125, 10.67919921875, 11.493896484375, 12.30859375, 13.123291015625, 13.93798828125, 14.752685546875, 15.5673828125, 16.382080078125, 17.19677734375, 18.011474609375, 18.826171875, 19.640869140625, 20.45556640625, 21.270263671875, 22.0849609375, 22.899658203125, 23.71435546875, 24.529052734375, 25.34375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 10.0, 11.0, 17.0, 23.0, 34.0, 45.0, 56.0, 61.0, 89.0, 82.0, 122.0, 123.0, 152.0, 211.0, 206.0, 212.0, 248.0, 238.0, 234.0, 228.0, 224.0, 201.0, 189.0, 179.0, 157.0, 130.0, 124.0, 100.0, 67.0, 63.0, 46.0, 48.0, 34.0, 32.0, 19.0, 21.0, 19.0, 5.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.022216796875, -17.38818359375, -16.754150390625, -16.1201171875, -15.486083984375, -14.85205078125, -14.218017578125, -13.583984375, -12.949951171875, -12.31591796875, -11.681884765625, -11.0478515625, -10.413818359375, -9.77978515625, -9.145751953125, -8.51171875, -7.877685546875, -7.24365234375, -6.609619140625, -5.9755859375, -5.341552734375, -4.70751953125, -4.073486328125, -3.439453125, -2.805419921875, -2.17138671875, -1.537353515625, -0.9033203125, -0.269287109375, 0.36474609375, 0.998779296875, 1.6328125, 2.266845703125, 2.90087890625, 3.534912109375, 4.1689453125, 4.802978515625, 5.43701171875, 6.071044921875, 6.705078125, 7.339111328125, 7.97314453125, 8.607177734375, 9.2412109375, 9.875244140625, 10.50927734375, 11.143310546875, 11.77734375, 12.411376953125, 13.04541015625, 13.679443359375, 14.3134765625, 14.947509765625, 15.58154296875, 16.215576171875, 16.849609375, 17.483642578125, 18.11767578125, 18.751708984375, 19.3857421875, 20.019775390625, 20.65380859375, 21.287841796875, 21.921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 2.0, 5.0, 9.0, 8.0, 7.0, 16.0, 13.0, 14.0, 14.0, 19.0, 19.0, 17.0, 21.0, 29.0, 35.0, 20.0, 35.0, 30.0, 55.0, 41.0, 39.0, 47.0, 44.0, 38.0, 35.0, 38.0, 34.0, 36.0, 26.0, 21.0, 45.0, 22.0, 24.0, 20.0, 10.0, 6.0, 18.0, 14.0, 16.0, 11.0, 8.0, 5.0, 5.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.52833557128906, -36.41531753540039, -35.30229949951172, -34.18928146362305, -33.076263427734375, -31.963247299194336, -30.850231170654297, -29.737213134765625, -28.624195098876953, -27.51117706298828, -26.39815902709961, -25.28514289855957, -24.1721248626709, -23.059106826782227, -21.946090698242188, -20.833072662353516, -19.720054626464844, -18.607036590576172, -17.4940185546875, -16.38100242614746, -15.267984390258789, -14.154966354370117, -13.041949272155762, -11.928932189941406, -10.815914154052734, -9.702896118164062, -8.589879035949707, -7.476861476898193, -6.36384391784668, -5.250826358795166, -4.137808799743652, -3.0247912406921387, -1.9117774963378906, -0.798759937286377, 0.3142576217651367, 1.4272751808166504, 2.540292739868164, 3.6533102989196777, 4.766327857971191, 5.879345417022705, 6.992362976074219, 8.10538101196289, 9.218398094177246, 10.331415176391602, 11.444433212280273, 12.557451248168945, 13.6704683303833, 14.783485412597656, 15.896503448486328, 17.009521484375, 18.122539520263672, 19.23555564880371, 20.348573684692383, 21.461591720581055, 22.574607849121094, 23.687625885009766, 24.800643920898438, 25.91366195678711, 27.02667999267578, 28.13969612121582, 29.252714157104492, 30.365732192993164, 31.478748321533203, 32.591766357421875, 33.70478439331055]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 7.0, 7.0, 5.0, 5.0, 1.0, 17.0, 16.0, 12.0, 13.0, 20.0, 22.0, 35.0, 28.0, 42.0, 20.0, 33.0, 50.0, 40.0, 39.0, 47.0, 26.0, 49.0, 52.0, 48.0, 35.0, 50.0, 36.0, 32.0, 32.0, 32.0, 32.0, 21.0, 23.0, 9.0, 9.0, 14.0, 9.0, 10.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.15998077392578, -47.66093826293945, -46.16189193725586, -44.66284942626953, -43.16380310058594, -41.66476058959961, -40.16571807861328, -38.66667175292969, -37.167625427246094, -35.668582916259766, -34.16953659057617, -32.670494079589844, -31.17144775390625, -29.672405242919922, -28.17336082458496, -26.67431640625, -25.175273895263672, -23.67622947692871, -22.17718505859375, -20.678142547607422, -19.179096221923828, -17.6800537109375, -16.18100929260254, -14.681964874267578, -13.182920455932617, -11.683876037597656, -10.184831619262695, -8.68578815460205, -7.18674373626709, -5.687699317932129, -4.188655853271484, -2.6896114349365234, -1.1905632019042969, 0.30848097801208496, 1.8075251579284668, 3.3065690994262695, 4.8056135177612305, 6.304657936096191, 7.803701400756836, 9.302745819091797, 10.801790237426758, 12.300834655761719, 13.79987907409668, 15.298922538757324, 16.79796600341797, 18.297012329101562, 19.79605484008789, 21.29509925842285, 22.794143676757812, 24.293188095092773, 25.792232513427734, 27.291275024414062, 28.790321350097656, 30.289363861083984, 31.788408279418945, 33.287452697753906, 34.7864990234375, 36.28554153442383, 37.78458786010742, 39.28363037109375, 40.782676696777344, 42.28171920776367, 43.78076171875, 45.279808044433594, 46.77885055541992]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 2.0, 13.0, 18.0, 22.0, 46.0, 41.0, 55.0, 108.0, 151.0, 194.0, 302.0, 425.0, 683.0, 996.0, 1522.0, 2623.0, 3960.0, 6492.0, 10939.0, 18749.0, 33688.0, 60576.0, 108364.0, 185824.0, 233227.0, 163834.0, 93541.0, 51898.0, 28737.0, 16222.0, 9741.0, 5697.0, 3561.0, 2120.0, 1456.0, 883.0, 577.0, 392.0, 272.0, 186.0, 95.0, 94.0, 58.0, 47.0, 38.0, 18.0, 19.0, 14.0, 8.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.953125, -10.61474609375, -10.2763671875, -9.93798828125, -9.599609375, -9.26123046875, -8.9228515625, -8.58447265625, -8.24609375, -7.90771484375, -7.5693359375, -7.23095703125, -6.892578125, -6.55419921875, -6.2158203125, -5.87744140625, -5.5390625, -5.20068359375, -4.8623046875, -4.52392578125, -4.185546875, -3.84716796875, -3.5087890625, -3.17041015625, -2.83203125, -2.49365234375, -2.1552734375, -1.81689453125, -1.478515625, -1.14013671875, -0.8017578125, -0.46337890625, -0.125, 0.21337890625, 0.5517578125, 0.89013671875, 1.228515625, 1.56689453125, 1.9052734375, 2.24365234375, 2.58203125, 2.92041015625, 3.2587890625, 3.59716796875, 3.935546875, 4.27392578125, 4.6123046875, 4.95068359375, 5.2890625, 5.62744140625, 5.9658203125, 6.30419921875, 6.642578125, 6.98095703125, 7.3193359375, 7.65771484375, 7.99609375, 8.33447265625, 8.6728515625, 9.01123046875, 9.349609375, 9.68798828125, 10.0263671875, 10.36474609375, 10.703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 5.0, 5.0, 1.0, 17.0, 16.0, 13.0, 14.0, 19.0, 25.0, 31.0, 31.0, 38.0, 23.0, 37.0, 44.0, 42.0, 40.0, 44.0, 26.0, 49.0, 56.0, 46.0, 37.0, 46.0, 38.0, 31.0, 33.0, 34.0, 28.0, 21.0, 22.0, 11.0, 8.0, 14.0, 9.0, 11.0, 4.0, 4.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.96875, -47.47119140625, -45.9736328125, -44.47607421875, -42.978515625, -41.48095703125, -39.9833984375, -38.48583984375, -36.98828125, -35.49072265625, -33.9931640625, -32.49560546875, -30.998046875, -29.50048828125, -28.0029296875, -26.50537109375, -25.0078125, -23.51025390625, -22.0126953125, -20.51513671875, -19.017578125, -17.52001953125, -16.0224609375, -14.52490234375, -13.02734375, -11.52978515625, -10.0322265625, -8.53466796875, -7.037109375, -5.53955078125, -4.0419921875, -2.54443359375, -1.046875, 0.45068359375, 1.9482421875, 3.44580078125, 4.943359375, 6.44091796875, 7.9384765625, 9.43603515625, 10.93359375, 12.43115234375, 13.9287109375, 15.42626953125, 16.923828125, 18.42138671875, 19.9189453125, 21.41650390625, 22.9140625, 24.41162109375, 25.9091796875, 27.40673828125, 28.904296875, 30.40185546875, 31.8994140625, 33.39697265625, 34.89453125, 36.39208984375, 37.8896484375, 39.38720703125, 40.884765625, 42.38232421875, 43.8798828125, 45.37744140625, 46.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 6.0, 15.0, 18.0, 24.0, 39.0, 47.0, 58.0, 87.0, 97.0, 162.0, 196.0, 299.0, 424.0, 629.0, 949.0, 1382.0, 2262.0, 3611.0, 6108.0, 11011.0, 20896.0, 42070.0, 93050.0, 219816.0, 330372.0, 167515.0, 72520.0, 34002.0, 17283.0, 9178.0, 5153.0, 3131.0, 2000.0, 1304.0, 833.0, 625.0, 390.0, 285.0, 194.0, 136.0, 98.0, 84.0, 50.0, 40.0, 29.0, 23.0, 23.0, 9.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.703125, -9.3935546875, -9.083984375, -8.7744140625, -8.46484375, -8.1552734375, -7.845703125, -7.5361328125, -7.2265625, -6.9169921875, -6.607421875, -6.2978515625, -5.98828125, -5.6787109375, -5.369140625, -5.0595703125, -4.75, -4.4404296875, -4.130859375, -3.8212890625, -3.51171875, -3.2021484375, -2.892578125, -2.5830078125, -2.2734375, -1.9638671875, -1.654296875, -1.3447265625, -1.03515625, -0.7255859375, -0.416015625, -0.1064453125, 0.203125, 0.5126953125, 0.822265625, 1.1318359375, 1.44140625, 1.7509765625, 2.060546875, 2.3701171875, 2.6796875, 2.9892578125, 3.298828125, 3.6083984375, 3.91796875, 4.2275390625, 4.537109375, 4.8466796875, 5.15625, 5.4658203125, 5.775390625, 6.0849609375, 6.39453125, 6.7041015625, 7.013671875, 7.3232421875, 7.6328125, 7.9423828125, 8.251953125, 8.5615234375, 8.87109375, 9.1806640625, 9.490234375, 9.7998046875, 10.109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 5.0, 11.0, 13.0, 13.0, 14.0, 30.0, 16.0, 30.0, 36.0, 40.0, 32.0, 45.0, 35.0, 33.0, 39.0, 41.0, 51.0, 40.0, 29.0, 35.0, 29.0, 39.0, 46.0, 35.0, 30.0, 40.0, 28.0, 21.0, 19.0, 25.0, 22.0, 9.0, 11.0, 12.0, 8.0, 4.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.5, -30.52099609375, -29.5419921875, -28.56298828125, -27.583984375, -26.60498046875, -25.6259765625, -24.64697265625, -23.66796875, -22.68896484375, -21.7099609375, -20.73095703125, -19.751953125, -18.77294921875, -17.7939453125, -16.81494140625, -15.8359375, -14.85693359375, -13.8779296875, -12.89892578125, -11.919921875, -10.94091796875, -9.9619140625, -8.98291015625, -8.00390625, -7.02490234375, -6.0458984375, -5.06689453125, -4.087890625, -3.10888671875, -2.1298828125, -1.15087890625, -0.171875, 0.80712890625, 1.7861328125, 2.76513671875, 3.744140625, 4.72314453125, 5.7021484375, 6.68115234375, 7.66015625, 8.63916015625, 9.6181640625, 10.59716796875, 11.576171875, 12.55517578125, 13.5341796875, 14.51318359375, 15.4921875, 16.47119140625, 17.4501953125, 18.42919921875, 19.408203125, 20.38720703125, 21.3662109375, 22.34521484375, 23.32421875, 24.30322265625, 25.2822265625, 26.26123046875, 27.240234375, 28.21923828125, 29.1982421875, 30.17724609375, 31.15625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 13.0, 12.0, 20.0, 24.0, 38.0, 49.0, 67.0, 95.0, 135.0, 178.0, 261.0, 463.0, 710.0, 1334.0, 4026.0, 28398.0, 929858.0, 72811.0, 5862.0, 1748.0, 854.0, 493.0, 314.0, 217.0, 146.0, 115.0, 81.0, 48.0, 45.0, 34.0, 19.0, 16.0, 12.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.453125, -18.796630859375, -18.14013671875, -17.483642578125, -16.8271484375, -16.170654296875, -15.51416015625, -14.857666015625, -14.201171875, -13.544677734375, -12.88818359375, -12.231689453125, -11.5751953125, -10.918701171875, -10.26220703125, -9.605712890625, -8.94921875, -8.292724609375, -7.63623046875, -6.979736328125, -6.3232421875, -5.666748046875, -5.01025390625, -4.353759765625, -3.697265625, -3.040771484375, -2.38427734375, -1.727783203125, -1.0712890625, -0.414794921875, 0.24169921875, 0.898193359375, 1.5546875, 2.211181640625, 2.86767578125, 3.524169921875, 4.1806640625, 4.837158203125, 5.49365234375, 6.150146484375, 6.806640625, 7.463134765625, 8.11962890625, 8.776123046875, 9.4326171875, 10.089111328125, 10.74560546875, 11.402099609375, 12.05859375, 12.715087890625, 13.37158203125, 14.028076171875, 14.6845703125, 15.341064453125, 15.99755859375, 16.654052734375, 17.310546875, 17.967041015625, 18.62353515625, 19.280029296875, 19.9365234375, 20.593017578125, 21.24951171875, 21.906005859375, 22.5625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 13.0, 10.0, 17.0, 15.0, 14.0, 39.0, 59.0, 67.0, 128.0, 157.0, 149.0, 109.0, 65.0, 51.0, 20.0, 13.0, 10.0, 9.0, 6.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008358955383300781, -0.0008086860179901123, -0.0007814764976501465, -0.0007542669773101807, -0.0007270574569702148, -0.000699847936630249, -0.0006726384162902832, -0.0006454288959503174, -0.0006182193756103516, -0.0005910098552703857, -0.0005638003349304199, -0.0005365908145904541, -0.0005093812942504883, -0.00048217177391052246, -0.00045496225357055664, -0.0004277527332305908, -0.000400543212890625, -0.0003733336925506592, -0.00034612417221069336, -0.00031891465187072754, -0.0002917051315307617, -0.0002644956111907959, -0.00023728609085083008, -0.00021007657051086426, -0.00018286705017089844, -0.00015565752983093262, -0.0001284480094909668, -0.00010123848915100098, -7.402896881103516e-05, -4.6819448471069336e-05, -1.9609928131103516e-05, 7.599592208862305e-06, 3.4809112548828125e-05, 6.201863288879395e-05, 8.922815322875977e-05, 0.00011643767356872559, 0.0001436471939086914, 0.00017085671424865723, 0.00019806623458862305, 0.00022527575492858887, 0.0002524852752685547, 0.0002796947956085205, 0.00030690431594848633, 0.00033411383628845215, 0.00036132335662841797, 0.0003885328769683838, 0.0004157423973083496, 0.00044295191764831543, 0.00047016143798828125, 0.0004973709583282471, 0.0005245804786682129, 0.0005517899990081787, 0.0005789995193481445, 0.0006062090396881104, 0.0006334185600280762, 0.000660628080368042, 0.0006878376007080078, 0.0007150471210479736, 0.0007422566413879395, 0.0007694661617279053, 0.0007966756820678711, 0.0008238852024078369, 0.0008510947227478027, 0.0008783042430877686, 0.0009055137634277344]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 11.0, 7.0, 15.0, 14.0, 20.0, 43.0, 43.0, 64.0, 106.0, 141.0, 219.0, 311.0, 501.0, 739.0, 1149.0, 1796.0, 3009.0, 6193.0, 15959.0, 55222.0, 225667.0, 498933.0, 169791.0, 42884.0, 12942.0, 5229.0, 2735.0, 1621.0, 1062.0, 704.0, 452.0, 308.0, 197.0, 146.0, 95.0, 66.0, 35.0, 34.0, 19.0, 18.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.3175048828125, -13.861572265625, -13.4056396484375, -12.94970703125, -12.4937744140625, -12.037841796875, -11.5819091796875, -11.1259765625, -10.6700439453125, -10.214111328125, -9.7581787109375, -9.30224609375, -8.8463134765625, -8.390380859375, -7.9344482421875, -7.478515625, -7.0225830078125, -6.566650390625, -6.1107177734375, -5.65478515625, -5.1988525390625, -4.742919921875, -4.2869873046875, -3.8310546875, -3.3751220703125, -2.919189453125, -2.4632568359375, -2.00732421875, -1.5513916015625, -1.095458984375, -0.6395263671875, -0.18359375, 0.2723388671875, 0.728271484375, 1.1842041015625, 1.64013671875, 2.0960693359375, 2.552001953125, 3.0079345703125, 3.4638671875, 3.9197998046875, 4.375732421875, 4.8316650390625, 5.28759765625, 5.7435302734375, 6.199462890625, 6.6553955078125, 7.111328125, 7.5672607421875, 8.023193359375, 8.4791259765625, 8.93505859375, 9.3909912109375, 9.846923828125, 10.3028564453125, 10.7587890625, 11.2147216796875, 11.670654296875, 12.1265869140625, 12.58251953125, 13.0384521484375, 13.494384765625, 13.9503173828125, 14.40625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 4.0, 10.0, 15.0, 15.0, 21.0, 22.0, 21.0, 36.0, 28.0, 41.0, 48.0, 64.0, 80.0, 113.0, 100.0, 54.0, 57.0, 41.0, 33.0, 23.0, 21.0, 29.0, 17.0, 19.0, 18.0, 13.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.763671875, -3.648712158203125, -3.53375244140625, -3.418792724609375, -3.3038330078125, -3.188873291015625, -3.07391357421875, -2.958953857421875, -2.843994140625, -2.729034423828125, -2.61407470703125, -2.499114990234375, -2.3841552734375, -2.269195556640625, -2.15423583984375, -2.039276123046875, -1.92431640625, -1.809356689453125, -1.69439697265625, -1.579437255859375, -1.4644775390625, -1.349517822265625, -1.23455810546875, -1.119598388671875, -1.004638671875, -0.889678955078125, -0.77471923828125, -0.659759521484375, -0.5447998046875, -0.429840087890625, -0.31488037109375, -0.199920654296875, -0.0849609375, 0.029998779296875, 0.14495849609375, 0.259918212890625, 0.3748779296875, 0.489837646484375, 0.60479736328125, 0.719757080078125, 0.834716796875, 0.949676513671875, 1.06463623046875, 1.179595947265625, 1.2945556640625, 1.409515380859375, 1.52447509765625, 1.639434814453125, 1.75439453125, 1.869354248046875, 1.98431396484375, 2.099273681640625, 2.2142333984375, 2.329193115234375, 2.44415283203125, 2.559112548828125, 2.674072265625, 2.789031982421875, 2.90399169921875, 3.018951416015625, 3.1339111328125, 3.248870849609375, 3.36383056640625, 3.478790283203125, 3.59375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 7.0, 9.0, 9.0, 10.0, 13.0, 21.0, 14.0, 18.0, 15.0, 15.0, 31.0, 21.0, 31.0, 36.0, 35.0, 34.0, 37.0, 47.0, 37.0, 38.0, 39.0, 42.0, 38.0, 28.0, 44.0, 31.0, 19.0, 34.0, 32.0, 24.0, 26.0, 20.0, 10.0, 12.0, 11.0, 18.0, 17.0, 11.0, 9.0, 4.0, 8.0, 8.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-36.41582107543945, -35.33332824707031, -34.25083541870117, -33.16834259033203, -32.08584976196289, -31.00335693359375, -29.920866012573242, -28.8383731842041, -27.75588035583496, -26.67338752746582, -25.59089469909668, -24.50840187072754, -23.42591094970703, -22.34341812133789, -21.26092529296875, -20.17843246459961, -19.09593963623047, -18.013446807861328, -16.930953979492188, -15.848462104797363, -14.765969276428223, -13.683476448059082, -12.600984573364258, -11.518491744995117, -10.435998916625977, -9.353506088256836, -8.271013259887695, -7.188521385192871, -6.1060285568237305, -5.02353572845459, -3.9410433769226074, -2.858551025390625, -1.7760581970214844, -0.6935656070709229, 0.38892698287963867, 1.4714195728302002, 2.5539121627807617, 3.6364049911499023, 4.718897342681885, 5.801389694213867, 6.883882522583008, 7.966375350952148, 9.048868179321289, 10.131360054016113, 11.213852882385254, 12.296345710754395, 13.378837585449219, 14.46133041381836, 15.5438232421875, 16.62631607055664, 17.70880889892578, 18.791301727294922, 19.873794555664062, 20.956287384033203, 22.03877830505371, 23.12127113342285, 24.203763961791992, 25.286256790161133, 26.368749618530273, 27.451242446899414, 28.533733367919922, 29.616226196289062, 30.698719024658203, 31.781211853027344, 32.863704681396484]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 4.0, 9.0, 8.0, 19.0, 14.0, 21.0, 23.0, 33.0, 28.0, 24.0, 31.0, 35.0, 37.0, 51.0, 25.0, 55.0, 42.0, 35.0, 55.0, 48.0, 41.0, 42.0, 42.0, 27.0, 51.0, 27.0, 29.0, 22.0, 21.0, 17.0, 10.0, 14.0, 8.0, 6.0, 10.0, 3.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.511680603027344, -48.939414978027344, -47.36715316772461, -45.79488754272461, -44.222625732421875, -42.650360107421875, -41.078094482421875, -39.50583267211914, -37.93356704711914, -36.36130142211914, -34.789039611816406, -33.216773986816406, -31.64451026916504, -30.072246551513672, -28.499982833862305, -26.927719116210938, -25.35545539855957, -23.783191680908203, -22.210927963256836, -20.63866424560547, -19.06639862060547, -17.4941349029541, -15.921871185302734, -14.34960651397705, -12.777342796325684, -11.205079078674316, -9.632814407348633, -8.060550689697266, -6.48828649520874, -4.916022300720215, -3.3437585830688477, -1.771493911743164, -0.19923019409179688, 1.373033881187439, 2.945297956466675, 4.517561912536621, 6.0898261070251465, 7.662090301513672, 9.234354019165039, 10.806618690490723, 12.37888240814209, 13.951146125793457, 15.52341079711914, 17.095674514770508, 18.667938232421875, 20.240203857421875, 21.81246566772461, 23.38473129272461, 24.956995010375977, 26.529258728027344, 28.10152244567871, 29.673786163330078, 31.246051788330078, 32.81831359863281, 34.39057922363281, 35.96284484863281, 37.53510665893555, 39.10737228393555, 40.67963409423828, 42.25189971923828, 43.824161529541016, 45.396427154541016, 46.96868896484375, 48.54095458984375, 50.11322021484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 7.0, 8.0, 21.0, 26.0, 55.0, 87.0, 149.0, 249.0, 359.0, 592.0, 984.0, 1446.0, 2398.0, 3831.0, 5947.0, 9188.0, 13666.0, 20367.0, 29761.0, 40959.0, 55638.0, 70522.0, 85056.0, 96705.0, 102890.0, 100882.0, 93711.0, 80986.0, 65869.0, 50565.0, 37269.0, 26288.0, 18101.0, 12037.0, 7933.0, 5069.0, 3337.0, 2078.0, 1304.0, 832.0, 546.0, 327.0, 207.0, 122.0, 70.0, 44.0, 31.0, 16.0, 13.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.1376953125, -22.306640625, -21.4755859375, -20.64453125, -19.8134765625, -18.982421875, -18.1513671875, -17.3203125, -16.4892578125, -15.658203125, -14.8271484375, -13.99609375, -13.1650390625, -12.333984375, -11.5029296875, -10.671875, -9.8408203125, -9.009765625, -8.1787109375, -7.34765625, -6.5166015625, -5.685546875, -4.8544921875, -4.0234375, -3.1923828125, -2.361328125, -1.5302734375, -0.69921875, 0.1318359375, 0.962890625, 1.7939453125, 2.625, 3.4560546875, 4.287109375, 5.1181640625, 5.94921875, 6.7802734375, 7.611328125, 8.4423828125, 9.2734375, 10.1044921875, 10.935546875, 11.7666015625, 12.59765625, 13.4287109375, 14.259765625, 15.0908203125, 15.921875, 16.7529296875, 17.583984375, 18.4150390625, 19.24609375, 20.0771484375, 20.908203125, 21.7392578125, 22.5703125, 23.4013671875, 24.232421875, 25.0634765625, 25.89453125, 26.7255859375, 27.556640625, 28.3876953125, 29.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 9.0, 16.0, 14.0, 22.0, 18.0, 39.0, 26.0, 24.0, 30.0, 33.0, 38.0, 51.0, 30.0, 44.0, 46.0, 34.0, 57.0, 50.0, 39.0, 42.0, 42.0, 30.0, 48.0, 24.0, 32.0, 24.0, 21.0, 19.0, 9.0, 15.0, 9.0, 6.0, 7.0, 6.0, 5.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28125, -47.75341796875, -46.2255859375, -44.69775390625, -43.169921875, -41.64208984375, -40.1142578125, -38.58642578125, -37.05859375, -35.53076171875, -34.0029296875, -32.47509765625, -30.947265625, -29.41943359375, -27.8916015625, -26.36376953125, -24.8359375, -23.30810546875, -21.7802734375, -20.25244140625, -18.724609375, -17.19677734375, -15.6689453125, -14.14111328125, -12.61328125, -11.08544921875, -9.5576171875, -8.02978515625, -6.501953125, -4.97412109375, -3.4462890625, -1.91845703125, -0.390625, 1.13720703125, 2.6650390625, 4.19287109375, 5.720703125, 7.24853515625, 8.7763671875, 10.30419921875, 11.83203125, 13.35986328125, 14.8876953125, 16.41552734375, 17.943359375, 19.47119140625, 20.9990234375, 22.52685546875, 24.0546875, 25.58251953125, 27.1103515625, 28.63818359375, 30.166015625, 31.69384765625, 33.2216796875, 34.74951171875, 36.27734375, 37.80517578125, 39.3330078125, 40.86083984375, 42.388671875, 43.91650390625, 45.4443359375, 46.97216796875, 48.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 5.0, 1.0, 8.0, 12.0, 15.0, 23.0, 50.0, 69.0, 142.0, 185.0, 333.0, 459.0, 695.0, 1247.0, 1984.0, 3019.0, 4692.0, 7093.0, 11106.0, 16811.0, 24670.0, 34341.0, 48128.0, 63291.0, 79652.0, 93097.0, 102285.0, 104336.0, 99359.0, 87562.0, 73292.0, 56572.0, 42453.0, 30202.0, 20755.0, 14349.0, 9293.0, 6040.0, 3941.0, 2595.0, 1656.0, 1002.0, 673.0, 411.0, 263.0, 148.0, 96.0, 52.0, 43.0, 23.0, 13.0, 7.0, 11.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.46875, -26.591064453125, -25.71337890625, -24.835693359375, -23.9580078125, -23.080322265625, -22.20263671875, -21.324951171875, -20.447265625, -19.569580078125, -18.69189453125, -17.814208984375, -16.9365234375, -16.058837890625, -15.18115234375, -14.303466796875, -13.42578125, -12.548095703125, -11.67041015625, -10.792724609375, -9.9150390625, -9.037353515625, -8.15966796875, -7.281982421875, -6.404296875, -5.526611328125, -4.64892578125, -3.771240234375, -2.8935546875, -2.015869140625, -1.13818359375, -0.260498046875, 0.6171875, 1.494873046875, 2.37255859375, 3.250244140625, 4.1279296875, 5.005615234375, 5.88330078125, 6.760986328125, 7.638671875, 8.516357421875, 9.39404296875, 10.271728515625, 11.1494140625, 12.027099609375, 12.90478515625, 13.782470703125, 14.66015625, 15.537841796875, 16.41552734375, 17.293212890625, 18.1708984375, 19.048583984375, 19.92626953125, 20.803955078125, 21.681640625, 22.559326171875, 23.43701171875, 24.314697265625, 25.1923828125, 26.070068359375, 26.94775390625, 27.825439453125, 28.703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 10.0, 13.0, 10.0, 21.0, 24.0, 16.0, 21.0, 26.0, 22.0, 32.0, 28.0, 35.0, 31.0, 38.0, 32.0, 39.0, 37.0, 42.0, 42.0, 51.0, 31.0, 40.0, 30.0, 29.0, 33.0, 25.0, 25.0, 34.0, 22.0, 28.0, 20.0, 17.0, 7.0, 15.0, 8.0, 6.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.78125, -26.894287109375, -26.00732421875, -25.120361328125, -24.2333984375, -23.346435546875, -22.45947265625, -21.572509765625, -20.685546875, -19.798583984375, -18.91162109375, -18.024658203125, -17.1376953125, -16.250732421875, -15.36376953125, -14.476806640625, -13.58984375, -12.702880859375, -11.81591796875, -10.928955078125, -10.0419921875, -9.155029296875, -8.26806640625, -7.381103515625, -6.494140625, -5.607177734375, -4.72021484375, -3.833251953125, -2.9462890625, -2.059326171875, -1.17236328125, -0.285400390625, 0.6015625, 1.488525390625, 2.37548828125, 3.262451171875, 4.1494140625, 5.036376953125, 5.92333984375, 6.810302734375, 7.697265625, 8.584228515625, 9.47119140625, 10.358154296875, 11.2451171875, 12.132080078125, 13.01904296875, 13.906005859375, 14.79296875, 15.679931640625, 16.56689453125, 17.453857421875, 18.3408203125, 19.227783203125, 20.11474609375, 21.001708984375, 21.888671875, 22.775634765625, 23.66259765625, 24.549560546875, 25.4365234375, 26.323486328125, 27.21044921875, 28.097412109375, 28.984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 10.0, 15.0, 32.0, 40.0, 62.0, 99.0, 145.0, 246.0, 362.0, 672.0, 1400.0, 3019.0, 7570.0, 20964.0, 60728.0, 156631.0, 279339.0, 275654.0, 150540.0, 58130.0, 19772.0, 7124.0, 2868.0, 1417.0, 658.0, 431.0, 238.0, 154.0, 89.0, 50.0, 25.0, 18.0, 15.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.531005859375, -27.54638671875, -26.561767578125, -25.5771484375, -24.592529296875, -23.60791015625, -22.623291015625, -21.638671875, -20.654052734375, -19.66943359375, -18.684814453125, -17.7001953125, -16.715576171875, -15.73095703125, -14.746337890625, -13.76171875, -12.777099609375, -11.79248046875, -10.807861328125, -9.8232421875, -8.838623046875, -7.85400390625, -6.869384765625, -5.884765625, -4.900146484375, -3.91552734375, -2.930908203125, -1.9462890625, -0.961669921875, 0.02294921875, 1.007568359375, 1.9921875, 2.976806640625, 3.96142578125, 4.946044921875, 5.9306640625, 6.915283203125, 7.89990234375, 8.884521484375, 9.869140625, 10.853759765625, 11.83837890625, 12.822998046875, 13.8076171875, 14.792236328125, 15.77685546875, 16.761474609375, 17.74609375, 18.730712890625, 19.71533203125, 20.699951171875, 21.6845703125, 22.669189453125, 23.65380859375, 24.638427734375, 25.623046875, 26.607666015625, 27.59228515625, 28.576904296875, 29.5615234375, 30.546142578125, 31.53076171875, 32.515380859375, 33.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 10.0, 10.0, 13.0, 6.0, 15.0, 16.0, 26.0, 26.0, 28.0, 47.0, 32.0, 36.0, 49.0, 64.0, 43.0, 42.0, 48.0, 55.0, 40.0, 37.0, 50.0, 43.0, 36.0, 33.0, 37.0, 24.0, 27.0, 15.0, 14.0, 14.0, 14.0, 8.0, 7.0, 4.0, 5.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00152587890625, -0.0014795362949371338, -0.0014331936836242676, -0.0013868510723114014, -0.0013405084609985352, -0.001294165849685669, -0.0012478232383728027, -0.0012014806270599365, -0.0011551380157470703, -0.001108795404434204, -0.0010624527931213379, -0.0010161101818084717, -0.0009697675704956055, -0.0009234249591827393, -0.000877082347869873, -0.0008307397365570068, -0.0007843971252441406, -0.0007380545139312744, -0.0006917119026184082, -0.000645369291305542, -0.0005990266799926758, -0.0005526840686798096, -0.0005063414573669434, -0.00045999884605407715, -0.00041365623474121094, -0.0003673136234283447, -0.0003209710121154785, -0.0002746284008026123, -0.0002282857894897461, -0.00018194317817687988, -0.00013560056686401367, -8.925795555114746e-05, -4.291534423828125e-05, 3.427267074584961e-06, 4.976987838745117e-05, 9.611248970031738e-05, 0.0001424551010131836, 0.0001887977123260498, 0.00023514032363891602, 0.0002814829349517822, 0.00032782554626464844, 0.00037416815757751465, 0.00042051076889038086, 0.00046685338020324707, 0.0005131959915161133, 0.0005595386028289795, 0.0006058812141418457, 0.0006522238254547119, 0.0006985664367675781, 0.0007449090480804443, 0.0007912516593933105, 0.0008375942707061768, 0.000883936882019043, 0.0009302794933319092, 0.0009766221046447754, 0.0010229647159576416, 0.0010693073272705078, 0.001115649938583374, 0.0011619925498962402, 0.0012083351612091064, 0.0012546777725219727, 0.0013010203838348389, 0.001347362995147705, 0.0013937056064605713, 0.0014400482177734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 8.0, 10.0, 11.0, 15.0, 23.0, 21.0, 35.0, 51.0, 87.0, 122.0, 155.0, 207.0, 336.0, 505.0, 931.0, 1806.0, 4032.0, 10739.0, 34971.0, 115005.0, 284345.0, 337901.0, 173147.0, 55938.0, 16918.0, 5714.0, 2438.0, 1138.0, 664.0, 408.0, 270.0, 176.0, 105.0, 88.0, 61.0, 46.0, 31.0, 34.0, 17.0, 16.0, 7.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40625, -37.13427734375, -35.8623046875, -34.59033203125, -33.318359375, -32.04638671875, -30.7744140625, -29.50244140625, -28.23046875, -26.95849609375, -25.6865234375, -24.41455078125, -23.142578125, -21.87060546875, -20.5986328125, -19.32666015625, -18.0546875, -16.78271484375, -15.5107421875, -14.23876953125, -12.966796875, -11.69482421875, -10.4228515625, -9.15087890625, -7.87890625, -6.60693359375, -5.3349609375, -4.06298828125, -2.791015625, -1.51904296875, -0.2470703125, 1.02490234375, 2.296875, 3.56884765625, 4.8408203125, 6.11279296875, 7.384765625, 8.65673828125, 9.9287109375, 11.20068359375, 12.47265625, 13.74462890625, 15.0166015625, 16.28857421875, 17.560546875, 18.83251953125, 20.1044921875, 21.37646484375, 22.6484375, 23.92041015625, 25.1923828125, 26.46435546875, 27.736328125, 29.00830078125, 30.2802734375, 31.55224609375, 32.82421875, 34.09619140625, 35.3681640625, 36.64013671875, 37.912109375, 39.18408203125, 40.4560546875, 41.72802734375, 43.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 19.0, 31.0, 41.0, 76.0, 97.0, 154.0, 157.0, 131.0, 108.0, 70.0, 30.0, 31.0, 11.0, 6.0, 3.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.3125, -23.6937255859375, -23.074951171875, -22.4561767578125, -21.83740234375, -21.2186279296875, -20.599853515625, -19.9810791015625, -19.3623046875, -18.7435302734375, -18.124755859375, -17.5059814453125, -16.88720703125, -16.2684326171875, -15.649658203125, -15.0308837890625, -14.412109375, -13.7933349609375, -13.174560546875, -12.5557861328125, -11.93701171875, -11.3182373046875, -10.699462890625, -10.0806884765625, -9.4619140625, -8.8431396484375, -8.224365234375, -7.6055908203125, -6.98681640625, -6.3680419921875, -5.749267578125, -5.1304931640625, -4.51171875, -3.8929443359375, -3.274169921875, -2.6553955078125, -2.03662109375, -1.4178466796875, -0.799072265625, -0.1802978515625, 0.4384765625, 1.0572509765625, 1.676025390625, 2.2947998046875, 2.91357421875, 3.5323486328125, 4.151123046875, 4.7698974609375, 5.388671875, 6.0074462890625, 6.626220703125, 7.2449951171875, 7.86376953125, 8.4825439453125, 9.101318359375, 9.7200927734375, 10.3388671875, 10.9576416015625, 11.576416015625, 12.1951904296875, 12.81396484375, 13.4327392578125, 14.051513671875, 14.6702880859375, 15.2890625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 8.0, 2.0, 6.0, 9.0, 9.0, 18.0, 11.0, 30.0, 14.0, 19.0, 18.0, 29.0, 21.0, 29.0, 44.0, 40.0, 45.0, 46.0, 42.0, 38.0, 50.0, 47.0, 42.0, 39.0, 38.0, 40.0, 24.0, 30.0, 31.0, 30.0, 15.0, 19.0, 24.0, 7.0, 10.0, 13.0, 13.0, 17.0, 8.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.35676574707031, -41.15163040161133, -39.94649887084961, -38.741363525390625, -37.536231994628906, -36.33109664916992, -35.12596130371094, -33.92082977294922, -32.715694427490234, -31.510560989379883, -30.30542755126953, -29.100292205810547, -27.895158767700195, -26.690025329589844, -25.48488998413086, -24.279756546020508, -23.074623107910156, -21.869489669799805, -20.664356231689453, -19.45922088623047, -18.254087448120117, -17.048954010009766, -15.843819618225098, -14.63868522644043, -13.433551788330078, -12.228418350219727, -11.023283958435059, -9.81814956665039, -8.613016128540039, -7.407882213592529, -6.2027482986450195, -4.997613906860352, -3.79248046875, -2.5873465538024902, -1.3822126388549805, -0.1770787239074707, 1.028055191040039, 2.233189105987549, 3.4383230209350586, 4.643457412719727, 5.848590850830078, 7.053724765777588, 8.258858680725098, 9.463993072509766, 10.669126510620117, 11.874259948730469, 13.079394340515137, 14.284528732299805, 15.489662170410156, 16.694795608520508, 17.89992904663086, 19.105064392089844, 20.310197830200195, 21.515331268310547, 22.72046661376953, 23.925600051879883, 25.130733489990234, 26.335866928100586, 27.541000366210938, 28.746135711669922, 29.951269149780273, 31.156402587890625, 32.36153793334961, 33.566673278808594, 34.77180480957031]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 9.0, 10.0, 6.0, 9.0, 18.0, 14.0, 19.0, 19.0, 27.0, 24.0, 21.0, 31.0, 40.0, 43.0, 33.0, 37.0, 35.0, 50.0, 46.0, 44.0, 41.0, 52.0, 39.0, 43.0, 44.0, 33.0, 38.0, 17.0, 20.0, 26.0, 34.0, 13.0, 13.0, 9.0, 4.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.09488296508789, -48.514469146728516, -46.934051513671875, -45.3536376953125, -43.773223876953125, -42.19281005859375, -40.61239242553711, -39.031978607177734, -37.451560974121094, -35.87114715576172, -34.29072952270508, -32.7103157043457, -31.129901885986328, -29.54948616027832, -27.969070434570312, -26.388656616210938, -24.808242797851562, -23.227827072143555, -21.64741325378418, -20.066997528076172, -18.486583709716797, -16.90616798400879, -15.325752258300781, -13.74533748626709, -12.164922714233398, -10.584507942199707, -9.004093170166016, -7.423677444458008, -5.843262672424316, -4.262847900390625, -2.682432174682617, -1.1020174026489258, 0.47840118408203125, 2.0588161945343018, 3.6392312049865723, 5.219646453857422, 6.800061225891113, 8.380475997924805, 9.960891723632812, 11.541306495666504, 13.121721267700195, 14.702136039733887, 16.282550811767578, 17.862966537475586, 19.443382263183594, 21.02379608154297, 22.604211807250977, 24.184627532958984, 25.76504135131836, 27.345457077026367, 28.925870895385742, 30.50628662109375, 32.086700439453125, 33.6671142578125, 35.24753189086914, 36.827945709228516, 38.408363342285156, 39.98877716064453, 41.56919479370117, 43.14960861206055, 44.73002243041992, 46.31044006347656, 47.89085388183594, 49.47126770019531, 51.05168151855469]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 20.0, 33.0, 52.0, 78.0, 159.0, 273.0, 469.0, 808.0, 1449.0, 2442.0, 4201.0, 6991.0, 11636.0, 19365.0, 31985.0, 51671.0, 79749.0, 122200.0, 177952.0, 247537.0, 324403.0, 395459.0, 445380.0, 460655.0, 435512.0, 379588.0, 305412.0, 229574.0, 162483.0, 110470.0, 71894.0, 45331.0, 28126.0, 16993.0, 9999.0, 5799.0, 3399.0, 1992.0, 1178.0, 643.0, 396.0, 231.0, 127.0, 73.0, 42.0, 25.0, 17.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.53125, -32.5556640625, -31.580078125, -30.6044921875, -29.62890625, -28.6533203125, -27.677734375, -26.7021484375, -25.7265625, -24.7509765625, -23.775390625, -22.7998046875, -21.82421875, -20.8486328125, -19.873046875, -18.8974609375, -17.921875, -16.9462890625, -15.970703125, -14.9951171875, -14.01953125, -13.0439453125, -12.068359375, -11.0927734375, -10.1171875, -9.1416015625, -8.166015625, -7.1904296875, -6.21484375, -5.2392578125, -4.263671875, -3.2880859375, -2.3125, -1.3369140625, -0.361328125, 0.6142578125, 1.58984375, 2.5654296875, 3.541015625, 4.5166015625, 5.4921875, 6.4677734375, 7.443359375, 8.4189453125, 9.39453125, 10.3701171875, 11.345703125, 12.3212890625, 13.296875, 14.2724609375, 15.248046875, 16.2236328125, 17.19921875, 18.1748046875, 19.150390625, 20.1259765625, 21.1015625, 22.0771484375, 23.052734375, 24.0283203125, 25.00390625, 25.9794921875, 26.955078125, 27.9306640625, 28.90625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 11.0, 3.0, 8.0, 15.0, 20.0, 12.0, 26.0, 27.0, 24.0, 17.0, 30.0, 37.0, 46.0, 34.0, 33.0, 39.0, 38.0, 54.0, 34.0, 49.0, 45.0, 44.0, 42.0, 43.0, 45.0, 23.0, 29.0, 21.0, 19.0, 28.0, 22.0, 16.0, 7.0, 9.0, 3.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-40.78125, -39.50244140625, -38.2236328125, -36.94482421875, -35.666015625, -34.38720703125, -33.1083984375, -31.82958984375, -30.55078125, -29.27197265625, -27.9931640625, -26.71435546875, -25.435546875, -24.15673828125, -22.8779296875, -21.59912109375, -20.3203125, -19.04150390625, -17.7626953125, -16.48388671875, -15.205078125, -13.92626953125, -12.6474609375, -11.36865234375, -10.08984375, -8.81103515625, -7.5322265625, -6.25341796875, -4.974609375, -3.69580078125, -2.4169921875, -1.13818359375, 0.140625, 1.41943359375, 2.6982421875, 3.97705078125, 5.255859375, 6.53466796875, 7.8134765625, 9.09228515625, 10.37109375, 11.64990234375, 12.9287109375, 14.20751953125, 15.486328125, 16.76513671875, 18.0439453125, 19.32275390625, 20.6015625, 21.88037109375, 23.1591796875, 24.43798828125, 25.716796875, 26.99560546875, 28.2744140625, 29.55322265625, 30.83203125, 32.11083984375, 33.3896484375, 34.66845703125, 35.947265625, 37.22607421875, 38.5048828125, 39.78369140625, 41.0625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [4.0, 7.0, 8.0, 12.0, 34.0, 45.0, 90.0, 140.0, 256.0, 432.0, 754.0, 1303.0, 2116.0, 3577.0, 6053.0, 10041.0, 16344.0, 24990.0, 39221.0, 58100.0, 83248.0, 118065.0, 157940.0, 205644.0, 256419.0, 301539.0, 340671.0, 365591.0, 370981.0, 357343.0, 325959.0, 282034.0, 233603.0, 184038.0, 139390.0, 102106.0, 71640.0, 48410.0, 32287.0, 20739.0, 13100.0, 7971.0, 5018.0, 2994.0, 1693.0, 974.0, 577.0, 335.0, 212.0, 116.0, 48.0, 45.0, 19.0, 16.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -22.970458984375, -22.12841796875, -21.286376953125, -20.4443359375, -19.602294921875, -18.76025390625, -17.918212890625, -17.076171875, -16.234130859375, -15.39208984375, -14.550048828125, -13.7080078125, -12.865966796875, -12.02392578125, -11.181884765625, -10.33984375, -9.497802734375, -8.65576171875, -7.813720703125, -6.9716796875, -6.129638671875, -5.28759765625, -4.445556640625, -3.603515625, -2.761474609375, -1.91943359375, -1.077392578125, -0.2353515625, 0.606689453125, 1.44873046875, 2.290771484375, 3.1328125, 3.974853515625, 4.81689453125, 5.658935546875, 6.5009765625, 7.343017578125, 8.18505859375, 9.027099609375, 9.869140625, 10.711181640625, 11.55322265625, 12.395263671875, 13.2373046875, 14.079345703125, 14.92138671875, 15.763427734375, 16.60546875, 17.447509765625, 18.28955078125, 19.131591796875, 19.9736328125, 20.815673828125, 21.65771484375, 22.499755859375, 23.341796875, 24.183837890625, 25.02587890625, 25.867919921875, 26.7099609375, 27.552001953125, 28.39404296875, 29.236083984375, 30.078125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 6.0, 7.0, 13.0, 14.0, 16.0, 19.0, 23.0, 48.0, 42.0, 52.0, 60.0, 67.0, 91.0, 97.0, 111.0, 125.0, 143.0, 153.0, 163.0, 194.0, 155.0, 176.0, 211.0, 186.0, 187.0, 178.0, 175.0, 179.0, 172.0, 150.0, 135.0, 125.0, 118.0, 90.0, 86.0, 53.0, 59.0, 43.0, 37.0, 28.0, 19.0, 21.0, 11.0, 10.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-16.796875, -16.274658203125, -15.75244140625, -15.230224609375, -14.7080078125, -14.185791015625, -13.66357421875, -13.141357421875, -12.619140625, -12.096923828125, -11.57470703125, -11.052490234375, -10.5302734375, -10.008056640625, -9.48583984375, -8.963623046875, -8.44140625, -7.919189453125, -7.39697265625, -6.874755859375, -6.3525390625, -5.830322265625, -5.30810546875, -4.785888671875, -4.263671875, -3.741455078125, -3.21923828125, -2.697021484375, -2.1748046875, -1.652587890625, -1.13037109375, -0.608154296875, -0.0859375, 0.436279296875, 0.95849609375, 1.480712890625, 2.0029296875, 2.525146484375, 3.04736328125, 3.569580078125, 4.091796875, 4.614013671875, 5.13623046875, 5.658447265625, 6.1806640625, 6.702880859375, 7.22509765625, 7.747314453125, 8.26953125, 8.791748046875, 9.31396484375, 9.836181640625, 10.3583984375, 10.880615234375, 11.40283203125, 11.925048828125, 12.447265625, 12.969482421875, 13.49169921875, 14.013916015625, 14.5361328125, 15.058349609375, 15.58056640625, 16.102783203125, 16.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 7.0, 14.0, 13.0, 15.0, 11.0, 10.0, 15.0, 24.0, 17.0, 33.0, 26.0, 21.0, 31.0, 34.0, 27.0, 24.0, 46.0, 45.0, 39.0, 37.0, 33.0, 30.0, 39.0, 43.0, 37.0, 30.0, 35.0, 36.0, 32.0, 23.0, 26.0, 17.0, 14.0, 14.0, 19.0, 13.0, 15.0, 9.0, 12.0, 1.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4946403503418, -32.41445541381836, -31.334270477294922, -30.254085540771484, -29.173900604248047, -28.09371566772461, -27.013530731201172, -25.933345794677734, -24.853160858154297, -23.77297592163086, -22.692790985107422, -21.612606048583984, -20.532421112060547, -19.45223617553711, -18.372051239013672, -17.291866302490234, -16.211679458618164, -15.131494522094727, -14.051309585571289, -12.971124649047852, -11.890939712524414, -10.810754776000977, -9.730568885803223, -8.650383949279785, -7.570199012756348, -6.49001407623291, -5.409829139709473, -4.329643726348877, -3.2494587898254395, -2.169273853302002, -1.0890884399414062, -0.00890350341796875, 1.0712814331054688, 2.1514663696289062, 3.231651544570923, 4.3118367195129395, 5.392021656036377, 6.4722065925598145, 7.55239200592041, 8.632576942443848, 9.712761878967285, 10.792946815490723, 11.87313175201416, 12.953317642211914, 14.033502578735352, 15.113687515258789, 16.193872451782227, 17.274057388305664, 18.3542423248291, 19.43442726135254, 20.514612197875977, 21.594797134399414, 22.67498207092285, 23.75516700744629, 24.83535385131836, 25.915538787841797, 26.995723724365234, 28.075908660888672, 29.15609359741211, 30.236278533935547, 31.316463470458984, 32.39664840698242, 33.47683334350586, 34.5570182800293, 35.637203216552734]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 6.0, 15.0, 15.0, 18.0, 12.0, 19.0, 15.0, 26.0, 21.0, 29.0, 33.0, 48.0, 36.0, 44.0, 41.0, 47.0, 39.0, 47.0, 39.0, 41.0, 49.0, 41.0, 34.0, 36.0, 28.0, 28.0, 23.0, 28.0, 20.0, 20.0, 19.0, 14.0, 11.0, 7.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-52.02000045776367, -50.544715881347656, -49.06943130493164, -47.594146728515625, -46.118858337402344, -44.64357376098633, -43.16828918457031, -41.6930046081543, -40.21772003173828, -38.742435455322266, -37.26715087890625, -35.79186248779297, -34.31657791137695, -32.84129333496094, -31.366008758544922, -29.890724182128906, -28.415435791015625, -26.94015121459961, -25.46486473083496, -23.989580154418945, -22.514293670654297, -21.03900909423828, -19.563724517822266, -18.08843994140625, -16.6131534576416, -15.13786792755127, -13.662582397460938, -12.187297821044922, -10.71201229095459, -9.236726760864258, -7.761442184448242, -6.28615665435791, -4.8108673095703125, -3.3355820178985596, -1.8602967262268066, -0.3850116729736328, 1.0902738571166992, 2.5655593872070312, 4.040843963623047, 5.516129493713379, 6.991415023803711, 8.466700553894043, 9.941986083984375, 11.41727066040039, 12.892556190490723, 14.367841720581055, 15.84312629699707, 17.31841278076172, 18.793697357177734, 20.26898193359375, 21.7442684173584, 23.219552993774414, 24.694839477539062, 26.170124053955078, 27.645408630371094, 29.12069320678711, 30.595979690551758, 32.071266174316406, 33.54655075073242, 35.02183532714844, 36.49711990356445, 37.97240447998047, 39.44769287109375, 40.922977447509766, 42.39826202392578]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 17.0, 15.0, 25.0, 25.0, 35.0, 56.0, 69.0, 103.0, 148.0, 202.0, 298.0, 483.0, 741.0, 1151.0, 1826.0, 3044.0, 5216.0, 9217.0, 16658.0, 32133.0, 63663.0, 132863.0, 256294.0, 255940.0, 132806.0, 64416.0, 32004.0, 16638.0, 8970.0, 5310.0, 2984.0, 1780.0, 1145.0, 729.0, 508.0, 314.0, 212.0, 132.0, 110.0, 74.0, 44.0, 45.0, 26.0, 22.0, 16.0, 9.0, 4.0, 10.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0], "bins": [-13.53125, -13.1212158203125, -12.711181640625, -12.3011474609375, -11.89111328125, -11.4810791015625, -11.071044921875, -10.6610107421875, -10.2509765625, -9.8409423828125, -9.430908203125, -9.0208740234375, -8.61083984375, -8.2008056640625, -7.790771484375, -7.3807373046875, -6.970703125, -6.5606689453125, -6.150634765625, -5.7406005859375, -5.33056640625, -4.9205322265625, -4.510498046875, -4.1004638671875, -3.6904296875, -3.2803955078125, -2.870361328125, -2.4603271484375, -2.05029296875, -1.6402587890625, -1.230224609375, -0.8201904296875, -0.41015625, -0.0001220703125, 0.409912109375, 0.8199462890625, 1.22998046875, 1.6400146484375, 2.050048828125, 2.4600830078125, 2.8701171875, 3.2801513671875, 3.690185546875, 4.1002197265625, 4.51025390625, 4.9202880859375, 5.330322265625, 5.7403564453125, 6.150390625, 6.5604248046875, 6.970458984375, 7.3804931640625, 7.79052734375, 8.2005615234375, 8.610595703125, 9.0206298828125, 9.4306640625, 9.8406982421875, 10.250732421875, 10.6607666015625, 11.07080078125, 11.4808349609375, 11.890869140625, 12.3009033203125, 12.7109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 5.0, 15.0, 16.0, 18.0, 14.0, 20.0, 14.0, 25.0, 22.0, 27.0, 35.0, 44.0, 39.0, 46.0, 39.0, 48.0, 39.0, 46.0, 36.0, 43.0, 50.0, 39.0, 37.0, 35.0, 27.0, 28.0, 24.0, 27.0, 21.0, 19.0, 19.0, 14.0, 12.0, 6.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-51.8125, -50.33984375, -48.8671875, -47.39453125, -45.921875, -44.44921875, -42.9765625, -41.50390625, -40.03125, -38.55859375, -37.0859375, -35.61328125, -34.140625, -32.66796875, -31.1953125, -29.72265625, -28.25, -26.77734375, -25.3046875, -23.83203125, -22.359375, -20.88671875, -19.4140625, -17.94140625, -16.46875, -14.99609375, -13.5234375, -12.05078125, -10.578125, -9.10546875, -7.6328125, -6.16015625, -4.6875, -3.21484375, -1.7421875, -0.26953125, 1.203125, 2.67578125, 4.1484375, 5.62109375, 7.09375, 8.56640625, 10.0390625, 11.51171875, 12.984375, 14.45703125, 15.9296875, 17.40234375, 18.875, 20.34765625, 21.8203125, 23.29296875, 24.765625, 26.23828125, 27.7109375, 29.18359375, 30.65625, 32.12890625, 33.6015625, 35.07421875, 36.546875, 38.01953125, 39.4921875, 40.96484375, 42.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 7.0, 6.0, 3.0, 13.0, 16.0, 40.0, 34.0, 62.0, 62.0, 112.0, 155.0, 207.0, 280.0, 435.0, 684.0, 1036.0, 1649.0, 2880.0, 4917.0, 8804.0, 17840.0, 37461.0, 88649.0, 231709.0, 362143.0, 163909.0, 65295.0, 28643.0, 13664.0, 7168.0, 3984.0, 2406.0, 1409.0, 929.0, 567.0, 398.0, 299.0, 193.0, 133.0, 113.0, 65.0, 41.0, 42.0, 29.0, 21.0, 9.0, 11.0, 9.0, 4.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.984375, -10.6336669921875, -10.282958984375, -9.9322509765625, -9.58154296875, -9.2308349609375, -8.880126953125, -8.5294189453125, -8.1787109375, -7.8280029296875, -7.477294921875, -7.1265869140625, -6.77587890625, -6.4251708984375, -6.074462890625, -5.7237548828125, -5.373046875, -5.0223388671875, -4.671630859375, -4.3209228515625, -3.97021484375, -3.6195068359375, -3.268798828125, -2.9180908203125, -2.5673828125, -2.2166748046875, -1.865966796875, -1.5152587890625, -1.16455078125, -0.8138427734375, -0.463134765625, -0.1124267578125, 0.23828125, 0.5889892578125, 0.939697265625, 1.2904052734375, 1.64111328125, 1.9918212890625, 2.342529296875, 2.6932373046875, 3.0439453125, 3.3946533203125, 3.745361328125, 4.0960693359375, 4.44677734375, 4.7974853515625, 5.148193359375, 5.4989013671875, 5.849609375, 6.2003173828125, 6.551025390625, 6.9017333984375, 7.25244140625, 7.6031494140625, 7.953857421875, 8.3045654296875, 8.6552734375, 9.0059814453125, 9.356689453125, 9.7073974609375, 10.05810546875, 10.4088134765625, 10.759521484375, 11.1102294921875, 11.4609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 3.0, 7.0, 12.0, 15.0, 10.0, 18.0, 16.0, 26.0, 23.0, 25.0, 24.0, 25.0, 41.0, 32.0, 47.0, 39.0, 39.0, 42.0, 43.0, 50.0, 41.0, 42.0, 29.0, 48.0, 28.0, 39.0, 33.0, 34.0, 19.0, 18.0, 27.0, 17.0, 18.0, 18.0, 12.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.76171875, -29.7890625, -28.81640625, -27.84375, -26.87109375, -25.8984375, -24.92578125, -23.953125, -22.98046875, -22.0078125, -21.03515625, -20.0625, -19.08984375, -18.1171875, -17.14453125, -16.171875, -15.19921875, -14.2265625, -13.25390625, -12.28125, -11.30859375, -10.3359375, -9.36328125, -8.390625, -7.41796875, -6.4453125, -5.47265625, -4.5, -3.52734375, -2.5546875, -1.58203125, -0.609375, 0.36328125, 1.3359375, 2.30859375, 3.28125, 4.25390625, 5.2265625, 6.19921875, 7.171875, 8.14453125, 9.1171875, 10.08984375, 11.0625, 12.03515625, 13.0078125, 13.98046875, 14.953125, 15.92578125, 16.8984375, 17.87109375, 18.84375, 19.81640625, 20.7890625, 21.76171875, 22.734375, 23.70703125, 24.6796875, 25.65234375, 26.625, 27.59765625, 28.5703125, 29.54296875, 30.515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 7.0, 6.0, 5.0, 8.0, 9.0, 13.0, 18.0, 26.0, 35.0, 46.0, 60.0, 90.0, 97.0, 153.0, 229.0, 295.0, 480.0, 634.0, 1062.0, 1771.0, 2997.0, 5538.0, 12034.0, 31266.0, 112389.0, 538050.0, 251144.0, 53882.0, 18164.0, 8014.0, 3907.0, 2237.0, 1333.0, 774.0, 546.0, 366.0, 263.0, 151.0, 137.0, 86.0, 58.0, 58.0, 32.0, 21.0, 26.0, 11.0, 17.0, 8.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.92657470703125, -5.7203369140625, -5.51409912109375, -5.307861328125, -5.10162353515625, -4.8953857421875, -4.68914794921875, -4.48291015625, -4.27667236328125, -4.0704345703125, -3.86419677734375, -3.657958984375, -3.45172119140625, -3.2454833984375, -3.03924560546875, -2.8330078125, -2.62677001953125, -2.4205322265625, -2.21429443359375, -2.008056640625, -1.80181884765625, -1.5955810546875, -1.38934326171875, -1.18310546875, -0.97686767578125, -0.7706298828125, -0.56439208984375, -0.358154296875, -0.15191650390625, 0.0543212890625, 0.26055908203125, 0.466796875, 0.67303466796875, 0.8792724609375, 1.08551025390625, 1.291748046875, 1.49798583984375, 1.7042236328125, 1.91046142578125, 2.11669921875, 2.32293701171875, 2.5291748046875, 2.73541259765625, 2.941650390625, 3.14788818359375, 3.3541259765625, 3.56036376953125, 3.7666015625, 3.97283935546875, 4.1790771484375, 4.38531494140625, 4.591552734375, 4.79779052734375, 5.0040283203125, 5.21026611328125, 5.41650390625, 5.62274169921875, 5.8289794921875, 6.03521728515625, 6.241455078125, 6.44769287109375, 6.6539306640625, 6.86016845703125, 7.06640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 6.0, 6.0, 18.0, 19.0, 31.0, 52.0, 102.0, 129.0, 197.0, 141.0, 81.0, 56.0, 40.0, 20.0, 13.0, 16.0, 8.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009622573852539062, -0.0009327232837677002, -0.0009031891822814941, -0.0008736550807952881, -0.000844120979309082, -0.000814586877822876, -0.0007850527763366699, -0.0007555186748504639, -0.0007259845733642578, -0.0006964504718780518, -0.0006669163703918457, -0.0006373822689056396, -0.0006078481674194336, -0.0005783140659332275, -0.0005487799644470215, -0.0005192458629608154, -0.0004897117614746094, -0.0004601776599884033, -0.00043064355850219727, -0.0004011094570159912, -0.00037157535552978516, -0.0003420412540435791, -0.00031250715255737305, -0.000282973051071167, -0.00025343894958496094, -0.00022390484809875488, -0.00019437074661254883, -0.00016483664512634277, -0.00013530254364013672, -0.00010576844215393066, -7.623434066772461e-05, -4.6700239181518555e-05, -1.71661376953125e-05, 1.2367963790893555e-05, 4.190206527709961e-05, 7.143616676330566e-05, 0.00010097026824951172, 0.00013050436973571777, 0.00016003847122192383, 0.00018957257270812988, 0.00021910667419433594, 0.000248640775680542, 0.00027817487716674805, 0.0003077089786529541, 0.00033724308013916016, 0.0003667771816253662, 0.00039631128311157227, 0.0004258453845977783, 0.0004553794860839844, 0.00048491358757019043, 0.0005144476890563965, 0.0005439817905426025, 0.0005735158920288086, 0.0006030499935150146, 0.0006325840950012207, 0.0006621181964874268, 0.0006916522979736328, 0.0007211863994598389, 0.0007507205009460449, 0.000780254602432251, 0.000809788703918457, 0.0008393228054046631, 0.0008688569068908691, 0.0008983910083770752, 0.0009279251098632812]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 5.0, 15.0, 26.0, 35.0, 56.0, 62.0, 87.0, 136.0, 180.0, 288.0, 350.0, 557.0, 745.0, 1055.0, 1489.0, 2211.0, 3779.0, 6314.0, 12086.0, 25441.0, 63913.0, 213987.0, 455513.0, 161046.0, 51641.0, 21397.0, 10452.0, 5573.0, 3328.0, 2117.0, 1349.0, 951.0, 696.0, 440.0, 349.0, 257.0, 172.0, 135.0, 85.0, 77.0, 51.0, 35.0, 17.0, 15.0, 14.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.1171875, -11.718505859375, -11.31982421875, -10.921142578125, -10.5224609375, -10.123779296875, -9.72509765625, -9.326416015625, -8.927734375, -8.529052734375, -8.13037109375, -7.731689453125, -7.3330078125, -6.934326171875, -6.53564453125, -6.136962890625, -5.73828125, -5.339599609375, -4.94091796875, -4.542236328125, -4.1435546875, -3.744873046875, -3.34619140625, -2.947509765625, -2.548828125, -2.150146484375, -1.75146484375, -1.352783203125, -0.9541015625, -0.555419921875, -0.15673828125, 0.241943359375, 0.640625, 1.039306640625, 1.43798828125, 1.836669921875, 2.2353515625, 2.634033203125, 3.03271484375, 3.431396484375, 3.830078125, 4.228759765625, 4.62744140625, 5.026123046875, 5.4248046875, 5.823486328125, 6.22216796875, 6.620849609375, 7.01953125, 7.418212890625, 7.81689453125, 8.215576171875, 8.6142578125, 9.012939453125, 9.41162109375, 9.810302734375, 10.208984375, 10.607666015625, 11.00634765625, 11.405029296875, 11.8037109375, 12.202392578125, 12.60107421875, 12.999755859375, 13.3984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 3.0, 4.0, 7.0, 8.0, 2.0, 9.0, 8.0, 11.0, 13.0, 11.0, 11.0, 29.0, 22.0, 22.0, 41.0, 53.0, 66.0, 66.0, 61.0, 77.0, 63.0, 73.0, 70.0, 52.0, 30.0, 29.0, 25.0, 9.0, 13.0, 17.0, 19.0, 5.0, 13.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 11.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.92578125, -3.811553955078125, -3.69732666015625, -3.583099365234375, -3.4688720703125, -3.354644775390625, -3.24041748046875, -3.126190185546875, -3.011962890625, -2.897735595703125, -2.78350830078125, -2.669281005859375, -2.5550537109375, -2.440826416015625, -2.32659912109375, -2.212371826171875, -2.09814453125, -1.983917236328125, -1.86968994140625, -1.755462646484375, -1.6412353515625, -1.527008056640625, -1.41278076171875, -1.298553466796875, -1.184326171875, -1.070098876953125, -0.95587158203125, -0.841644287109375, -0.7274169921875, -0.613189697265625, -0.49896240234375, -0.384735107421875, -0.2705078125, -0.156280517578125, -0.04205322265625, 0.072174072265625, 0.1864013671875, 0.300628662109375, 0.41485595703125, 0.529083251953125, 0.643310546875, 0.757537841796875, 0.87176513671875, 0.985992431640625, 1.1002197265625, 1.214447021484375, 1.32867431640625, 1.442901611328125, 1.55712890625, 1.671356201171875, 1.78558349609375, 1.899810791015625, 2.0140380859375, 2.128265380859375, 2.24249267578125, 2.356719970703125, 2.470947265625, 2.585174560546875, 2.69940185546875, 2.813629150390625, 2.9278564453125, 3.042083740234375, 3.15631103515625, 3.270538330078125, 3.384765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 10.0, 9.0, 10.0, 13.0, 15.0, 11.0, 15.0, 23.0, 26.0, 24.0, 28.0, 34.0, 28.0, 31.0, 32.0, 39.0, 41.0, 47.0, 31.0, 35.0, 36.0, 36.0, 41.0, 40.0, 27.0, 39.0, 31.0, 31.0, 28.0, 22.0, 26.0, 14.0, 10.0, 20.0, 20.0, 12.0, 17.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.369598388671875, -32.26945495605469, -31.169309616088867, -30.06916618347168, -28.969022750854492, -27.868877410888672, -26.768733978271484, -25.668590545654297, -24.56844711303711, -23.468303680419922, -22.3681583404541, -21.268014907836914, -20.167871475219727, -19.067726135253906, -17.96758270263672, -16.86743927001953, -15.767293930053711, -14.667149543762207, -13.56700611114502, -12.466861724853516, -11.366718292236328, -10.266573905944824, -9.16642951965332, -8.066286087036133, -6.966141700744629, -5.865997791290283, -4.7658538818359375, -3.6657094955444336, -2.565565586090088, -1.4654216766357422, -0.3652772903442383, 0.7348666191101074, 1.8350105285644531, 2.935154438018799, 4.0352983474731445, 5.135442733764648, 6.235586643218994, 7.33573055267334, 8.435874938964844, 9.536018371582031, 10.636162757873535, 11.736307144165039, 12.836450576782227, 13.93659496307373, 15.036739349365234, 16.136882781982422, 17.23702621459961, 18.33717155456543, 19.437314987182617, 20.537458419799805, 21.637603759765625, 22.737747192382812, 23.837890625, 24.938034057617188, 26.038179397583008, 27.138322830200195, 28.238468170166016, 29.338611602783203, 30.438756942749023, 31.53890037536621, 32.63904571533203, 33.73918914794922, 34.839332580566406, 35.939476013183594, 37.03961944580078]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 12.0, 6.0, 14.0, 15.0, 13.0, 21.0, 11.0, 18.0, 17.0, 25.0, 23.0, 32.0, 38.0, 44.0, 41.0, 44.0, 46.0, 47.0, 29.0, 45.0, 46.0, 40.0, 50.0, 35.0, 47.0, 24.0, 30.0, 26.0, 30.0, 15.0, 25.0, 16.0, 18.0, 12.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-52.56937026977539, -51.05672073364258, -49.54407501220703, -48.03142547607422, -46.51877975463867, -45.00613021850586, -43.49348449707031, -41.9808349609375, -40.46818542480469, -38.955535888671875, -37.44289016723633, -35.930240631103516, -34.41759490966797, -32.904945373535156, -31.392297744750977, -29.879650115966797, -28.36700439453125, -26.85435676574707, -25.34170913696289, -23.829059600830078, -22.31641387939453, -20.80376434326172, -19.29111671447754, -17.77846908569336, -16.26582145690918, -14.753173828125, -13.24052619934082, -11.727877616882324, -10.215229988098145, -8.702582359313965, -7.189933776855469, -5.677286148071289, -4.164634704589844, -2.651986837387085, -1.1393389701843262, 0.3733091354370117, 1.8859567642211914, 3.398604393005371, 4.911252975463867, 6.423900604248047, 7.936548233032227, 9.449195861816406, 10.961843490600586, 12.474492073059082, 13.987139701843262, 15.499787330627441, 17.012435913085938, 18.525083541870117, 20.037731170654297, 21.550378799438477, 23.063026428222656, 24.57567596435547, 26.088321685791016, 27.600971221923828, 29.113618850708008, 30.626266479492188, 32.138916015625, 33.65156555175781, 35.16421127319336, 36.67686080932617, 38.18950653076172, 39.70215606689453, 41.214805603027344, 42.72745132446289, 44.24009704589844]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 13.0, 20.0, 30.0, 44.0, 66.0, 94.0, 140.0, 216.0, 360.0, 613.0, 960.0, 1345.0, 2131.0, 3342.0, 5103.0, 7731.0, 11534.0, 17028.0, 24119.0, 33391.0, 44848.0, 58499.0, 70977.0, 83463.0, 92156.0, 96307.0, 94684.0, 87267.0, 76152.0, 63028.0, 49516.0, 37028.0, 27187.0, 19437.0, 13333.0, 9067.0, 5967.0, 3883.0, 2659.0, 1722.0, 1085.0, 705.0, 466.0, 304.0, 176.0, 131.0, 81.0, 49.0, 38.0, 22.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 4.0], "bins": [-24.546875, -23.7958984375, -23.044921875, -22.2939453125, -21.54296875, -20.7919921875, -20.041015625, -19.2900390625, -18.5390625, -17.7880859375, -17.037109375, -16.2861328125, -15.53515625, -14.7841796875, -14.033203125, -13.2822265625, -12.53125, -11.7802734375, -11.029296875, -10.2783203125, -9.52734375, -8.7763671875, -8.025390625, -7.2744140625, -6.5234375, -5.7724609375, -5.021484375, -4.2705078125, -3.51953125, -2.7685546875, -2.017578125, -1.2666015625, -0.515625, 0.2353515625, 0.986328125, 1.7373046875, 2.48828125, 3.2392578125, 3.990234375, 4.7412109375, 5.4921875, 6.2431640625, 6.994140625, 7.7451171875, 8.49609375, 9.2470703125, 9.998046875, 10.7490234375, 11.5, 12.2509765625, 13.001953125, 13.7529296875, 14.50390625, 15.2548828125, 16.005859375, 16.7568359375, 17.5078125, 18.2587890625, 19.009765625, 19.7607421875, 20.51171875, 21.2626953125, 22.013671875, 22.7646484375, 23.515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 4.0, 9.0, 8.0, 13.0, 14.0, 17.0, 19.0, 13.0, 13.0, 21.0, 23.0, 24.0, 33.0, 40.0, 41.0, 38.0, 46.0, 48.0, 47.0, 28.0, 45.0, 47.0, 38.0, 50.0, 39.0, 43.0, 25.0, 30.0, 28.0, 28.0, 17.0, 21.0, 18.0, 18.0, 12.0, 12.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-51.5625, -50.07861328125, -48.5947265625, -47.11083984375, -45.626953125, -44.14306640625, -42.6591796875, -41.17529296875, -39.69140625, -38.20751953125, -36.7236328125, -35.23974609375, -33.755859375, -32.27197265625, -30.7880859375, -29.30419921875, -27.8203125, -26.33642578125, -24.8525390625, -23.36865234375, -21.884765625, -20.40087890625, -18.9169921875, -17.43310546875, -15.94921875, -14.46533203125, -12.9814453125, -11.49755859375, -10.013671875, -8.52978515625, -7.0458984375, -5.56201171875, -4.078125, -2.59423828125, -1.1103515625, 0.37353515625, 1.857421875, 3.34130859375, 4.8251953125, 6.30908203125, 7.79296875, 9.27685546875, 10.7607421875, 12.24462890625, 13.728515625, 15.21240234375, 16.6962890625, 18.18017578125, 19.6640625, 21.14794921875, 22.6318359375, 24.11572265625, 25.599609375, 27.08349609375, 28.5673828125, 30.05126953125, 31.53515625, 33.01904296875, 34.5029296875, 35.98681640625, 37.470703125, 38.95458984375, 40.4384765625, 41.92236328125, 43.40625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 5.0, 11.0, 12.0, 19.0, 26.0, 42.0, 75.0, 96.0, 150.0, 246.0, 371.0, 509.0, 821.0, 1323.0, 1903.0, 3090.0, 4640.0, 6965.0, 10384.0, 15330.0, 22003.0, 31308.0, 43148.0, 56815.0, 71519.0, 85760.0, 96288.0, 101611.0, 98551.0, 91167.0, 77879.0, 62893.0, 48430.0, 35642.0, 25698.0, 17940.0, 12187.0, 7975.0, 5469.0, 3556.0, 2372.0, 1508.0, 981.0, 654.0, 413.0, 243.0, 173.0, 113.0, 86.0, 55.0, 30.0, 30.0, 11.0, 16.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 4.0], "bins": [-24.59375, -23.792724609375, -22.99169921875, -22.190673828125, -21.3896484375, -20.588623046875, -19.78759765625, -18.986572265625, -18.185546875, -17.384521484375, -16.58349609375, -15.782470703125, -14.9814453125, -14.180419921875, -13.37939453125, -12.578369140625, -11.77734375, -10.976318359375, -10.17529296875, -9.374267578125, -8.5732421875, -7.772216796875, -6.97119140625, -6.170166015625, -5.369140625, -4.568115234375, -3.76708984375, -2.966064453125, -2.1650390625, -1.364013671875, -0.56298828125, 0.238037109375, 1.0390625, 1.840087890625, 2.64111328125, 3.442138671875, 4.2431640625, 5.044189453125, 5.84521484375, 6.646240234375, 7.447265625, 8.248291015625, 9.04931640625, 9.850341796875, 10.6513671875, 11.452392578125, 12.25341796875, 13.054443359375, 13.85546875, 14.656494140625, 15.45751953125, 16.258544921875, 17.0595703125, 17.860595703125, 18.66162109375, 19.462646484375, 20.263671875, 21.064697265625, 21.86572265625, 22.666748046875, 23.4677734375, 24.268798828125, 25.06982421875, 25.870849609375, 26.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 9.0, 13.0, 18.0, 19.0, 24.0, 20.0, 20.0, 24.0, 37.0, 25.0, 30.0, 36.0, 38.0, 27.0, 50.0, 51.0, 34.0, 41.0, 37.0, 42.0, 43.0, 24.0, 24.0, 38.0, 21.0, 36.0, 27.0, 17.0, 24.0, 23.0, 12.0, 14.0, 14.0, 11.0, 8.0, 7.0, 6.0, 7.0, 4.0, 2.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.734375, -27.878662109375, -27.02294921875, -26.167236328125, -25.3115234375, -24.455810546875, -23.60009765625, -22.744384765625, -21.888671875, -21.032958984375, -20.17724609375, -19.321533203125, -18.4658203125, -17.610107421875, -16.75439453125, -15.898681640625, -15.04296875, -14.187255859375, -13.33154296875, -12.475830078125, -11.6201171875, -10.764404296875, -9.90869140625, -9.052978515625, -8.197265625, -7.341552734375, -6.48583984375, -5.630126953125, -4.7744140625, -3.918701171875, -3.06298828125, -2.207275390625, -1.3515625, -0.495849609375, 0.35986328125, 1.215576171875, 2.0712890625, 2.927001953125, 3.78271484375, 4.638427734375, 5.494140625, 6.349853515625, 7.20556640625, 8.061279296875, 8.9169921875, 9.772705078125, 10.62841796875, 11.484130859375, 12.33984375, 13.195556640625, 14.05126953125, 14.906982421875, 15.7626953125, 16.618408203125, 17.47412109375, 18.329833984375, 19.185546875, 20.041259765625, 20.89697265625, 21.752685546875, 22.6083984375, 23.464111328125, 24.31982421875, 25.175537109375, 26.03125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 13.0, 16.0, 33.0, 39.0, 60.0, 99.0, 131.0, 187.0, 332.0, 460.0, 719.0, 1150.0, 1848.0, 2830.0, 4411.0, 6906.0, 10490.0, 16330.0, 24328.0, 35661.0, 50508.0, 68926.0, 86627.0, 102786.0, 111637.0, 111609.0, 101852.0, 86183.0, 67419.0, 50078.0, 35296.0, 24243.0, 16026.0, 10391.0, 6647.0, 4434.0, 2855.0, 1753.0, 1112.0, 755.0, 445.0, 316.0, 205.0, 130.0, 95.0, 52.0, 40.0, 31.0, 21.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0], "bins": [-10.8984375, -10.5679931640625, -10.237548828125, -9.9071044921875, -9.57666015625, -9.2462158203125, -8.915771484375, -8.5853271484375, -8.2548828125, -7.9244384765625, -7.593994140625, -7.2635498046875, -6.93310546875, -6.6026611328125, -6.272216796875, -5.9417724609375, -5.611328125, -5.2808837890625, -4.950439453125, -4.6199951171875, -4.28955078125, -3.9591064453125, -3.628662109375, -3.2982177734375, -2.9677734375, -2.6373291015625, -2.306884765625, -1.9764404296875, -1.64599609375, -1.3155517578125, -0.985107421875, -0.6546630859375, -0.32421875, 0.0062255859375, 0.336669921875, 0.6671142578125, 0.99755859375, 1.3280029296875, 1.658447265625, 1.9888916015625, 2.3193359375, 2.6497802734375, 2.980224609375, 3.3106689453125, 3.64111328125, 3.9715576171875, 4.302001953125, 4.6324462890625, 4.962890625, 5.2933349609375, 5.623779296875, 5.9542236328125, 6.28466796875, 6.6151123046875, 6.945556640625, 7.2760009765625, 7.6064453125, 7.9368896484375, 8.267333984375, 8.5977783203125, 8.92822265625, 9.2586669921875, 9.589111328125, 9.9195556640625, 10.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 10.0, 10.0, 13.0, 10.0, 14.0, 11.0, 16.0, 17.0, 22.0, 22.0, 34.0, 39.0, 30.0, 45.0, 42.0, 35.0, 36.0, 44.0, 35.0, 42.0, 44.0, 58.0, 45.0, 52.0, 25.0, 35.0, 28.0, 17.0, 26.0, 22.0, 30.0, 12.0, 11.0, 5.0, 10.0, 6.0, 5.0, 1.0, 8.0, 5.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0010328292846679688, -0.000998571515083313, -0.0009643137454986572, -0.0009300559759140015, -0.0008957982063293457, -0.0008615404367446899, -0.0008272826671600342, -0.0007930248975753784, -0.0007587671279907227, -0.0007245093584060669, -0.0006902515888214111, -0.0006559938192367554, -0.0006217360496520996, -0.0005874782800674438, -0.0005532205104827881, -0.0005189627408981323, -0.00048470497131347656, -0.0004504472017288208, -0.00041618943214416504, -0.0003819316625595093, -0.0003476738929748535, -0.00031341612339019775, -0.000279158353805542, -0.00024490058422088623, -0.00021064281463623047, -0.0001763850450515747, -0.00014212727546691895, -0.00010786950588226318, -7.361173629760742e-05, -3.935396671295166e-05, -5.0961971282958984e-06, 2.9161572456359863e-05, 6.341934204101562e-05, 9.767711162567139e-05, 0.00013193488121032715, 0.0001661926507949829, 0.00020045042037963867, 0.00023470818996429443, 0.0002689659595489502, 0.00030322372913360596, 0.0003374814987182617, 0.0003717392683029175, 0.00040599703788757324, 0.000440254807472229, 0.00047451257705688477, 0.0005087703466415405, 0.0005430281162261963, 0.000577285885810852, 0.0006115436553955078, 0.0006458014249801636, 0.0006800591945648193, 0.0007143169641494751, 0.0007485747337341309, 0.0007828325033187866, 0.0008170902729034424, 0.0008513480424880981, 0.0008856058120727539, 0.0009198635816574097, 0.0009541213512420654, 0.0009883791208267212, 0.001022636890411377, 0.0010568946599960327, 0.0010911524295806885, 0.0011254101991653442, 0.00115966796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 3.0, 4.0, 2.0, 15.0, 23.0, 24.0, 52.0, 70.0, 88.0, 146.0, 181.0, 289.0, 452.0, 609.0, 902.0, 1321.0, 2125.0, 3166.0, 4872.0, 7781.0, 11964.0, 18970.0, 29742.0, 44471.0, 64628.0, 87967.0, 110987.0, 125250.0, 125890.0, 113079.0, 91120.0, 67910.0, 46739.0, 31466.0, 20051.0, 12694.0, 8045.0, 5271.0, 3492.0, 2191.0, 1455.0, 991.0, 660.0, 475.0, 329.0, 176.0, 128.0, 83.0, 78.0, 54.0, 28.0, 15.0, 15.0, 7.0, 8.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.4453125, -12.0313720703125, -11.617431640625, -11.2034912109375, -10.78955078125, -10.3756103515625, -9.961669921875, -9.5477294921875, -9.1337890625, -8.7198486328125, -8.305908203125, -7.8919677734375, -7.47802734375, -7.0640869140625, -6.650146484375, -6.2362060546875, -5.822265625, -5.4083251953125, -4.994384765625, -4.5804443359375, -4.16650390625, -3.7525634765625, -3.338623046875, -2.9246826171875, -2.5107421875, -2.0968017578125, -1.682861328125, -1.2689208984375, -0.85498046875, -0.4410400390625, -0.027099609375, 0.3868408203125, 0.80078125, 1.2147216796875, 1.628662109375, 2.0426025390625, 2.45654296875, 2.8704833984375, 3.284423828125, 3.6983642578125, 4.1123046875, 4.5262451171875, 4.940185546875, 5.3541259765625, 5.76806640625, 6.1820068359375, 6.595947265625, 7.0098876953125, 7.423828125, 7.8377685546875, 8.251708984375, 8.6656494140625, 9.07958984375, 9.4935302734375, 9.907470703125, 10.3214111328125, 10.7353515625, 11.1492919921875, 11.563232421875, 11.9771728515625, 12.39111328125, 12.8050537109375, 13.218994140625, 13.6329345703125, 14.046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 22.0, 16.0, 30.0, 23.0, 35.0, 36.0, 46.0, 54.0, 47.0, 56.0, 52.0, 55.0, 64.0, 72.0, 54.0, 41.0, 39.0, 34.0, 29.0, 27.0, 23.0, 20.0, 16.0, 9.0, 10.0, 9.0, 14.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.66796875, -6.44219970703125, -6.2164306640625, -5.99066162109375, -5.764892578125, -5.53912353515625, -5.3133544921875, -5.08758544921875, -4.86181640625, -4.63604736328125, -4.4102783203125, -4.18450927734375, -3.958740234375, -3.73297119140625, -3.5072021484375, -3.28143310546875, -3.0556640625, -2.82989501953125, -2.6041259765625, -2.37835693359375, -2.152587890625, -1.92681884765625, -1.7010498046875, -1.47528076171875, -1.24951171875, -1.02374267578125, -0.7979736328125, -0.57220458984375, -0.346435546875, -0.12066650390625, 0.1051025390625, 0.33087158203125, 0.556640625, 0.78240966796875, 1.0081787109375, 1.23394775390625, 1.459716796875, 1.68548583984375, 1.9112548828125, 2.13702392578125, 2.36279296875, 2.58856201171875, 2.8143310546875, 3.04010009765625, 3.265869140625, 3.49163818359375, 3.7174072265625, 3.94317626953125, 4.1689453125, 4.39471435546875, 4.6204833984375, 4.84625244140625, 5.072021484375, 5.29779052734375, 5.5235595703125, 5.74932861328125, 5.97509765625, 6.20086669921875, 6.4266357421875, 6.65240478515625, 6.878173828125, 7.10394287109375, 7.3297119140625, 7.55548095703125, 7.78125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 11.0, 4.0, 12.0, 19.0, 16.0, 19.0, 21.0, 20.0, 27.0, 35.0, 31.0, 43.0, 29.0, 33.0, 31.0, 45.0, 41.0, 41.0, 44.0, 38.0, 41.0, 34.0, 40.0, 46.0, 33.0, 25.0, 27.0, 33.0, 17.0, 17.0, 21.0, 11.0, 16.0, 13.0, 12.0, 8.0, 5.0, 7.0, 3.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.53727340698242, -34.387535095214844, -33.237796783447266, -32.08805465698242, -30.938316345214844, -29.788578033447266, -28.638839721679688, -27.48910140991211, -26.3393611907959, -25.18962287902832, -24.03988265991211, -22.89014434814453, -21.740406036376953, -20.590665817260742, -19.440927505493164, -18.291187286376953, -17.141448974609375, -15.99170970916748, -14.841970443725586, -13.692232131958008, -12.542492866516113, -11.392753601074219, -10.24301528930664, -9.093276023864746, -7.943536758422852, -6.793797492980957, -5.644058704376221, -4.494319915771484, -3.34458065032959, -2.1948413848876953, -1.045102596282959, 0.10463619232177734, 1.2543792724609375, 2.404118299484253, 3.5538573265075684, 4.703596115112305, 5.853335380554199, 7.003074645996094, 8.152812957763672, 9.302552223205566, 10.452291488647461, 11.602030754089355, 12.75177001953125, 13.901508331298828, 15.051247596740723, 16.200986862182617, 17.350725173950195, 18.500465393066406, 19.650203704833984, 20.799942016601562, 21.949682235717773, 23.09942054748535, 24.249160766601562, 25.39889907836914, 26.54863739013672, 27.698375701904297, 28.848115921020508, 29.997854232788086, 31.147594451904297, 32.297332763671875, 33.44707107543945, 34.59680938720703, 35.746551513671875, 36.89628982543945, 38.04602813720703]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 9.0, 6.0, 10.0, 15.0, 11.0, 12.0, 29.0, 24.0, 18.0, 19.0, 30.0, 32.0, 29.0, 29.0, 51.0, 44.0, 45.0, 43.0, 51.0, 43.0, 41.0, 36.0, 42.0, 25.0, 37.0, 27.0, 30.0, 32.0, 26.0, 10.0, 29.0, 14.0, 18.0, 20.0, 14.0, 11.0, 6.0, 4.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.662818908691406, -49.15444564819336, -47.64607620239258, -46.13770294189453, -44.62933349609375, -43.1209602355957, -41.612586975097656, -40.104217529296875, -38.59584426879883, -37.08747100830078, -35.5791015625, -34.07072830200195, -32.562355041503906, -31.053985595703125, -29.545612335205078, -28.037240982055664, -26.52886962890625, -25.020498275756836, -23.512126922607422, -22.003753662109375, -20.49538230895996, -18.987010955810547, -17.4786376953125, -15.970266342163086, -14.461894989013672, -12.953523635864258, -11.445151329040527, -9.936779022216797, -8.428407669067383, -6.9200358390808105, -5.411664009094238, -3.903291702270508, -2.3949241638183594, -0.8865523338317871, 0.6218194961547852, 2.1301913261413574, 3.6385631561279297, 5.146934986114502, 6.655306816101074, 8.163679122924805, 9.672050476074219, 11.180421829223633, 12.688794136047363, 14.197166442871094, 15.705537796020508, 17.213909149169922, 18.72228240966797, 20.230653762817383, 21.739025115966797, 23.24739646911621, 24.755767822265625, 26.264141082763672, 27.772512435913086, 29.2808837890625, 30.789257049560547, 32.297630310058594, 33.805999755859375, 35.31437301635742, 36.8227424621582, 38.33111572265625, 39.83948516845703, 41.34785842895508, 42.856231689453125, 44.364601135253906, 45.87297439575195]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 15.0, 30.0, 42.0, 74.0, 125.0, 196.0, 347.0, 606.0, 948.0, 1619.0, 2576.0, 4380.0, 7201.0, 11299.0, 18708.0, 29525.0, 45605.0, 68730.0, 101924.0, 144254.0, 198000.0, 258755.0, 321488.0, 373846.0, 407998.0, 415193.0, 392778.0, 348731.0, 288558.0, 226329.0, 169217.0, 120433.0, 83739.0, 55553.0, 36205.0, 22950.0, 14216.0, 8770.0, 5481.0, 3236.0, 1852.0, 1182.0, 658.0, 379.0, 238.0, 122.0, 82.0, 43.0, 20.0, 13.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.103515625, -26.20703125, -25.310546875, -24.4140625, -23.517578125, -22.62109375, -21.724609375, -20.828125, -19.931640625, -19.03515625, -18.138671875, -17.2421875, -16.345703125, -15.44921875, -14.552734375, -13.65625, -12.759765625, -11.86328125, -10.966796875, -10.0703125, -9.173828125, -8.27734375, -7.380859375, -6.484375, -5.587890625, -4.69140625, -3.794921875, -2.8984375, -2.001953125, -1.10546875, -0.208984375, 0.6875, 1.583984375, 2.48046875, 3.376953125, 4.2734375, 5.169921875, 6.06640625, 6.962890625, 7.859375, 8.755859375, 9.65234375, 10.548828125, 11.4453125, 12.341796875, 13.23828125, 14.134765625, 15.03125, 15.927734375, 16.82421875, 17.720703125, 18.6171875, 19.513671875, 20.41015625, 21.306640625, 22.203125, 23.099609375, 23.99609375, 24.892578125, 25.7890625, 26.685546875, 27.58203125, 28.478515625, 29.375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 2.0, 3.0, 14.0, 4.0, 11.0, 15.0, 10.0, 15.0, 26.0, 24.0, 21.0, 18.0, 35.0, 29.0, 30.0, 35.0, 44.0, 38.0, 48.0, 51.0, 45.0, 39.0, 44.0, 33.0, 35.0, 30.0, 36.0, 39.0, 19.0, 35.0, 17.0, 17.0, 27.0, 18.0, 15.0, 20.0, 17.0, 10.0, 5.0, 4.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.9375, -40.68701171875, -39.4365234375, -38.18603515625, -36.935546875, -35.68505859375, -34.4345703125, -33.18408203125, -31.93359375, -30.68310546875, -29.4326171875, -28.18212890625, -26.931640625, -25.68115234375, -24.4306640625, -23.18017578125, -21.9296875, -20.67919921875, -19.4287109375, -18.17822265625, -16.927734375, -15.67724609375, -14.4267578125, -13.17626953125, -11.92578125, -10.67529296875, -9.4248046875, -8.17431640625, -6.923828125, -5.67333984375, -4.4228515625, -3.17236328125, -1.921875, -0.67138671875, 0.5791015625, 1.82958984375, 3.080078125, 4.33056640625, 5.5810546875, 6.83154296875, 8.08203125, 9.33251953125, 10.5830078125, 11.83349609375, 13.083984375, 14.33447265625, 15.5849609375, 16.83544921875, 18.0859375, 19.33642578125, 20.5869140625, 21.83740234375, 23.087890625, 24.33837890625, 25.5888671875, 26.83935546875, 28.08984375, 29.34033203125, 30.5908203125, 31.84130859375, 33.091796875, 34.34228515625, 35.5927734375, 36.84326171875, 38.09375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 9.0, 11.0, 26.0, 35.0, 66.0, 110.0, 188.0, 394.0, 595.0, 1007.0, 1699.0, 2881.0, 4666.0, 7516.0, 11817.0, 18901.0, 28009.0, 41984.0, 60360.0, 85415.0, 116305.0, 154867.0, 196223.0, 240090.0, 281656.0, 318345.0, 342013.0, 348847.0, 341479.0, 318216.0, 284817.0, 242966.0, 197815.0, 156626.0, 117820.0, 86702.0, 61330.0, 42729.0, 28986.0, 18860.0, 12024.0, 7702.0, 4805.0, 2889.0, 1887.0, 1057.0, 638.0, 382.0, 223.0, 129.0, 88.0, 41.0, 26.0, 10.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -24.044921875, -23.23046875, -22.416015625, -21.6015625, -20.787109375, -19.97265625, -19.158203125, -18.34375, -17.529296875, -16.71484375, -15.900390625, -15.0859375, -14.271484375, -13.45703125, -12.642578125, -11.828125, -11.013671875, -10.19921875, -9.384765625, -8.5703125, -7.755859375, -6.94140625, -6.126953125, -5.3125, -4.498046875, -3.68359375, -2.869140625, -2.0546875, -1.240234375, -0.42578125, 0.388671875, 1.203125, 2.017578125, 2.83203125, 3.646484375, 4.4609375, 5.275390625, 6.08984375, 6.904296875, 7.71875, 8.533203125, 9.34765625, 10.162109375, 10.9765625, 11.791015625, 12.60546875, 13.419921875, 14.234375, 15.048828125, 15.86328125, 16.677734375, 17.4921875, 18.306640625, 19.12109375, 19.935546875, 20.75, 21.564453125, 22.37890625, 23.193359375, 24.0078125, 24.822265625, 25.63671875, 26.451171875, 27.265625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 10.0, 7.0, 12.0, 13.0, 20.0, 34.0, 37.0, 50.0, 64.0, 62.0, 65.0, 68.0, 87.0, 91.0, 137.0, 134.0, 144.0, 146.0, 155.0, 176.0, 169.0, 191.0, 182.0, 205.0, 205.0, 173.0, 161.0, 151.0, 132.0, 153.0, 101.0, 107.0, 96.0, 90.0, 79.0, 71.0, 54.0, 44.0, 35.0, 31.0, 37.0, 24.0, 26.0, 11.0, 13.0, 8.0, 1.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.3077392578125, -14.795166015625, -14.2825927734375, -13.77001953125, -13.2574462890625, -12.744873046875, -12.2322998046875, -11.7197265625, -11.2071533203125, -10.694580078125, -10.1820068359375, -9.66943359375, -9.1568603515625, -8.644287109375, -8.1317138671875, -7.619140625, -7.1065673828125, -6.593994140625, -6.0814208984375, -5.56884765625, -5.0562744140625, -4.543701171875, -4.0311279296875, -3.5185546875, -3.0059814453125, -2.493408203125, -1.9808349609375, -1.46826171875, -0.9556884765625, -0.443115234375, 0.0694580078125, 0.58203125, 1.0946044921875, 1.607177734375, 2.1197509765625, 2.63232421875, 3.1448974609375, 3.657470703125, 4.1700439453125, 4.6826171875, 5.1951904296875, 5.707763671875, 6.2203369140625, 6.73291015625, 7.2454833984375, 7.758056640625, 8.2706298828125, 8.783203125, 9.2957763671875, 9.808349609375, 10.3209228515625, 10.83349609375, 11.3460693359375, 11.858642578125, 12.3712158203125, 12.8837890625, 13.3963623046875, 13.908935546875, 14.4215087890625, 14.93408203125, 15.4466552734375, 15.959228515625, 16.4718017578125, 16.984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 6.0, 10.0, 9.0, 8.0, 23.0, 14.0, 13.0, 20.0, 17.0, 32.0, 27.0, 28.0, 27.0, 24.0, 39.0, 35.0, 40.0, 35.0, 22.0, 50.0, 30.0, 41.0, 41.0, 30.0, 32.0, 34.0, 43.0, 30.0, 30.0, 23.0, 29.0, 16.0, 24.0, 17.0, 9.0, 14.0, 9.0, 13.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-38.281551361083984, -37.16537094116211, -36.0491943359375, -34.933013916015625, -33.81683349609375, -32.70065689086914, -31.584476470947266, -30.468297958374023, -29.35211944580078, -28.23594093322754, -27.119762420654297, -26.003582000732422, -24.88740348815918, -23.771224975585938, -22.655044555664062, -21.53886604309082, -20.422687530517578, -19.306509017944336, -18.190330505371094, -17.07415008544922, -15.957971572875977, -14.841793060302734, -13.725613594055176, -12.609434127807617, -11.493255615234375, -10.377077102661133, -9.260897636413574, -8.144718170166016, -7.028539657592773, -5.912360668182373, -4.796181678771973, -3.6800026893615723, -2.563823699951172, -1.4476447105407715, -0.3314657211303711, 0.7847132682800293, 1.9008922576904297, 3.01707124710083, 4.1332502365112305, 5.249429225921631, 6.365608215332031, 7.481787204742432, 8.597966194152832, 9.71414566040039, 10.830324172973633, 11.946502685546875, 13.062682151794434, 14.178861618041992, 15.295040130615234, 16.411218643188477, 17.52739715576172, 18.643577575683594, 19.759756088256836, 20.875934600830078, 21.992115020751953, 23.108293533325195, 24.224472045898438, 25.34065055847168, 26.456829071044922, 27.573009490966797, 28.68918800354004, 29.80536651611328, 30.921546936035156, 32.037723541259766, 33.15390396118164]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 2.0, 7.0, 15.0, 9.0, 8.0, 14.0, 22.0, 17.0, 18.0, 19.0, 20.0, 21.0, 32.0, 43.0, 31.0, 25.0, 30.0, 27.0, 29.0, 56.0, 34.0, 46.0, 31.0, 37.0, 37.0, 37.0, 29.0, 45.0, 28.0, 23.0, 27.0, 25.0, 22.0, 20.0, 16.0, 11.0, 8.0, 10.0, 14.0, 10.0, 12.0, 6.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-45.38016128540039, -44.0014762878418, -42.62278747558594, -41.244102478027344, -39.86541748046875, -38.486732482910156, -37.1080436706543, -35.7293586730957, -34.35067367553711, -32.971988677978516, -31.59330177307129, -30.214614868164062, -28.83592987060547, -27.457242965698242, -26.078556060791016, -24.699871063232422, -23.321184158325195, -21.94249725341797, -20.563812255859375, -19.18512535095215, -17.806440353393555, -16.427753448486328, -15.049067497253418, -13.670381546020508, -12.291695594787598, -10.913009643554688, -9.534323692321777, -8.155637741088867, -6.776951313018799, -5.398265361785889, -4.01957893371582, -2.64089298248291, -1.26220703125, 0.11647903919219971, 1.4951651096343994, 2.8738512992858887, 4.252537250518799, 5.631223201751709, 7.009909629821777, 8.388595581054688, 9.767281532287598, 11.145967483520508, 12.524653434753418, 13.903339385986328, 15.282026290893555, 16.66071128845215, 18.039398193359375, 19.41808319091797, 20.796770095825195, 22.175457000732422, 23.554141998291016, 24.932828903198242, 26.311513900756836, 27.690200805664062, 29.068885803222656, 30.447572708129883, 31.82625961303711, 33.2049446105957, 34.58363342285156, 35.962318420410156, 37.34100341796875, 38.719688415527344, 40.0983772277832, 41.4770622253418, 42.85574722290039]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 12.0, 27.0, 38.0, 40.0, 61.0, 79.0, 113.0, 147.0, 225.0, 273.0, 416.0, 589.0, 867.0, 1324.0, 2123.0, 3520.0, 6730.0, 13630.0, 29721.0, 68946.0, 162849.0, 308153.0, 246269.0, 112023.0, 46850.0, 20456.0, 9810.0, 5073.0, 2827.0, 1713.0, 1096.0, 736.0, 493.0, 361.0, 263.0, 186.0, 126.0, 106.0, 83.0, 43.0, 38.0, 33.0, 19.0, 11.0, 12.0, 4.0, 6.0, 2.0, 8.0, 2.0, 5.0], "bins": [-12.8203125, -12.45166015625, -12.0830078125, -11.71435546875, -11.345703125, -10.97705078125, -10.6083984375, -10.23974609375, -9.87109375, -9.50244140625, -9.1337890625, -8.76513671875, -8.396484375, -8.02783203125, -7.6591796875, -7.29052734375, -6.921875, -6.55322265625, -6.1845703125, -5.81591796875, -5.447265625, -5.07861328125, -4.7099609375, -4.34130859375, -3.97265625, -3.60400390625, -3.2353515625, -2.86669921875, -2.498046875, -2.12939453125, -1.7607421875, -1.39208984375, -1.0234375, -0.65478515625, -0.2861328125, 0.08251953125, 0.451171875, 0.81982421875, 1.1884765625, 1.55712890625, 1.92578125, 2.29443359375, 2.6630859375, 3.03173828125, 3.400390625, 3.76904296875, 4.1376953125, 4.50634765625, 4.875, 5.24365234375, 5.6123046875, 5.98095703125, 6.349609375, 6.71826171875, 7.0869140625, 7.45556640625, 7.82421875, 8.19287109375, 8.5615234375, 8.93017578125, 9.298828125, 9.66748046875, 10.0361328125, 10.40478515625, 10.7734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 2.0, 6.0, 15.0, 9.0, 9.0, 14.0, 21.0, 16.0, 19.0, 18.0, 22.0, 19.0, 33.0, 44.0, 30.0, 25.0, 27.0, 31.0, 29.0, 52.0, 37.0, 43.0, 34.0, 36.0, 37.0, 39.0, 28.0, 46.0, 27.0, 19.0, 31.0, 25.0, 21.0, 21.0, 17.0, 10.0, 9.0, 10.0, 15.0, 9.0, 12.0, 5.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-45.59375, -44.21533203125, -42.8369140625, -41.45849609375, -40.080078125, -38.70166015625, -37.3232421875, -35.94482421875, -34.56640625, -33.18798828125, -31.8095703125, -30.43115234375, -29.052734375, -27.67431640625, -26.2958984375, -24.91748046875, -23.5390625, -22.16064453125, -20.7822265625, -19.40380859375, -18.025390625, -16.64697265625, -15.2685546875, -13.89013671875, -12.51171875, -11.13330078125, -9.7548828125, -8.37646484375, -6.998046875, -5.61962890625, -4.2412109375, -2.86279296875, -1.484375, -0.10595703125, 1.2724609375, 2.65087890625, 4.029296875, 5.40771484375, 6.7861328125, 8.16455078125, 9.54296875, 10.92138671875, 12.2998046875, 13.67822265625, 15.056640625, 16.43505859375, 17.8134765625, 19.19189453125, 20.5703125, 21.94873046875, 23.3271484375, 24.70556640625, 26.083984375, 27.46240234375, 28.8408203125, 30.21923828125, 31.59765625, 32.97607421875, 34.3544921875, 35.73291015625, 37.111328125, 38.48974609375, 39.8681640625, 41.24658203125, 42.625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 17.0, 20.0, 21.0, 33.0, 38.0, 76.0, 87.0, 93.0, 155.0, 231.0, 337.0, 476.0, 738.0, 1177.0, 2060.0, 3393.0, 6316.0, 12086.0, 24590.0, 55012.0, 134868.0, 326912.0, 279388.0, 109334.0, 45898.0, 21083.0, 10434.0, 5541.0, 3051.0, 1760.0, 1118.0, 699.0, 472.0, 326.0, 227.0, 130.0, 93.0, 66.0, 52.0, 40.0, 26.0, 19.0, 15.0, 10.0, 11.0, 11.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6953125, -8.413818359375, -8.13232421875, -7.850830078125, -7.5693359375, -7.287841796875, -7.00634765625, -6.724853515625, -6.443359375, -6.161865234375, -5.88037109375, -5.598876953125, -5.3173828125, -5.035888671875, -4.75439453125, -4.472900390625, -4.19140625, -3.909912109375, -3.62841796875, -3.346923828125, -3.0654296875, -2.783935546875, -2.50244140625, -2.220947265625, -1.939453125, -1.657958984375, -1.37646484375, -1.094970703125, -0.8134765625, -0.531982421875, -0.25048828125, 0.031005859375, 0.3125, 0.593994140625, 0.87548828125, 1.156982421875, 1.4384765625, 1.719970703125, 2.00146484375, 2.282958984375, 2.564453125, 2.845947265625, 3.12744140625, 3.408935546875, 3.6904296875, 3.971923828125, 4.25341796875, 4.534912109375, 4.81640625, 5.097900390625, 5.37939453125, 5.660888671875, 5.9423828125, 6.223876953125, 6.50537109375, 6.786865234375, 7.068359375, 7.349853515625, 7.63134765625, 7.912841796875, 8.1943359375, 8.475830078125, 8.75732421875, 9.038818359375, 9.3203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 9.0, 10.0, 16.0, 14.0, 17.0, 15.0, 28.0, 22.0, 23.0, 28.0, 34.0, 30.0, 39.0, 41.0, 48.0, 42.0, 33.0, 38.0, 40.0, 46.0, 44.0, 39.0, 32.0, 32.0, 34.0, 36.0, 13.0, 24.0, 33.0, 14.0, 25.0, 19.0, 9.0, 21.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.796875, -30.747802734375, -29.69873046875, -28.649658203125, -27.6005859375, -26.551513671875, -25.50244140625, -24.453369140625, -23.404296875, -22.355224609375, -21.30615234375, -20.257080078125, -19.2080078125, -18.158935546875, -17.10986328125, -16.060791015625, -15.01171875, -13.962646484375, -12.91357421875, -11.864501953125, -10.8154296875, -9.766357421875, -8.71728515625, -7.668212890625, -6.619140625, -5.570068359375, -4.52099609375, -3.471923828125, -2.4228515625, -1.373779296875, -0.32470703125, 0.724365234375, 1.7734375, 2.822509765625, 3.87158203125, 4.920654296875, 5.9697265625, 7.018798828125, 8.06787109375, 9.116943359375, 10.166015625, 11.215087890625, 12.26416015625, 13.313232421875, 14.3623046875, 15.411376953125, 16.46044921875, 17.509521484375, 18.55859375, 19.607666015625, 20.65673828125, 21.705810546875, 22.7548828125, 23.803955078125, 24.85302734375, 25.902099609375, 26.951171875, 28.000244140625, 29.04931640625, 30.098388671875, 31.1474609375, 32.196533203125, 33.24560546875, 34.294677734375, 35.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 4.0, 9.0, 9.0, 9.0, 23.0, 17.0, 36.0, 70.0, 79.0, 130.0, 186.0, 343.0, 602.0, 1150.0, 2371.0, 5555.0, 14941.0, 56270.0, 380187.0, 486548.0, 70994.0, 17230.0, 5951.0, 2709.0, 1326.0, 701.0, 434.0, 249.0, 165.0, 86.0, 53.0, 42.0, 31.0, 20.0, 7.0, 6.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76953125, -4.60546875, -4.44140625, -4.27734375, -4.11328125, -3.94921875, -3.78515625, -3.62109375, -3.45703125, -3.29296875, -3.12890625, -2.96484375, -2.80078125, -2.63671875, -2.47265625, -2.30859375, -2.14453125, -1.98046875, -1.81640625, -1.65234375, -1.48828125, -1.32421875, -1.16015625, -0.99609375, -0.83203125, -0.66796875, -0.50390625, -0.33984375, -0.17578125, -0.01171875, 0.15234375, 0.31640625, 0.48046875, 0.64453125, 0.80859375, 0.97265625, 1.13671875, 1.30078125, 1.46484375, 1.62890625, 1.79296875, 1.95703125, 2.12109375, 2.28515625, 2.44921875, 2.61328125, 2.77734375, 2.94140625, 3.10546875, 3.26953125, 3.43359375, 3.59765625, 3.76171875, 3.92578125, 4.08984375, 4.25390625, 4.41796875, 4.58203125, 4.74609375, 4.91015625, 5.07421875, 5.23828125, 5.40234375, 5.56640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 10.0, 17.0, 20.0, 26.0, 37.0, 25.0, 41.0, 55.0, 60.0, 70.0, 80.0, 83.0, 66.0, 59.0, 63.0, 59.0, 45.0, 30.0, 36.0, 27.0, 20.0, 8.0, 9.0, 7.0, 10.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.0002518482506275177, -0.00024405866861343384, -0.00023626908659934998, -0.0002284795045852661, -0.00022068992257118225, -0.0002129003405570984, -0.00020511075854301453, -0.00019732117652893066, -0.0001895315945148468, -0.00018174201250076294, -0.00017395243048667908, -0.00016616284847259521, -0.00015837326645851135, -0.0001505836844444275, -0.00014279410243034363, -0.00013500452041625977, -0.0001272149384021759, -0.00011942535638809204, -0.00011163577437400818, -0.00010384619235992432, -9.605661034584045e-05, -8.826702833175659e-05, -8.047744631767273e-05, -7.268786430358887e-05, -6.4898282289505e-05, -5.710870027542114e-05, -4.931911826133728e-05, -4.152953624725342e-05, -3.3739954233169556e-05, -2.5950372219085693e-05, -1.816079020500183e-05, -1.0371208190917969e-05, -2.5816261768341064e-06, 5.207955837249756e-06, 1.2997537851333618e-05, 2.078711986541748e-05, 2.8576701879501343e-05, 3.6366283893585205e-05, 4.415586590766907e-05, 5.194544792175293e-05, 5.973502993583679e-05, 6.752461194992065e-05, 7.531419396400452e-05, 8.310377597808838e-05, 9.089335799217224e-05, 9.86829400062561e-05, 0.00010647252202033997, 0.00011426210403442383, 0.00012205168604850769, 0.00012984126806259155, 0.00013763085007667542, 0.00014542043209075928, 0.00015321001410484314, 0.000160999596118927, 0.00016878917813301086, 0.00017657876014709473, 0.0001843683421611786, 0.00019215792417526245, 0.0001999475061893463, 0.00020773708820343018, 0.00021552667021751404, 0.0002233162522315979, 0.00023110583424568176, 0.00023889541625976562]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 3.0, 9.0, 17.0, 18.0, 26.0, 36.0, 41.0, 74.0, 85.0, 121.0, 176.0, 287.0, 360.0, 553.0, 828.0, 1193.0, 1776.0, 2534.0, 3926.0, 6110.0, 9329.0, 15193.0, 25213.0, 43955.0, 76882.0, 136448.0, 214896.0, 205784.0, 126831.0, 71509.0, 40745.0, 23392.0, 14110.0, 9019.0, 5679.0, 3687.0, 2428.0, 1663.0, 1069.0, 773.0, 556.0, 373.0, 253.0, 180.0, 133.0, 75.0, 56.0, 46.0, 30.0, 25.0, 17.0, 16.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.521484375, -3.403839111328125, -3.28619384765625, -3.168548583984375, -3.0509033203125, -2.933258056640625, -2.81561279296875, -2.697967529296875, -2.580322265625, -2.462677001953125, -2.34503173828125, -2.227386474609375, -2.1097412109375, -1.992095947265625, -1.87445068359375, -1.756805419921875, -1.63916015625, -1.521514892578125, -1.40386962890625, -1.286224365234375, -1.1685791015625, -1.050933837890625, -0.93328857421875, -0.815643310546875, -0.697998046875, -0.580352783203125, -0.46270751953125, -0.345062255859375, -0.2274169921875, -0.109771728515625, 0.00787353515625, 0.125518798828125, 0.2431640625, 0.360809326171875, 0.47845458984375, 0.596099853515625, 0.7137451171875, 0.831390380859375, 0.94903564453125, 1.066680908203125, 1.184326171875, 1.301971435546875, 1.41961669921875, 1.537261962890625, 1.6549072265625, 1.772552490234375, 1.89019775390625, 2.007843017578125, 2.12548828125, 2.243133544921875, 2.36077880859375, 2.478424072265625, 2.5960693359375, 2.713714599609375, 2.83135986328125, 2.949005126953125, 3.066650390625, 3.184295654296875, 3.30194091796875, 3.419586181640625, 3.5372314453125, 3.654876708984375, 3.77252197265625, 3.890167236328125, 4.0078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 4.0, 3.0, 10.0, 8.0, 10.0, 10.0, 15.0, 17.0, 14.0, 14.0, 21.0, 24.0, 36.0, 25.0, 37.0, 41.0, 41.0, 53.0, 42.0, 66.0, 70.0, 51.0, 52.0, 48.0, 39.0, 35.0, 26.0, 20.0, 22.0, 21.0, 20.0, 20.0, 10.0, 8.0, 9.0, 11.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 3.0], "bins": [-1.841796875, -1.7885589599609375, -1.735321044921875, -1.6820831298828125, -1.62884521484375, -1.5756072998046875, -1.522369384765625, -1.4691314697265625, -1.4158935546875, -1.3626556396484375, -1.309417724609375, -1.2561798095703125, -1.20294189453125, -1.1497039794921875, -1.096466064453125, -1.0432281494140625, -0.989990234375, -0.9367523193359375, -0.883514404296875, -0.8302764892578125, -0.77703857421875, -0.7238006591796875, -0.670562744140625, -0.6173248291015625, -0.5640869140625, -0.5108489990234375, -0.457611083984375, -0.4043731689453125, -0.35113525390625, -0.2978973388671875, -0.244659423828125, -0.1914215087890625, -0.13818359375, -0.0849456787109375, -0.031707763671875, 0.0215301513671875, 0.07476806640625, 0.1280059814453125, 0.181243896484375, 0.2344818115234375, 0.2877197265625, 0.3409576416015625, 0.394195556640625, 0.4474334716796875, 0.50067138671875, 0.5539093017578125, 0.607147216796875, 0.6603851318359375, 0.713623046875, 0.7668609619140625, 0.820098876953125, 0.8733367919921875, 0.92657470703125, 0.9798126220703125, 1.033050537109375, 1.0862884521484375, 1.1395263671875, 1.1927642822265625, 1.246002197265625, 1.2992401123046875, 1.35247802734375, 1.4057159423828125, 1.458953857421875, 1.5121917724609375, 1.5654296875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 2.0, 4.0, 9.0, 13.0, 9.0, 25.0, 5.0, 23.0, 22.0, 19.0, 25.0, 30.0, 24.0, 33.0, 34.0, 24.0, 30.0, 36.0, 41.0, 28.0, 41.0, 35.0, 38.0, 42.0, 33.0, 27.0, 33.0, 44.0, 32.0, 26.0, 30.0, 21.0, 21.0, 22.0, 14.0, 14.0, 9.0, 12.0, 11.0, 17.0, 8.0, 1.0, 5.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-37.31319046020508, -36.2159423828125, -35.11869812011719, -34.02145004272461, -32.92420196533203, -31.826955795288086, -30.72970962524414, -29.632461547851562, -28.535215377807617, -27.437969207763672, -26.340721130371094, -25.24347496032715, -24.146228790283203, -23.048980712890625, -21.95173454284668, -20.854488372802734, -19.757240295410156, -18.65999412536621, -17.562746047973633, -16.465499877929688, -15.368252754211426, -14.271005630493164, -13.173759460449219, -12.076512336730957, -10.979265213012695, -9.882018089294434, -8.784770965576172, -7.687524795532227, -6.590277671813965, -5.493030548095703, -4.3957839012146, -3.298537254333496, -2.2012939453125, -1.1040470600128174, -0.006800174713134766, 1.0904467105865479, 2.1876935958862305, 3.284940719604492, 4.382187366485596, 5.479434013366699, 6.576681137084961, 7.673928260803223, 8.771175384521484, 9.86842155456543, 10.965668678283691, 12.062915802001953, 13.160161972045898, 14.25740909576416, 15.354656219482422, 16.451902389526367, 17.549150466918945, 18.64639663696289, 19.74364471435547, 20.840890884399414, 21.93813705444336, 23.035385131835938, 24.132631301879883, 25.229877471923828, 26.327125549316406, 27.42437171936035, 28.521617889404297, 29.618865966796875, 30.71611213684082, 31.813358306884766, 32.910606384277344]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 7.0, 13.0, 11.0, 11.0, 11.0, 14.0, 22.0, 17.0, 21.0, 19.0, 21.0, 28.0, 36.0, 36.0, 32.0, 23.0, 31.0, 39.0, 38.0, 41.0, 36.0, 43.0, 33.0, 43.0, 28.0, 45.0, 21.0, 41.0, 18.0, 35.0, 23.0, 25.0, 23.0, 13.0, 11.0, 11.0, 8.0, 13.0, 10.0, 8.0, 10.0, 7.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-46.150108337402344, -44.76209259033203, -43.37407684326172, -41.986061096191406, -40.598045349121094, -39.21002960205078, -37.82201385498047, -36.433998107910156, -35.045982360839844, -33.65796661376953, -32.26995086669922, -30.881935119628906, -29.493919372558594, -28.10590362548828, -26.717885971069336, -25.329870223999023, -23.941852569580078, -22.553836822509766, -21.165821075439453, -19.77780532836914, -18.389789581298828, -17.001773834228516, -15.61375617980957, -14.225740432739258, -12.837724685668945, -11.449708938598633, -10.06169319152832, -8.673676490783691, -7.285660743713379, -5.897644996643066, -4.5096282958984375, -3.121612548828125, -1.7335968017578125, -0.3455808162689209, 1.0424351692199707, 2.4304513931274414, 3.818467140197754, 5.206482887268066, 6.594499588012695, 7.982515335083008, 9.37053108215332, 10.758546829223633, 12.146562576293945, 13.534579277038574, 14.922595024108887, 16.310611724853516, 17.698627471923828, 19.08664321899414, 20.474658966064453, 21.862674713134766, 23.250690460205078, 24.63870620727539, 26.026721954345703, 27.414737701416016, 28.80275535583496, 30.190771102905273, 31.578786849975586, 32.96680450439453, 34.354820251464844, 35.742835998535156, 37.13085174560547, 38.51886749267578, 39.906883239746094, 41.294898986816406, 42.68291473388672]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 10.0, 10.0, 17.0, 18.0, 32.0, 40.0, 101.0, 119.0, 206.0, 329.0, 502.0, 843.0, 1276.0, 1904.0, 2999.0, 4473.0, 6883.0, 10142.0, 14381.0, 20720.0, 28239.0, 38555.0, 50250.0, 62855.0, 75240.0, 86270.0, 92459.0, 93423.0, 89856.0, 81058.0, 70250.0, 56895.0, 44638.0, 33871.0, 24841.0, 17780.0, 12408.0, 8305.0, 5667.0, 3731.0, 2415.0, 1608.0, 1068.0, 671.0, 443.0, 284.0, 167.0, 106.0, 74.0, 39.0, 34.0, 16.0, 12.0, 8.0, 6.0, 7.0, 1.0, 5.0], "bins": [-24.453125, -23.71826171875, -22.9833984375, -22.24853515625, -21.513671875, -20.77880859375, -20.0439453125, -19.30908203125, -18.57421875, -17.83935546875, -17.1044921875, -16.36962890625, -15.634765625, -14.89990234375, -14.1650390625, -13.43017578125, -12.6953125, -11.96044921875, -11.2255859375, -10.49072265625, -9.755859375, -9.02099609375, -8.2861328125, -7.55126953125, -6.81640625, -6.08154296875, -5.3466796875, -4.61181640625, -3.876953125, -3.14208984375, -2.4072265625, -1.67236328125, -0.9375, -0.20263671875, 0.5322265625, 1.26708984375, 2.001953125, 2.73681640625, 3.4716796875, 4.20654296875, 4.94140625, 5.67626953125, 6.4111328125, 7.14599609375, 7.880859375, 8.61572265625, 9.3505859375, 10.08544921875, 10.8203125, 11.55517578125, 12.2900390625, 13.02490234375, 13.759765625, 14.49462890625, 15.2294921875, 15.96435546875, 16.69921875, 17.43408203125, 18.1689453125, 18.90380859375, 19.638671875, 20.37353515625, 21.1083984375, 21.84326171875, 22.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 13.0, 9.0, 11.0, 15.0, 22.0, 19.0, 20.0, 21.0, 16.0, 35.0, 33.0, 38.0, 30.0, 24.0, 28.0, 40.0, 41.0, 42.0, 35.0, 42.0, 32.0, 44.0, 30.0, 44.0, 25.0, 34.0, 22.0, 36.0, 22.0, 21.0, 23.0, 14.0, 11.0, 12.0, 7.0, 16.0, 6.0, 9.0, 10.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-45.28125, -43.9150390625, -42.548828125, -41.1826171875, -39.81640625, -38.4501953125, -37.083984375, -35.7177734375, -34.3515625, -32.9853515625, -31.619140625, -30.2529296875, -28.88671875, -27.5205078125, -26.154296875, -24.7880859375, -23.421875, -22.0556640625, -20.689453125, -19.3232421875, -17.95703125, -16.5908203125, -15.224609375, -13.8583984375, -12.4921875, -11.1259765625, -9.759765625, -8.3935546875, -7.02734375, -5.6611328125, -4.294921875, -2.9287109375, -1.5625, -0.1962890625, 1.169921875, 2.5361328125, 3.90234375, 5.2685546875, 6.634765625, 8.0009765625, 9.3671875, 10.7333984375, 12.099609375, 13.4658203125, 14.83203125, 16.1982421875, 17.564453125, 18.9306640625, 20.296875, 21.6630859375, 23.029296875, 24.3955078125, 25.76171875, 27.1279296875, 28.494140625, 29.8603515625, 31.2265625, 32.5927734375, 33.958984375, 35.3251953125, 36.69140625, 38.0576171875, 39.423828125, 40.7900390625, 42.15625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 10.0, 12.0, 14.0, 23.0, 46.0, 73.0, 97.0, 171.0, 228.0, 379.0, 633.0, 1007.0, 1525.0, 2508.0, 4007.0, 6161.0, 9637.0, 14749.0, 22343.0, 32021.0, 45591.0, 61586.0, 78560.0, 94532.0, 104498.0, 108002.0, 103158.0, 91658.0, 75627.0, 58039.0, 42598.0, 30345.0, 20630.0, 13656.0, 8924.0, 5711.0, 3717.0, 2236.0, 1448.0, 867.0, 567.0, 376.0, 193.0, 137.0, 92.0, 67.0, 34.0, 31.0, 12.0, 9.0, 9.0, 2.0, 5.0, 0.0, 2.0], "bins": [-29.390625, -28.536376953125, -27.68212890625, -26.827880859375, -25.9736328125, -25.119384765625, -24.26513671875, -23.410888671875, -22.556640625, -21.702392578125, -20.84814453125, -19.993896484375, -19.1396484375, -18.285400390625, -17.43115234375, -16.576904296875, -15.72265625, -14.868408203125, -14.01416015625, -13.159912109375, -12.3056640625, -11.451416015625, -10.59716796875, -9.742919921875, -8.888671875, -8.034423828125, -7.18017578125, -6.325927734375, -5.4716796875, -4.617431640625, -3.76318359375, -2.908935546875, -2.0546875, -1.200439453125, -0.34619140625, 0.508056640625, 1.3623046875, 2.216552734375, 3.07080078125, 3.925048828125, 4.779296875, 5.633544921875, 6.48779296875, 7.342041015625, 8.1962890625, 9.050537109375, 9.90478515625, 10.759033203125, 11.61328125, 12.467529296875, 13.32177734375, 14.176025390625, 15.0302734375, 15.884521484375, 16.73876953125, 17.593017578125, 18.447265625, 19.301513671875, 20.15576171875, 21.010009765625, 21.8642578125, 22.718505859375, 23.57275390625, 24.427001953125, 25.28125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 9.0, 5.0, 11.0, 16.0, 19.0, 28.0, 20.0, 23.0, 29.0, 31.0, 33.0, 31.0, 38.0, 44.0, 38.0, 32.0, 39.0, 50.0, 28.0, 44.0, 37.0, 36.0, 52.0, 33.0, 23.0, 21.0, 33.0, 28.0, 22.0, 24.0, 22.0, 15.0, 14.0, 8.0, 11.0, 9.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.28125, -29.32568359375, -28.3701171875, -27.41455078125, -26.458984375, -25.50341796875, -24.5478515625, -23.59228515625, -22.63671875, -21.68115234375, -20.7255859375, -19.77001953125, -18.814453125, -17.85888671875, -16.9033203125, -15.94775390625, -14.9921875, -14.03662109375, -13.0810546875, -12.12548828125, -11.169921875, -10.21435546875, -9.2587890625, -8.30322265625, -7.34765625, -6.39208984375, -5.4365234375, -4.48095703125, -3.525390625, -2.56982421875, -1.6142578125, -0.65869140625, 0.296875, 1.25244140625, 2.2080078125, 3.16357421875, 4.119140625, 5.07470703125, 6.0302734375, 6.98583984375, 7.94140625, 8.89697265625, 9.8525390625, 10.80810546875, 11.763671875, 12.71923828125, 13.6748046875, 14.63037109375, 15.5859375, 16.54150390625, 17.4970703125, 18.45263671875, 19.408203125, 20.36376953125, 21.3193359375, 22.27490234375, 23.23046875, 24.18603515625, 25.1416015625, 26.09716796875, 27.052734375, 28.00830078125, 28.9638671875, 29.91943359375, 30.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 28.0, 41.0, 46.0, 65.0, 108.0, 193.0, 278.0, 413.0, 749.0, 1132.0, 1757.0, 2922.0, 4686.0, 7664.0, 12040.0, 19385.0, 30161.0, 45635.0, 65517.0, 87804.0, 108702.0, 122515.0, 123231.0, 111860.0, 92782.0, 69525.0, 49674.0, 33076.0, 21135.0, 13552.0, 8363.0, 5148.0, 3205.0, 1919.0, 1178.0, 791.0, 483.0, 293.0, 183.0, 123.0, 75.0, 39.0, 28.0, 18.0, 11.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.484375, -12.095458984375, -11.70654296875, -11.317626953125, -10.9287109375, -10.539794921875, -10.15087890625, -9.761962890625, -9.373046875, -8.984130859375, -8.59521484375, -8.206298828125, -7.8173828125, -7.428466796875, -7.03955078125, -6.650634765625, -6.26171875, -5.872802734375, -5.48388671875, -5.094970703125, -4.7060546875, -4.317138671875, -3.92822265625, -3.539306640625, -3.150390625, -2.761474609375, -2.37255859375, -1.983642578125, -1.5947265625, -1.205810546875, -0.81689453125, -0.427978515625, -0.0390625, 0.349853515625, 0.73876953125, 1.127685546875, 1.5166015625, 1.905517578125, 2.29443359375, 2.683349609375, 3.072265625, 3.461181640625, 3.85009765625, 4.239013671875, 4.6279296875, 5.016845703125, 5.40576171875, 5.794677734375, 6.18359375, 6.572509765625, 6.96142578125, 7.350341796875, 7.7392578125, 8.128173828125, 8.51708984375, 8.906005859375, 9.294921875, 9.683837890625, 10.07275390625, 10.461669921875, 10.8505859375, 11.239501953125, 11.62841796875, 12.017333984375, 12.40625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 4.0, 7.0, 11.0, 9.0, 17.0, 15.0, 23.0, 22.0, 29.0, 28.0, 42.0, 37.0, 27.0, 33.0, 50.0, 37.0, 40.0, 40.0, 46.0, 46.0, 47.0, 42.0, 46.0, 40.0, 26.0, 28.0, 22.0, 36.0, 26.0, 22.0, 16.0, 14.0, 11.0, 9.0, 7.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001125335693359375, -0.0010876953601837158, -0.0010500550270080566, -0.0010124146938323975, -0.0009747743606567383, -0.0009371340274810791, -0.0008994936943054199, -0.0008618533611297607, -0.0008242130279541016, -0.0007865726947784424, -0.0007489323616027832, -0.000711292028427124, -0.0006736516952514648, -0.0006360113620758057, -0.0005983710289001465, -0.0005607306957244873, -0.0005230903625488281, -0.00048545002937316895, -0.00044780969619750977, -0.0004101693630218506, -0.0003725290298461914, -0.0003348886966705322, -0.00029724836349487305, -0.00025960803031921387, -0.0002219676971435547, -0.0001843273639678955, -0.00014668703079223633, -0.00010904669761657715, -7.140636444091797e-05, -3.376603126525879e-05, 3.874301910400391e-06, 4.151463508605957e-05, 7.915496826171875e-05, 0.00011679530143737793, 0.0001544356346130371, 0.0001920759677886963, 0.00022971630096435547, 0.00026735663414001465, 0.00030499696731567383, 0.000342637300491333, 0.0003802776336669922, 0.00041791796684265137, 0.00045555830001831055, 0.0004931986331939697, 0.0005308389663696289, 0.0005684792995452881, 0.0006061196327209473, 0.0006437599658966064, 0.0006814002990722656, 0.0007190406322479248, 0.000756680965423584, 0.0007943212985992432, 0.0008319616317749023, 0.0008696019649505615, 0.0009072422981262207, 0.0009448826313018799, 0.000982522964477539, 0.0010201632976531982, 0.0010578036308288574, 0.0010954439640045166, 0.0011330842971801758, 0.001170724630355835, 0.0012083649635314941, 0.0012460052967071533, 0.0012836456298828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 9.0, 12.0, 16.0, 20.0, 26.0, 37.0, 61.0, 118.0, 153.0, 237.0, 436.0, 681.0, 1151.0, 1884.0, 3186.0, 5336.0, 9351.0, 15946.0, 27196.0, 44833.0, 71453.0, 104184.0, 135104.0, 150816.0, 143993.0, 116267.0, 82626.0, 53363.0, 32900.0, 19612.0, 11210.0, 6721.0, 3852.0, 2236.0, 1365.0, 808.0, 528.0, 305.0, 185.0, 133.0, 78.0, 45.0, 33.0, 19.0, 15.0, 10.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.578125, -14.051513671875, -13.52490234375, -12.998291015625, -12.4716796875, -11.945068359375, -11.41845703125, -10.891845703125, -10.365234375, -9.838623046875, -9.31201171875, -8.785400390625, -8.2587890625, -7.732177734375, -7.20556640625, -6.678955078125, -6.15234375, -5.625732421875, -5.09912109375, -4.572509765625, -4.0458984375, -3.519287109375, -2.99267578125, -2.466064453125, -1.939453125, -1.412841796875, -0.88623046875, -0.359619140625, 0.1669921875, 0.693603515625, 1.22021484375, 1.746826171875, 2.2734375, 2.800048828125, 3.32666015625, 3.853271484375, 4.3798828125, 4.906494140625, 5.43310546875, 5.959716796875, 6.486328125, 7.012939453125, 7.53955078125, 8.066162109375, 8.5927734375, 9.119384765625, 9.64599609375, 10.172607421875, 10.69921875, 11.225830078125, 11.75244140625, 12.279052734375, 12.8056640625, 13.332275390625, 13.85888671875, 14.385498046875, 14.912109375, 15.438720703125, 15.96533203125, 16.491943359375, 17.0185546875, 17.545166015625, 18.07177734375, 18.598388671875, 19.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 9.0, 6.0, 10.0, 6.0, 12.0, 12.0, 12.0, 18.0, 29.0, 33.0, 28.0, 40.0, 44.0, 52.0, 63.0, 70.0, 64.0, 64.0, 51.0, 46.0, 56.0, 57.0, 42.0, 27.0, 20.0, 27.0, 17.0, 13.0, 10.0, 9.0, 13.0, 5.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.625, -9.3443603515625, -9.063720703125, -8.7830810546875, -8.50244140625, -8.2218017578125, -7.941162109375, -7.6605224609375, -7.3798828125, -7.0992431640625, -6.818603515625, -6.5379638671875, -6.25732421875, -5.9766845703125, -5.696044921875, -5.4154052734375, -5.134765625, -4.8541259765625, -4.573486328125, -4.2928466796875, -4.01220703125, -3.7315673828125, -3.450927734375, -3.1702880859375, -2.8896484375, -2.6090087890625, -2.328369140625, -2.0477294921875, -1.76708984375, -1.4864501953125, -1.205810546875, -0.9251708984375, -0.64453125, -0.3638916015625, -0.083251953125, 0.1973876953125, 0.47802734375, 0.7586669921875, 1.039306640625, 1.3199462890625, 1.6005859375, 1.8812255859375, 2.161865234375, 2.4425048828125, 2.72314453125, 3.0037841796875, 3.284423828125, 3.5650634765625, 3.845703125, 4.1263427734375, 4.406982421875, 4.6876220703125, 4.96826171875, 5.2489013671875, 5.529541015625, 5.8101806640625, 6.0908203125, 6.3714599609375, 6.652099609375, 6.9327392578125, 7.21337890625, 7.4940185546875, 7.774658203125, 8.0552978515625, 8.3359375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 9.0, 10.0, 11.0, 18.0, 12.0, 13.0, 15.0, 19.0, 24.0, 32.0, 27.0, 27.0, 35.0, 25.0, 28.0, 43.0, 39.0, 39.0, 31.0, 40.0, 35.0, 47.0, 40.0, 42.0, 34.0, 39.0, 23.0, 25.0, 31.0, 27.0, 20.0, 19.0, 18.0, 16.0, 12.0, 12.0, 6.0, 6.0, 7.0, 8.0, 5.0, 4.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-40.16423797607422, -39.02663803100586, -37.8890380859375, -36.75143814086914, -35.61383819580078, -34.47623825073242, -33.33863830566406, -32.20103454589844, -31.06343650817871, -29.92583656311035, -28.788236618041992, -27.650636672973633, -26.51303482055664, -25.37543487548828, -24.237834930419922, -23.100234985351562, -21.962635040283203, -20.825035095214844, -19.687435150146484, -18.549835205078125, -17.412235260009766, -16.274635314941406, -15.137033462524414, -13.999433517456055, -12.861833572387695, -11.724233627319336, -10.586633682250977, -9.4490327835083, -8.311432838439941, -7.173832893371582, -6.0362324714660645, -4.898632049560547, -3.761035919189453, -2.6234357357025146, -1.4858355522155762, -0.3482353687286377, 0.7893648147583008, 1.9269647598266602, 3.0645651817321777, 4.202165603637695, 5.339765548706055, 6.477365493774414, 7.614965915679932, 8.75256633758545, 9.890166282653809, 11.027766227722168, 12.165367126464844, 13.302967071533203, 14.440567016601562, 15.578166961669922, 16.71576690673828, 17.85336685180664, 18.990966796875, 20.12856674194336, 21.26616859436035, 22.40376853942871, 23.54136848449707, 24.67896842956543, 25.81656837463379, 26.95416831970215, 28.09177017211914, 29.2293701171875, 30.36697006225586, 31.50457000732422, 32.64216995239258]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 16.0, 6.0, 11.0, 12.0, 15.0, 16.0, 17.0, 25.0, 18.0, 36.0, 24.0, 32.0, 30.0, 43.0, 40.0, 41.0, 39.0, 32.0, 35.0, 29.0, 39.0, 38.0, 34.0, 32.0, 38.0, 26.0, 35.0, 34.0, 21.0, 25.0, 21.0, 23.0, 18.0, 11.0, 16.0, 13.0, 7.0, 7.0, 7.0, 8.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.95582580566406, -39.48414993286133, -38.01247787475586, -36.540802001953125, -35.069129943847656, -33.59745407104492, -32.12577819824219, -30.654104232788086, -29.182430267333984, -27.710756301879883, -26.23908233642578, -24.767406463623047, -23.295732498168945, -21.824058532714844, -20.35238265991211, -18.880708694458008, -17.409034729003906, -15.937360763549805, -14.465685844421387, -12.994010925292969, -11.522336959838867, -10.050662994384766, -8.578988075256348, -7.10731315612793, -5.635639190673828, -4.163964748382568, -2.6922903060913086, -1.2206158638000488, 0.25105857849121094, 1.7227330207824707, 3.1944074630737305, 4.666082382202148, 6.137760162353516, 7.609434604644775, 9.081109046936035, 10.552783966064453, 12.024457931518555, 13.496131896972656, 14.967806816101074, 16.439481735229492, 17.911155700683594, 19.382829666137695, 20.854503631591797, 22.32617950439453, 23.797853469848633, 25.269527435302734, 26.74120330810547, 28.21287727355957, 29.684551239013672, 31.156225204467773, 32.627899169921875, 34.09957504272461, 35.571250915527344, 37.04292297363281, 38.51459884643555, 39.98627471923828, 41.45794677734375, 42.929622650146484, 44.40129470825195, 45.87297058105469, 47.344642639160156, 48.81631851196289, 50.287994384765625, 51.759666442871094, 53.23134231567383]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 10.0, 18.0, 33.0, 52.0, 119.0, 192.0, 364.0, 687.0, 1085.0, 2015.0, 3581.0, 5995.0, 10215.0, 17136.0, 27630.0, 43883.0, 68905.0, 102949.0, 149058.0, 206406.0, 271871.0, 336925.0, 389016.0, 422898.0, 425441.0, 397648.0, 346329.0, 282141.0, 216983.0, 157815.0, 110128.0, 73519.0, 47714.0, 30028.0, 18640.0, 11075.0, 6508.0, 3984.0, 2235.0, 1297.0, 781.0, 421.0, 259.0, 140.0, 71.0, 45.0, 23.0, 12.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -28.111572265625, -27.14501953125, -26.178466796875, -25.2119140625, -24.245361328125, -23.27880859375, -22.312255859375, -21.345703125, -20.379150390625, -19.41259765625, -18.446044921875, -17.4794921875, -16.512939453125, -15.54638671875, -14.579833984375, -13.61328125, -12.646728515625, -11.68017578125, -10.713623046875, -9.7470703125, -8.780517578125, -7.81396484375, -6.847412109375, -5.880859375, -4.914306640625, -3.94775390625, -2.981201171875, -2.0146484375, -1.048095703125, -0.08154296875, 0.885009765625, 1.8515625, 2.818115234375, 3.78466796875, 4.751220703125, 5.7177734375, 6.684326171875, 7.65087890625, 8.617431640625, 9.583984375, 10.550537109375, 11.51708984375, 12.483642578125, 13.4501953125, 14.416748046875, 15.38330078125, 16.349853515625, 17.31640625, 18.282958984375, 19.24951171875, 20.216064453125, 21.1826171875, 22.149169921875, 23.11572265625, 24.082275390625, 25.048828125, 26.015380859375, 26.98193359375, 27.948486328125, 28.9150390625, 29.881591796875, 30.84814453125, 31.814697265625, 32.78125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 6.0, 3.0, 4.0, 6.0, 8.0, 14.0, 5.0, 11.0, 20.0, 16.0, 12.0, 19.0, 26.0, 25.0, 29.0, 29.0, 34.0, 33.0, 39.0, 46.0, 37.0, 38.0, 30.0, 35.0, 34.0, 42.0, 34.0, 37.0, 36.0, 26.0, 35.0, 39.0, 25.0, 22.0, 24.0, 19.0, 20.0, 18.0, 14.0, 11.0, 7.0, 6.0, 9.0, 8.0, 3.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.34375, -33.091796875, -31.83984375, -30.587890625, -29.3359375, -28.083984375, -26.83203125, -25.580078125, -24.328125, -23.076171875, -21.82421875, -20.572265625, -19.3203125, -18.068359375, -16.81640625, -15.564453125, -14.3125, -13.060546875, -11.80859375, -10.556640625, -9.3046875, -8.052734375, -6.80078125, -5.548828125, -4.296875, -3.044921875, -1.79296875, -0.541015625, 0.7109375, 1.962890625, 3.21484375, 4.466796875, 5.71875, 6.970703125, 8.22265625, 9.474609375, 10.7265625, 11.978515625, 13.23046875, 14.482421875, 15.734375, 16.986328125, 18.23828125, 19.490234375, 20.7421875, 21.994140625, 23.24609375, 24.498046875, 25.75, 27.001953125, 28.25390625, 29.505859375, 30.7578125, 32.009765625, 33.26171875, 34.513671875, 35.765625, 37.017578125, 38.26953125, 39.521484375, 40.7734375, 42.025390625, 43.27734375, 44.529296875, 45.78125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 12.0, 14.0, 38.0, 49.0, 105.0, 180.0, 277.0, 470.0, 822.0, 1386.0, 2288.0, 3883.0, 6446.0, 10395.0, 16268.0, 25050.0, 37660.0, 55122.0, 79353.0, 110326.0, 146614.0, 189736.0, 234185.0, 276798.0, 314621.0, 340514.0, 353254.0, 347104.0, 327833.0, 291935.0, 251826.0, 205568.0, 162269.0, 122662.0, 90072.0, 64488.0, 43969.0, 29609.0, 19309.0, 12442.0, 7678.0, 4670.0, 2747.0, 1719.0, 1041.0, 601.0, 390.0, 206.0, 116.0, 80.0, 36.0, 26.0, 14.0, 9.0, 4.0, 2.0, 2.0, 2.0], "bins": [-28.046875, -27.18896484375, -26.3310546875, -25.47314453125, -24.615234375, -23.75732421875, -22.8994140625, -22.04150390625, -21.18359375, -20.32568359375, -19.4677734375, -18.60986328125, -17.751953125, -16.89404296875, -16.0361328125, -15.17822265625, -14.3203125, -13.46240234375, -12.6044921875, -11.74658203125, -10.888671875, -10.03076171875, -9.1728515625, -8.31494140625, -7.45703125, -6.59912109375, -5.7412109375, -4.88330078125, -4.025390625, -3.16748046875, -2.3095703125, -1.45166015625, -0.59375, 0.26416015625, 1.1220703125, 1.97998046875, 2.837890625, 3.69580078125, 4.5537109375, 5.41162109375, 6.26953125, 7.12744140625, 7.9853515625, 8.84326171875, 9.701171875, 10.55908203125, 11.4169921875, 12.27490234375, 13.1328125, 13.99072265625, 14.8486328125, 15.70654296875, 16.564453125, 17.42236328125, 18.2802734375, 19.13818359375, 19.99609375, 20.85400390625, 21.7119140625, 22.56982421875, 23.427734375, 24.28564453125, 25.1435546875, 26.00146484375, 26.859375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 16.0, 9.0, 27.0, 28.0, 34.0, 39.0, 46.0, 62.0, 78.0, 82.0, 77.0, 95.0, 102.0, 115.0, 135.0, 152.0, 160.0, 156.0, 179.0, 172.0, 185.0, 167.0, 196.0, 185.0, 137.0, 165.0, 156.0, 155.0, 143.0, 107.0, 107.0, 102.0, 91.0, 76.0, 57.0, 61.0, 24.0, 36.0, 34.0, 24.0, 17.0, 15.0, 13.0, 10.0, 3.0, 3.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-16.640625, -16.10546875, -15.5703125, -15.03515625, -14.5, -13.96484375, -13.4296875, -12.89453125, -12.359375, -11.82421875, -11.2890625, -10.75390625, -10.21875, -9.68359375, -9.1484375, -8.61328125, -8.078125, -7.54296875, -7.0078125, -6.47265625, -5.9375, -5.40234375, -4.8671875, -4.33203125, -3.796875, -3.26171875, -2.7265625, -2.19140625, -1.65625, -1.12109375, -0.5859375, -0.05078125, 0.484375, 1.01953125, 1.5546875, 2.08984375, 2.625, 3.16015625, 3.6953125, 4.23046875, 4.765625, 5.30078125, 5.8359375, 6.37109375, 6.90625, 7.44140625, 7.9765625, 8.51171875, 9.046875, 9.58203125, 10.1171875, 10.65234375, 11.1875, 11.72265625, 12.2578125, 12.79296875, 13.328125, 13.86328125, 14.3984375, 14.93359375, 15.46875, 16.00390625, 16.5390625, 17.07421875, 17.609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 6.0, 12.0, 10.0, 11.0, 18.0, 19.0, 16.0, 26.0, 25.0, 21.0, 30.0, 24.0, 37.0, 30.0, 51.0, 36.0, 49.0, 50.0, 44.0, 48.0, 31.0, 48.0, 37.0, 39.0, 40.0, 33.0, 31.0, 23.0, 26.0, 21.0, 13.0, 14.0, 15.0, 9.0, 11.0, 16.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-45.899723052978516, -44.56438064575195, -43.229034423828125, -41.89369201660156, -40.558349609375, -39.22300338745117, -37.88766098022461, -36.55231475830078, -35.21697235107422, -33.881629943847656, -32.54628372192383, -31.210941314697266, -29.87559700012207, -28.540252685546875, -27.204910278320312, -25.869565963745117, -24.534223556518555, -23.19887924194336, -21.863536834716797, -20.5281925201416, -19.192848205566406, -17.857505798339844, -16.52216148376465, -15.186817169189453, -13.851473808288574, -12.516130447387695, -11.1807861328125, -9.845442771911621, -8.510099411010742, -7.174755096435547, -5.839411735534668, -4.504067420959473, -3.1687240600585938, -1.8333803415298462, -0.49803662300109863, 0.8373069763183594, 2.1726508140563965, 3.5079946517944336, 4.8433380126953125, 6.178682327270508, 7.514025688171387, 8.849369049072266, 10.184713363647461, 11.52005672454834, 12.855400085449219, 14.190744400024414, 15.526087760925293, 16.861431121826172, 18.196775436401367, 19.532119750976562, 20.867462158203125, 22.20280647277832, 23.538150787353516, 24.873493194580078, 26.208837509155273, 27.54418182373047, 28.87952423095703, 30.214868545532227, 31.55021095275879, 32.885555267333984, 34.22089767456055, 35.556243896484375, 36.89158630371094, 38.2269287109375, 39.56227493286133]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 9.0, 12.0, 8.0, 11.0, 14.0, 14.0, 16.0, 23.0, 27.0, 29.0, 34.0, 32.0, 29.0, 36.0, 35.0, 36.0, 48.0, 42.0, 33.0, 32.0, 34.0, 46.0, 45.0, 42.0, 35.0, 25.0, 38.0, 27.0, 28.0, 28.0, 19.0, 18.0, 16.0, 16.0, 9.0, 6.0, 12.0, 12.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.74152755737305, -45.17896270751953, -43.616397857666016, -42.0538330078125, -40.49127197265625, -38.928707122802734, -37.36614227294922, -35.8035774230957, -34.24101257324219, -32.67844772338867, -31.11588478088379, -29.553319931030273, -27.99075698852539, -26.428192138671875, -24.86562728881836, -23.303062438964844, -21.740501403808594, -20.177936553955078, -18.615373611450195, -17.05280876159668, -15.49024486541748, -13.927680969238281, -12.365116119384766, -10.802552223205566, -9.239988327026367, -7.677424430847168, -6.1148600578308105, -4.552295684814453, -2.989731788635254, -1.4271678924560547, 0.13539695739746094, 1.6979608535766602, 3.2605247497558594, 4.823088645935059, 6.385653018951416, 7.948217391967773, 9.510781288146973, 11.073345184326172, 12.635910034179688, 14.198473930358887, 15.761037826538086, 17.3236026763916, 18.886165618896484, 20.44873046875, 22.011295318603516, 23.5738582611084, 25.136423110961914, 26.698986053466797, 28.261550903320312, 29.824115753173828, 31.38667869567871, 32.949241638183594, 34.51180648803711, 36.074371337890625, 37.63693618774414, 39.199501037597656, 40.762062072753906, 42.32462692260742, 43.88719177246094, 45.44975280761719, 47.0123176574707, 48.57488250732422, 50.137447357177734, 51.70001220703125, 53.262577056884766]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 16.0, 14.0, 22.0, 34.0, 39.0, 50.0, 79.0, 121.0, 157.0, 229.0, 336.0, 465.0, 754.0, 1048.0, 1549.0, 2583.0, 4072.0, 6737.0, 11348.0, 19485.0, 34755.0, 62892.0, 114706.0, 192563.0, 227053.0, 159353.0, 90399.0, 49762.0, 27724.0, 15774.0, 9185.0, 5401.0, 3438.0, 2115.0, 1380.0, 974.0, 579.0, 419.0, 283.0, 172.0, 145.0, 103.0, 69.0, 63.0, 29.0, 20.0, 12.0, 9.0, 9.0, 6.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.53125, -7.298095703125, -7.06494140625, -6.831787109375, -6.5986328125, -6.365478515625, -6.13232421875, -5.899169921875, -5.666015625, -5.432861328125, -5.19970703125, -4.966552734375, -4.7333984375, -4.500244140625, -4.26708984375, -4.033935546875, -3.80078125, -3.567626953125, -3.33447265625, -3.101318359375, -2.8681640625, -2.635009765625, -2.40185546875, -2.168701171875, -1.935546875, -1.702392578125, -1.46923828125, -1.236083984375, -1.0029296875, -0.769775390625, -0.53662109375, -0.303466796875, -0.0703125, 0.162841796875, 0.39599609375, 0.629150390625, 0.8623046875, 1.095458984375, 1.32861328125, 1.561767578125, 1.794921875, 2.028076171875, 2.26123046875, 2.494384765625, 2.7275390625, 2.960693359375, 3.19384765625, 3.427001953125, 3.66015625, 3.893310546875, 4.12646484375, 4.359619140625, 4.5927734375, 4.825927734375, 5.05908203125, 5.292236328125, 5.525390625, 5.758544921875, 5.99169921875, 6.224853515625, 6.4580078125, 6.691162109375, 6.92431640625, 7.157470703125, 7.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 12.0, 10.0, 7.0, 15.0, 15.0, 17.0, 23.0, 26.0, 28.0, 38.0, 30.0, 29.0, 37.0, 34.0, 37.0, 45.0, 48.0, 32.0, 29.0, 40.0, 42.0, 43.0, 43.0, 33.0, 29.0, 36.0, 25.0, 28.0, 29.0, 19.0, 17.0, 19.0, 14.0, 7.0, 9.0, 13.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.59375, -45.02734375, -43.4609375, -41.89453125, -40.328125, -38.76171875, -37.1953125, -35.62890625, -34.0625, -32.49609375, -30.9296875, -29.36328125, -27.796875, -26.23046875, -24.6640625, -23.09765625, -21.53125, -19.96484375, -18.3984375, -16.83203125, -15.265625, -13.69921875, -12.1328125, -10.56640625, -9.0, -7.43359375, -5.8671875, -4.30078125, -2.734375, -1.16796875, 0.3984375, 1.96484375, 3.53125, 5.09765625, 6.6640625, 8.23046875, 9.796875, 11.36328125, 12.9296875, 14.49609375, 16.0625, 17.62890625, 19.1953125, 20.76171875, 22.328125, 23.89453125, 25.4609375, 27.02734375, 28.59375, 30.16015625, 31.7265625, 33.29296875, 34.859375, 36.42578125, 37.9921875, 39.55859375, 41.125, 42.69140625, 44.2578125, 45.82421875, 47.390625, 48.95703125, 50.5234375, 52.08984375, 53.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 7.0, 8.0, 9.0, 5.0, 12.0, 13.0, 19.0, 22.0, 27.0, 47.0, 48.0, 73.0, 132.0, 201.0, 286.0, 454.0, 723.0, 1185.0, 1880.0, 3273.0, 5804.0, 11804.0, 24614.0, 57172.0, 147577.0, 353881.0, 262765.0, 98532.0, 39653.0, 17826.0, 8776.0, 4690.0, 2637.0, 1534.0, 974.0, 642.0, 393.0, 293.0, 185.0, 135.0, 74.0, 54.0, 44.0, 25.0, 20.0, 4.0, 6.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.6796875, -9.384521484375, -9.08935546875, -8.794189453125, -8.4990234375, -8.203857421875, -7.90869140625, -7.613525390625, -7.318359375, -7.023193359375, -6.72802734375, -6.432861328125, -6.1376953125, -5.842529296875, -5.54736328125, -5.252197265625, -4.95703125, -4.661865234375, -4.36669921875, -4.071533203125, -3.7763671875, -3.481201171875, -3.18603515625, -2.890869140625, -2.595703125, -2.300537109375, -2.00537109375, -1.710205078125, -1.4150390625, -1.119873046875, -0.82470703125, -0.529541015625, -0.234375, 0.060791015625, 0.35595703125, 0.651123046875, 0.9462890625, 1.241455078125, 1.53662109375, 1.831787109375, 2.126953125, 2.422119140625, 2.71728515625, 3.012451171875, 3.3076171875, 3.602783203125, 3.89794921875, 4.193115234375, 4.48828125, 4.783447265625, 5.07861328125, 5.373779296875, 5.6689453125, 5.964111328125, 6.25927734375, 6.554443359375, 6.849609375, 7.144775390625, 7.43994140625, 7.735107421875, 8.0302734375, 8.325439453125, 8.62060546875, 8.915771484375, 9.2109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 14.0, 7.0, 18.0, 20.0, 19.0, 20.0, 26.0, 18.0, 38.0, 32.0, 38.0, 33.0, 40.0, 35.0, 39.0, 33.0, 38.0, 35.0, 39.0, 30.0, 39.0, 30.0, 38.0, 35.0, 33.0, 18.0, 25.0, 26.0, 22.0, 22.0, 16.0, 12.0, 15.0, 11.0, 14.0, 6.0, 12.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-29.25, -28.31689453125, -27.3837890625, -26.45068359375, -25.517578125, -24.58447265625, -23.6513671875, -22.71826171875, -21.78515625, -20.85205078125, -19.9189453125, -18.98583984375, -18.052734375, -17.11962890625, -16.1865234375, -15.25341796875, -14.3203125, -13.38720703125, -12.4541015625, -11.52099609375, -10.587890625, -9.65478515625, -8.7216796875, -7.78857421875, -6.85546875, -5.92236328125, -4.9892578125, -4.05615234375, -3.123046875, -2.18994140625, -1.2568359375, -0.32373046875, 0.609375, 1.54248046875, 2.4755859375, 3.40869140625, 4.341796875, 5.27490234375, 6.2080078125, 7.14111328125, 8.07421875, 9.00732421875, 9.9404296875, 10.87353515625, 11.806640625, 12.73974609375, 13.6728515625, 14.60595703125, 15.5390625, 16.47216796875, 17.4052734375, 18.33837890625, 19.271484375, 20.20458984375, 21.1376953125, 22.07080078125, 23.00390625, 23.93701171875, 24.8701171875, 25.80322265625, 26.736328125, 27.66943359375, 28.6025390625, 29.53564453125, 30.46875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 8.0, 10.0, 16.0, 20.0, 33.0, 39.0, 51.0, 60.0, 74.0, 111.0, 151.0, 221.0, 314.0, 466.0, 654.0, 1090.0, 1823.0, 3024.0, 6034.0, 12922.0, 35326.0, 135680.0, 537504.0, 228037.0, 50820.0, 17192.0, 7399.0, 3867.0, 2075.0, 1195.0, 765.0, 508.0, 326.0, 203.0, 154.0, 126.0, 63.0, 50.0, 38.0, 26.0, 21.0, 15.0, 16.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.76959228515625, -3.6505126953125, -3.53143310546875, -3.412353515625, -3.29327392578125, -3.1741943359375, -3.05511474609375, -2.93603515625, -2.81695556640625, -2.6978759765625, -2.57879638671875, -2.459716796875, -2.34063720703125, -2.2215576171875, -2.10247802734375, -1.9833984375, -1.86431884765625, -1.7452392578125, -1.62615966796875, -1.507080078125, -1.38800048828125, -1.2689208984375, -1.14984130859375, -1.03076171875, -0.91168212890625, -0.7926025390625, -0.67352294921875, -0.554443359375, -0.43536376953125, -0.3162841796875, -0.19720458984375, -0.078125, 0.04095458984375, 0.1600341796875, 0.27911376953125, 0.398193359375, 0.51727294921875, 0.6363525390625, 0.75543212890625, 0.87451171875, 0.99359130859375, 1.1126708984375, 1.23175048828125, 1.350830078125, 1.46990966796875, 1.5889892578125, 1.70806884765625, 1.8271484375, 1.94622802734375, 2.0653076171875, 2.18438720703125, 2.303466796875, 2.42254638671875, 2.5416259765625, 2.66070556640625, 2.77978515625, 2.89886474609375, 3.0179443359375, 3.13702392578125, 3.256103515625, 3.37518310546875, 3.4942626953125, 3.61334228515625, 3.732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 15.0, 5.0, 13.0, 12.0, 12.0, 33.0, 25.0, 30.0, 47.0, 43.0, 55.0, 56.0, 50.0, 67.0, 79.0, 51.0, 65.0, 53.0, 54.0, 49.0, 33.0, 36.0, 22.0, 19.0, 15.0, 14.0, 13.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001652240753173828, -0.00015932321548461914, -0.00015342235565185547, -0.0001475214958190918, -0.00014162063598632812, -0.00013571977615356445, -0.00012981891632080078, -0.0001239180564880371, -0.00011801719665527344, -0.00011211633682250977, -0.0001062154769897461, -0.00010031461715698242, -9.441375732421875e-05, -8.851289749145508e-05, -8.26120376586914e-05, -7.671117782592773e-05, -7.081031799316406e-05, -6.490945816040039e-05, -5.900859832763672e-05, -5.310773849487305e-05, -4.7206878662109375e-05, -4.13060188293457e-05, -3.540515899658203e-05, -2.950429916381836e-05, -2.3603439331054688e-05, -1.7702579498291016e-05, -1.1801719665527344e-05, -5.900859832763672e-06, 0.0, 5.900859832763672e-06, 1.1801719665527344e-05, 1.7702579498291016e-05, 2.3603439331054688e-05, 2.950429916381836e-05, 3.540515899658203e-05, 4.13060188293457e-05, 4.7206878662109375e-05, 5.310773849487305e-05, 5.900859832763672e-05, 6.490945816040039e-05, 7.081031799316406e-05, 7.671117782592773e-05, 8.26120376586914e-05, 8.851289749145508e-05, 9.441375732421875e-05, 0.00010031461715698242, 0.0001062154769897461, 0.00011211633682250977, 0.00011801719665527344, 0.0001239180564880371, 0.00012981891632080078, 0.00013571977615356445, 0.00014162063598632812, 0.0001475214958190918, 0.00015342235565185547, 0.00015932321548461914, 0.0001652240753173828, 0.00017112493515014648, 0.00017702579498291016, 0.00018292665481567383, 0.0001888275146484375, 0.00019472837448120117, 0.00020062923431396484, 0.00020653009414672852, 0.0002124309539794922]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 10.0, 17.0, 10.0, 30.0, 25.0, 44.0, 72.0, 118.0, 144.0, 244.0, 367.0, 499.0, 788.0, 1193.0, 2071.0, 3217.0, 5146.0, 8619.0, 14540.0, 25389.0, 45702.0, 82066.0, 149266.0, 231491.0, 204863.0, 119189.0, 65567.0, 36696.0, 20572.0, 11842.0, 7053.0, 4272.0, 2581.0, 1736.0, 1053.0, 672.0, 439.0, 291.0, 215.0, 143.0, 86.0, 66.0, 40.0, 34.0, 19.0, 20.0, 13.0, 12.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.796875, -3.68115234375, -3.5654296875, -3.44970703125, -3.333984375, -3.21826171875, -3.1025390625, -2.98681640625, -2.87109375, -2.75537109375, -2.6396484375, -2.52392578125, -2.408203125, -2.29248046875, -2.1767578125, -2.06103515625, -1.9453125, -1.82958984375, -1.7138671875, -1.59814453125, -1.482421875, -1.36669921875, -1.2509765625, -1.13525390625, -1.01953125, -0.90380859375, -0.7880859375, -0.67236328125, -0.556640625, -0.44091796875, -0.3251953125, -0.20947265625, -0.09375, 0.02197265625, 0.1376953125, 0.25341796875, 0.369140625, 0.48486328125, 0.6005859375, 0.71630859375, 0.83203125, 0.94775390625, 1.0634765625, 1.17919921875, 1.294921875, 1.41064453125, 1.5263671875, 1.64208984375, 1.7578125, 1.87353515625, 1.9892578125, 2.10498046875, 2.220703125, 2.33642578125, 2.4521484375, 2.56787109375, 2.68359375, 2.79931640625, 2.9150390625, 3.03076171875, 3.146484375, 3.26220703125, 3.3779296875, 3.49365234375, 3.609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 4.0, 9.0, 6.0, 15.0, 12.0, 26.0, 20.0, 34.0, 43.0, 44.0, 52.0, 66.0, 74.0, 69.0, 46.0, 73.0, 62.0, 52.0, 46.0, 42.0, 39.0, 24.0, 27.0, 20.0, 17.0, 25.0, 10.0, 5.0, 3.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.2109375, -2.1513519287109375, -2.091766357421875, -2.0321807861328125, -1.97259521484375, -1.9130096435546875, -1.853424072265625, -1.7938385009765625, -1.7342529296875, -1.6746673583984375, -1.615081787109375, -1.5554962158203125, -1.49591064453125, -1.4363250732421875, -1.376739501953125, -1.3171539306640625, -1.257568359375, -1.1979827880859375, -1.138397216796875, -1.0788116455078125, -1.01922607421875, -0.9596405029296875, -0.900054931640625, -0.8404693603515625, -0.7808837890625, -0.7212982177734375, -0.661712646484375, -0.6021270751953125, -0.54254150390625, -0.4829559326171875, -0.423370361328125, -0.3637847900390625, -0.30419921875, -0.2446136474609375, -0.185028076171875, -0.1254425048828125, -0.06585693359375, -0.0062713623046875, 0.053314208984375, 0.1128997802734375, 0.1724853515625, 0.2320709228515625, 0.291656494140625, 0.3512420654296875, 0.41082763671875, 0.4704132080078125, 0.529998779296875, 0.5895843505859375, 0.649169921875, 0.7087554931640625, 0.768341064453125, 0.8279266357421875, 0.88751220703125, 0.9470977783203125, 1.006683349609375, 1.0662689208984375, 1.1258544921875, 1.1854400634765625, 1.245025634765625, 1.3046112060546875, 1.36419677734375, 1.4237823486328125, 1.483367919921875, 1.5429534912109375, 1.6025390625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 6.0, 5.0, 12.0, 12.0, 18.0, 12.0, 20.0, 23.0, 21.0, 24.0, 21.0, 24.0, 36.0, 31.0, 39.0, 45.0, 42.0, 52.0, 52.0, 37.0, 39.0, 52.0, 38.0, 32.0, 47.0, 32.0, 23.0, 39.0, 21.0, 26.0, 20.0, 12.0, 14.0, 13.0, 11.0, 13.0, 7.0, 7.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.39806365966797, -44.05989074707031, -42.72171401977539, -41.383541107177734, -40.04536437988281, -38.707191467285156, -37.3690185546875, -36.030845642089844, -34.69266891479492, -33.354496002197266, -32.016319274902344, -30.678146362304688, -29.3399715423584, -28.00179672241211, -26.663623809814453, -25.325448989868164, -23.987274169921875, -22.649099349975586, -21.310924530029297, -19.97275161743164, -18.63457679748535, -17.296401977539062, -15.95822811126709, -14.620054244995117, -13.281879425048828, -11.943704605102539, -10.605530738830566, -9.267356872558594, -7.929182052612305, -6.591007709503174, -5.252833366394043, -3.9146595001220703, -2.5764808654785156, -1.2383065223693848, 0.0998678207397461, 1.438042163848877, 2.776216506958008, 4.114390850067139, 5.4525651931762695, 6.790739059448242, 8.128913879394531, 9.46708869934082, 10.805262565612793, 12.143436431884766, 13.481611251831055, 14.819786071777344, 16.157958984375, 17.49613380432129, 18.834308624267578, 20.172483444213867, 21.510658264160156, 22.848831176757812, 24.1870059967041, 25.52518081665039, 26.863353729248047, 28.201528549194336, 29.539703369140625, 30.877878189086914, 32.2160530090332, 33.55422592163086, 34.89240264892578, 36.23057556152344, 37.568748474121094, 38.90692138671875, 40.24509811401367]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 7.0, 12.0, 8.0, 11.0, 12.0, 14.0, 13.0, 15.0, 22.0, 27.0, 29.0, 39.0, 24.0, 30.0, 40.0, 25.0, 44.0, 39.0, 48.0, 34.0, 28.0, 33.0, 45.0, 41.0, 44.0, 33.0, 32.0, 31.0, 34.0, 22.0, 25.0, 25.0, 18.0, 15.0, 17.0, 14.0, 6.0, 7.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.02246856689453, -44.48436737060547, -42.946266174316406, -41.408164978027344, -39.870059967041016, -38.33195877075195, -36.79385757446289, -35.25575637817383, -33.717655181884766, -32.1795539855957, -30.641450881958008, -29.103349685668945, -27.565248489379883, -26.027145385742188, -24.489044189453125, -22.950942993164062, -21.412839889526367, -19.874738693237305, -18.33663558959961, -16.798534393310547, -15.260433197021484, -13.722331047058105, -12.184228897094727, -10.646127700805664, -9.108025550842285, -7.5699238777160645, -6.031822204589844, -4.493720054626465, -2.955618381500244, -1.4175167083740234, 0.12058544158935547, 1.658686637878418, 3.196788787841797, 4.734890460968018, 6.272992134094238, 7.811094284057617, 9.34919548034668, 10.887297630310059, 12.425399780273438, 13.9635009765625, 15.501603126525879, 17.039705276489258, 18.57780647277832, 20.115909576416016, 21.654010772705078, 23.19211196899414, 24.730213165283203, 26.268314361572266, 27.80641746520996, 29.344518661499023, 30.88262176513672, 32.42072296142578, 33.958824157714844, 35.496925354003906, 37.03502655029297, 38.57312774658203, 40.11123275756836, 41.64933395385742, 43.187435150146484, 44.72554016113281, 46.263641357421875, 47.80174255371094, 49.33984375, 50.87794494628906, 52.416046142578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 8.0, 7.0, 14.0, 20.0, 38.0, 67.0, 107.0, 183.0, 297.0, 481.0, 850.0, 1498.0, 2604.0, 4348.0, 7350.0, 11946.0, 19682.0, 30130.0, 45457.0, 63858.0, 84322.0, 103513.0, 116490.0, 118651.0, 110884.0, 95344.0, 74671.0, 54469.0, 37702.0, 24519.0, 15556.0, 9624.0, 5759.0, 3315.0, 1958.0, 1143.0, 662.0, 432.0, 254.0, 126.0, 86.0, 45.0, 33.0, 26.0, 6.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-30.890625, -29.989013671875, -29.08740234375, -28.185791015625, -27.2841796875, -26.382568359375, -25.48095703125, -24.579345703125, -23.677734375, -22.776123046875, -21.87451171875, -20.972900390625, -20.0712890625, -19.169677734375, -18.26806640625, -17.366455078125, -16.46484375, -15.563232421875, -14.66162109375, -13.760009765625, -12.8583984375, -11.956787109375, -11.05517578125, -10.153564453125, -9.251953125, -8.350341796875, -7.44873046875, -6.547119140625, -5.6455078125, -4.743896484375, -3.84228515625, -2.940673828125, -2.0390625, -1.137451171875, -0.23583984375, 0.665771484375, 1.5673828125, 2.468994140625, 3.37060546875, 4.272216796875, 5.173828125, 6.075439453125, 6.97705078125, 7.878662109375, 8.7802734375, 9.681884765625, 10.58349609375, 11.485107421875, 12.38671875, 13.288330078125, 14.18994140625, 15.091552734375, 15.9931640625, 16.894775390625, 17.79638671875, 18.697998046875, 19.599609375, 20.501220703125, 21.40283203125, 22.304443359375, 23.2060546875, 24.107666015625, 25.00927734375, 25.910888671875, 26.8125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 5.0, 12.0, 8.0, 12.0, 12.0, 15.0, 10.0, 23.0, 17.0, 27.0, 34.0, 34.0, 28.0, 28.0, 39.0, 23.0, 52.0, 34.0, 49.0, 30.0, 32.0, 38.0, 38.0, 41.0, 43.0, 35.0, 32.0, 32.0, 29.0, 27.0, 24.0, 22.0, 20.0, 16.0, 14.0, 14.0, 5.0, 9.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.96875, -43.46044921875, -41.9521484375, -40.44384765625, -38.935546875, -37.42724609375, -35.9189453125, -34.41064453125, -32.90234375, -31.39404296875, -29.8857421875, -28.37744140625, -26.869140625, -25.36083984375, -23.8525390625, -22.34423828125, -20.8359375, -19.32763671875, -17.8193359375, -16.31103515625, -14.802734375, -13.29443359375, -11.7861328125, -10.27783203125, -8.76953125, -7.26123046875, -5.7529296875, -4.24462890625, -2.736328125, -1.22802734375, 0.2802734375, 1.78857421875, 3.296875, 4.80517578125, 6.3134765625, 7.82177734375, 9.330078125, 10.83837890625, 12.3466796875, 13.85498046875, 15.36328125, 16.87158203125, 18.3798828125, 19.88818359375, 21.396484375, 22.90478515625, 24.4130859375, 25.92138671875, 27.4296875, 28.93798828125, 30.4462890625, 31.95458984375, 33.462890625, 34.97119140625, 36.4794921875, 37.98779296875, 39.49609375, 41.00439453125, 42.5126953125, 44.02099609375, 45.529296875, 47.03759765625, 48.5458984375, 50.05419921875, 51.5625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 16.0, 32.0, 34.0, 56.0, 99.0, 168.0, 240.0, 366.0, 560.0, 906.0, 1453.0, 2189.0, 3522.0, 5295.0, 7928.0, 12035.0, 17584.0, 26077.0, 36100.0, 48571.0, 63023.0, 77489.0, 89573.0, 98178.0, 100267.0, 95768.0, 85661.0, 72517.0, 58059.0, 43884.0, 32396.0, 22737.0, 15696.0, 10531.0, 6805.0, 4555.0, 2858.0, 1899.0, 1225.0, 822.0, 494.0, 337.0, 203.0, 120.0, 96.0, 55.0, 28.0, 16.0, 15.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.71875, -24.947021484375, -24.17529296875, -23.403564453125, -22.6318359375, -21.860107421875, -21.08837890625, -20.316650390625, -19.544921875, -18.773193359375, -18.00146484375, -17.229736328125, -16.4580078125, -15.686279296875, -14.91455078125, -14.142822265625, -13.37109375, -12.599365234375, -11.82763671875, -11.055908203125, -10.2841796875, -9.512451171875, -8.74072265625, -7.968994140625, -7.197265625, -6.425537109375, -5.65380859375, -4.882080078125, -4.1103515625, -3.338623046875, -2.56689453125, -1.795166015625, -1.0234375, -0.251708984375, 0.52001953125, 1.291748046875, 2.0634765625, 2.835205078125, 3.60693359375, 4.378662109375, 5.150390625, 5.922119140625, 6.69384765625, 7.465576171875, 8.2373046875, 9.009033203125, 9.78076171875, 10.552490234375, 11.32421875, 12.095947265625, 12.86767578125, 13.639404296875, 14.4111328125, 15.182861328125, 15.95458984375, 16.726318359375, 17.498046875, 18.269775390625, 19.04150390625, 19.813232421875, 20.5849609375, 21.356689453125, 22.12841796875, 22.900146484375, 23.671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 6.0, 11.0, 18.0, 15.0, 12.0, 20.0, 15.0, 25.0, 22.0, 28.0, 33.0, 30.0, 30.0, 34.0, 29.0, 26.0, 35.0, 34.0, 34.0, 38.0, 31.0, 40.0, 34.0, 34.0, 35.0, 31.0, 32.0, 24.0, 35.0, 9.0, 29.0, 25.0, 21.0, 15.0, 21.0, 13.0, 12.0, 6.0, 5.0, 10.0, 7.0, 0.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-29.65625, -28.7841796875, -27.912109375, -27.0400390625, -26.16796875, -25.2958984375, -24.423828125, -23.5517578125, -22.6796875, -21.8076171875, -20.935546875, -20.0634765625, -19.19140625, -18.3193359375, -17.447265625, -16.5751953125, -15.703125, -14.8310546875, -13.958984375, -13.0869140625, -12.21484375, -11.3427734375, -10.470703125, -9.5986328125, -8.7265625, -7.8544921875, -6.982421875, -6.1103515625, -5.23828125, -4.3662109375, -3.494140625, -2.6220703125, -1.75, -0.8779296875, -0.005859375, 0.8662109375, 1.73828125, 2.6103515625, 3.482421875, 4.3544921875, 5.2265625, 6.0986328125, 6.970703125, 7.8427734375, 8.71484375, 9.5869140625, 10.458984375, 11.3310546875, 12.203125, 13.0751953125, 13.947265625, 14.8193359375, 15.69140625, 16.5634765625, 17.435546875, 18.3076171875, 19.1796875, 20.0517578125, 20.923828125, 21.7958984375, 22.66796875, 23.5400390625, 24.412109375, 25.2841796875, 26.15625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 3.0, 12.0, 15.0, 20.0, 39.0, 49.0, 65.0, 123.0, 165.0, 285.0, 389.0, 667.0, 1091.0, 1683.0, 2846.0, 4627.0, 7502.0, 12472.0, 20687.0, 31666.0, 47701.0, 67428.0, 88713.0, 108974.0, 120962.0, 121694.0, 110646.0, 91447.0, 69528.0, 49592.0, 32939.0, 21003.0, 12882.0, 8039.0, 4898.0, 2856.0, 1836.0, 1096.0, 688.0, 435.0, 299.0, 156.0, 127.0, 74.0, 42.0, 37.0, 19.0, 15.0, 15.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.921875, -10.570068359375, -10.21826171875, -9.866455078125, -9.5146484375, -9.162841796875, -8.81103515625, -8.459228515625, -8.107421875, -7.755615234375, -7.40380859375, -7.052001953125, -6.7001953125, -6.348388671875, -5.99658203125, -5.644775390625, -5.29296875, -4.941162109375, -4.58935546875, -4.237548828125, -3.8857421875, -3.533935546875, -3.18212890625, -2.830322265625, -2.478515625, -2.126708984375, -1.77490234375, -1.423095703125, -1.0712890625, -0.719482421875, -0.36767578125, -0.015869140625, 0.3359375, 0.687744140625, 1.03955078125, 1.391357421875, 1.7431640625, 2.094970703125, 2.44677734375, 2.798583984375, 3.150390625, 3.502197265625, 3.85400390625, 4.205810546875, 4.5576171875, 4.909423828125, 5.26123046875, 5.613037109375, 5.96484375, 6.316650390625, 6.66845703125, 7.020263671875, 7.3720703125, 7.723876953125, 8.07568359375, 8.427490234375, 8.779296875, 9.131103515625, 9.48291015625, 9.834716796875, 10.1865234375, 10.538330078125, 10.89013671875, 11.241943359375, 11.59375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 2.0, 10.0, 10.0, 8.0, 10.0, 17.0, 21.0, 20.0, 28.0, 25.0, 40.0, 43.0, 41.0, 40.0, 53.0, 31.0, 44.0, 44.0, 44.0, 43.0, 49.0, 46.0, 48.0, 45.0, 39.0, 30.0, 23.0, 20.0, 22.0, 17.0, 16.0, 12.0, 11.0, 4.0, 9.0, 5.0, 7.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010890960693359375, -0.00105363130569458, -0.0010181665420532227, -0.0009827017784118652, -0.0009472370147705078, -0.0009117722511291504, -0.000876307487487793, -0.0008408427238464355, -0.0008053779602050781, -0.0007699131965637207, -0.0007344484329223633, -0.0006989836692810059, -0.0006635189056396484, -0.000628054141998291, -0.0005925893783569336, -0.0005571246147155762, -0.0005216598510742188, -0.00048619508743286133, -0.0004507303237915039, -0.0004152655601501465, -0.00037980079650878906, -0.00034433603286743164, -0.0003088712692260742, -0.0002734065055847168, -0.00023794174194335938, -0.00020247697830200195, -0.00016701221466064453, -0.0001315474510192871, -9.608268737792969e-05, -6.0617923736572266e-05, -2.5153160095214844e-05, 1.0311603546142578e-05, 4.57763671875e-05, 8.124113082885742e-05, 0.00011670589447021484, 0.00015217065811157227, 0.0001876354217529297, 0.0002231001853942871, 0.00025856494903564453, 0.00029402971267700195, 0.0003294944763183594, 0.0003649592399597168, 0.0004004240036010742, 0.00043588876724243164, 0.00047135353088378906, 0.0005068182945251465, 0.0005422830581665039, 0.0005777478218078613, 0.0006132125854492188, 0.0006486773490905762, 0.0006841421127319336, 0.000719606876373291, 0.0007550716400146484, 0.0007905364036560059, 0.0008260011672973633, 0.0008614659309387207, 0.0008969306945800781, 0.0009323954582214355, 0.000967860221862793, 0.0010033249855041504, 0.0010387897491455078, 0.0010742545127868652, 0.0011097192764282227, 0.00114518404006958, 0.0011806488037109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 11.0, 20.0, 30.0, 56.0, 58.0, 127.0, 193.0, 342.0, 584.0, 945.0, 1674.0, 2873.0, 5022.0, 8670.0, 15290.0, 25387.0, 41914.0, 65804.0, 94688.0, 122643.0, 139828.0, 140123.0, 122129.0, 93533.0, 64805.0, 41472.0, 25198.0, 14865.0, 8636.0, 4887.0, 2868.0, 1552.0, 877.0, 584.0, 329.0, 201.0, 118.0, 71.0, 50.0, 29.0, 21.0, 17.0, 6.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0546875, -14.5982666015625, -14.141845703125, -13.6854248046875, -13.22900390625, -12.7725830078125, -12.316162109375, -11.8597412109375, -11.4033203125, -10.9468994140625, -10.490478515625, -10.0340576171875, -9.57763671875, -9.1212158203125, -8.664794921875, -8.2083740234375, -7.751953125, -7.2955322265625, -6.839111328125, -6.3826904296875, -5.92626953125, -5.4698486328125, -5.013427734375, -4.5570068359375, -4.1005859375, -3.6441650390625, -3.187744140625, -2.7313232421875, -2.27490234375, -1.8184814453125, -1.362060546875, -0.9056396484375, -0.44921875, 0.0072021484375, 0.463623046875, 0.9200439453125, 1.37646484375, 1.8328857421875, 2.289306640625, 2.7457275390625, 3.2021484375, 3.6585693359375, 4.114990234375, 4.5714111328125, 5.02783203125, 5.4842529296875, 5.940673828125, 6.3970947265625, 6.853515625, 7.3099365234375, 7.766357421875, 8.2227783203125, 8.67919921875, 9.1356201171875, 9.592041015625, 10.0484619140625, 10.5048828125, 10.9613037109375, 11.417724609375, 11.8741455078125, 12.33056640625, 12.7869873046875, 13.243408203125, 13.6998291015625, 14.15625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 3.0, 4.0, 9.0, 12.0, 25.0, 19.0, 22.0, 42.0, 47.0, 45.0, 46.0, 59.0, 46.0, 84.0, 61.0, 67.0, 75.0, 59.0, 56.0, 50.0, 35.0, 23.0, 23.0, 16.0, 10.0, 10.0, 7.0, 5.0, 7.0, 2.0, 9.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9140625, -8.6209716796875, -8.327880859375, -8.0347900390625, -7.74169921875, -7.4486083984375, -7.155517578125, -6.8624267578125, -6.5693359375, -6.2762451171875, -5.983154296875, -5.6900634765625, -5.39697265625, -5.1038818359375, -4.810791015625, -4.5177001953125, -4.224609375, -3.9315185546875, -3.638427734375, -3.3453369140625, -3.05224609375, -2.7591552734375, -2.466064453125, -2.1729736328125, -1.8798828125, -1.5867919921875, -1.293701171875, -1.0006103515625, -0.70751953125, -0.4144287109375, -0.121337890625, 0.1717529296875, 0.46484375, 0.7579345703125, 1.051025390625, 1.3441162109375, 1.63720703125, 1.9302978515625, 2.223388671875, 2.5164794921875, 2.8095703125, 3.1026611328125, 3.395751953125, 3.6888427734375, 3.98193359375, 4.2750244140625, 4.568115234375, 4.8612060546875, 5.154296875, 5.4473876953125, 5.740478515625, 6.0335693359375, 6.32666015625, 6.6197509765625, 6.912841796875, 7.2059326171875, 7.4990234375, 7.7921142578125, 8.085205078125, 8.3782958984375, 8.67138671875, 8.9644775390625, 9.257568359375, 9.5506591796875, 9.84375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 7.0, 4.0, 4.0, 12.0, 14.0, 14.0, 20.0, 27.0, 24.0, 29.0, 30.0, 39.0, 31.0, 36.0, 32.0, 43.0, 48.0, 51.0, 45.0, 46.0, 46.0, 46.0, 37.0, 37.0, 38.0, 30.0, 30.0, 34.0, 26.0, 22.0, 13.0, 19.0, 13.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.24540710449219, -43.857357025146484, -42.469303131103516, -41.08125305175781, -39.69320297241211, -38.305152893066406, -36.91709899902344, -35.529048919677734, -34.14099884033203, -32.75294876098633, -31.364896774291992, -29.976844787597656, -28.588794708251953, -27.200742721557617, -25.81269073486328, -24.424640655517578, -23.03658676147461, -21.648534774780273, -20.26048469543457, -18.872432708740234, -17.48438262939453, -16.096330642700195, -14.70827865600586, -13.32022762298584, -11.93217658996582, -10.5441255569458, -9.156074523925781, -7.768022537231445, -6.379971504211426, -4.991920471191406, -3.6038684844970703, -2.215817451477051, -0.8277702331542969, 0.5602810382843018, 1.9483323097229004, 3.336383819580078, 4.724434852600098, 6.112485885620117, 7.500537872314453, 8.888588905334473, 10.276639938354492, 11.664690971374512, 13.052742004394531, 14.440793991088867, 15.828845024108887, 17.216896057128906, 18.604948043823242, 19.993000030517578, 21.38105010986328, 22.769102096557617, 24.15715217590332, 25.545204162597656, 26.93325424194336, 28.321306228637695, 29.70935821533203, 31.097408294677734, 32.48545837402344, 33.87350845336914, 35.26156234741211, 36.64961242675781, 38.037662506103516, 39.42571258544922, 40.81376647949219, 42.20181655883789, 43.58987045288086]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 10.0, 5.0, 7.0, 11.0, 8.0, 14.0, 15.0, 13.0, 18.0, 33.0, 29.0, 24.0, 36.0, 39.0, 42.0, 40.0, 28.0, 58.0, 42.0, 41.0, 44.0, 42.0, 42.0, 38.0, 30.0, 39.0, 40.0, 25.0, 31.0, 30.0, 19.0, 22.0, 17.0, 11.0, 23.0, 6.0, 9.0, 9.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-60.93818664550781, -59.21961975097656, -57.50105285644531, -55.78248977661133, -54.06392288208008, -52.34535598754883, -50.62678909301758, -48.908226013183594, -47.189659118652344, -45.471092224121094, -43.752525329589844, -42.03396224975586, -40.31539535522461, -38.59682846069336, -36.87826156616211, -35.159698486328125, -33.441131591796875, -31.722564697265625, -30.003999710083008, -28.285432815551758, -26.56686782836914, -24.84830093383789, -23.12973403930664, -21.411169052124023, -19.69260025024414, -17.97403335571289, -16.255468368530273, -14.536901473999023, -12.818336486816406, -11.099769592285156, -9.381203651428223, -7.662637710571289, -5.944072723388672, -4.225506782531738, -2.5069406032562256, -0.7883744239807129, 0.9301915168762207, 2.6487579345703125, 4.367323875427246, 6.08588981628418, 7.804455757141113, 9.523021697998047, 11.24158763885498, 12.960153579711914, 14.678720474243164, 16.39728546142578, 18.11585235595703, 19.83441925048828, 21.5529842376709, 23.27155113220215, 24.990116119384766, 26.708683013916016, 28.427248001098633, 30.145814895629883, 31.8643798828125, 33.58294677734375, 35.301513671875, 37.02008056640625, 38.7386474609375, 40.457210540771484, 42.175777435302734, 43.894344329833984, 45.612911224365234, 47.33147430419922, 49.05004119873047]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 19.0, 18.0, 39.0, 66.0, 89.0, 186.0, 278.0, 460.0, 782.0, 1275.0, 2058.0, 3450.0, 5184.0, 8225.0, 12747.0, 19678.0, 29596.0, 43896.0, 63140.0, 87264.0, 120739.0, 159185.0, 203988.0, 249419.0, 293515.0, 330145.0, 351675.0, 357998.0, 345966.0, 317365.0, 276975.0, 232675.0, 185472.0, 144060.0, 107223.0, 76837.0, 54556.0, 37465.0, 25151.0, 16494.0, 10791.0, 6936.0, 4280.0, 2757.0, 1640.0, 1016.0, 610.0, 366.0, 228.0, 120.0, 89.0, 39.0, 27.0, 12.0, 16.0, 1.0, 1.0, 2.0], "bins": [-28.171875, -27.325927734375, -26.47998046875, -25.634033203125, -24.7880859375, -23.942138671875, -23.09619140625, -22.250244140625, -21.404296875, -20.558349609375, -19.71240234375, -18.866455078125, -18.0205078125, -17.174560546875, -16.32861328125, -15.482666015625, -14.63671875, -13.790771484375, -12.94482421875, -12.098876953125, -11.2529296875, -10.406982421875, -9.56103515625, -8.715087890625, -7.869140625, -7.023193359375, -6.17724609375, -5.331298828125, -4.4853515625, -3.639404296875, -2.79345703125, -1.947509765625, -1.1015625, -0.255615234375, 0.59033203125, 1.436279296875, 2.2822265625, 3.128173828125, 3.97412109375, 4.820068359375, 5.666015625, 6.511962890625, 7.35791015625, 8.203857421875, 9.0498046875, 9.895751953125, 10.74169921875, 11.587646484375, 12.43359375, 13.279541015625, 14.12548828125, 14.971435546875, 15.8173828125, 16.663330078125, 17.50927734375, 18.355224609375, 19.201171875, 20.047119140625, 20.89306640625, 21.739013671875, 22.5849609375, 23.430908203125, 24.27685546875, 25.122802734375, 25.96875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 5.0, 10.0, 8.0, 9.0, 17.0, 15.0, 14.0, 23.0, 35.0, 25.0, 28.0, 38.0, 36.0, 41.0, 36.0, 37.0, 50.0, 52.0, 33.0, 42.0, 47.0, 44.0, 30.0, 37.0, 36.0, 34.0, 29.0, 29.0, 25.0, 27.0, 16.0, 18.0, 17.0, 13.0, 6.0, 8.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-51.71875, -50.25390625, -48.7890625, -47.32421875, -45.859375, -44.39453125, -42.9296875, -41.46484375, -40.0, -38.53515625, -37.0703125, -35.60546875, -34.140625, -32.67578125, -31.2109375, -29.74609375, -28.28125, -26.81640625, -25.3515625, -23.88671875, -22.421875, -20.95703125, -19.4921875, -18.02734375, -16.5625, -15.09765625, -13.6328125, -12.16796875, -10.703125, -9.23828125, -7.7734375, -6.30859375, -4.84375, -3.37890625, -1.9140625, -0.44921875, 1.015625, 2.48046875, 3.9453125, 5.41015625, 6.875, 8.33984375, 9.8046875, 11.26953125, 12.734375, 14.19921875, 15.6640625, 17.12890625, 18.59375, 20.05859375, 21.5234375, 22.98828125, 24.453125, 25.91796875, 27.3828125, 28.84765625, 30.3125, 31.77734375, 33.2421875, 34.70703125, 36.171875, 37.63671875, 39.1015625, 40.56640625, 42.03125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 8.0, 6.0, 11.0, 26.0, 42.0, 76.0, 145.0, 263.0, 504.0, 854.0, 1313.0, 2419.0, 3873.0, 6228.0, 10296.0, 15930.0, 24471.0, 36347.0, 53564.0, 75852.0, 103607.0, 138143.0, 177342.0, 218928.0, 259414.0, 296572.0, 323688.0, 338474.0, 338434.0, 325385.0, 297148.0, 261885.0, 220956.0, 179217.0, 140065.0, 105874.0, 76999.0, 54628.0, 37312.0, 24898.0, 16295.0, 10474.0, 6585.0, 3905.0, 2420.0, 1475.0, 804.0, 497.0, 270.0, 172.0, 81.0, 57.0, 29.0, 20.0, 10.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-27.78125, -26.913818359375, -26.04638671875, -25.178955078125, -24.3115234375, -23.444091796875, -22.57666015625, -21.709228515625, -20.841796875, -19.974365234375, -19.10693359375, -18.239501953125, -17.3720703125, -16.504638671875, -15.63720703125, -14.769775390625, -13.90234375, -13.034912109375, -12.16748046875, -11.300048828125, -10.4326171875, -9.565185546875, -8.69775390625, -7.830322265625, -6.962890625, -6.095458984375, -5.22802734375, -4.360595703125, -3.4931640625, -2.625732421875, -1.75830078125, -0.890869140625, -0.0234375, 0.843994140625, 1.71142578125, 2.578857421875, 3.4462890625, 4.313720703125, 5.18115234375, 6.048583984375, 6.916015625, 7.783447265625, 8.65087890625, 9.518310546875, 10.3857421875, 11.253173828125, 12.12060546875, 12.988037109375, 13.85546875, 14.722900390625, 15.59033203125, 16.457763671875, 17.3251953125, 18.192626953125, 19.06005859375, 19.927490234375, 20.794921875, 21.662353515625, 22.52978515625, 23.397216796875, 24.2646484375, 25.132080078125, 25.99951171875, 26.866943359375, 27.734375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 9.0, 14.0, 18.0, 15.0, 39.0, 25.0, 36.0, 46.0, 66.0, 61.0, 66.0, 94.0, 99.0, 105.0, 119.0, 126.0, 188.0, 189.0, 173.0, 157.0, 214.0, 199.0, 207.0, 174.0, 213.0, 152.0, 166.0, 145.0, 142.0, 112.0, 111.0, 104.0, 93.0, 77.0, 59.0, 47.0, 35.0, 35.0, 27.0, 24.0, 22.0, 12.0, 15.0, 10.0, 13.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-18.28125, -17.704345703125, -17.12744140625, -16.550537109375, -15.9736328125, -15.396728515625, -14.81982421875, -14.242919921875, -13.666015625, -13.089111328125, -12.51220703125, -11.935302734375, -11.3583984375, -10.781494140625, -10.20458984375, -9.627685546875, -9.05078125, -8.473876953125, -7.89697265625, -7.320068359375, -6.7431640625, -6.166259765625, -5.58935546875, -5.012451171875, -4.435546875, -3.858642578125, -3.28173828125, -2.704833984375, -2.1279296875, -1.551025390625, -0.97412109375, -0.397216796875, 0.1796875, 0.756591796875, 1.33349609375, 1.910400390625, 2.4873046875, 3.064208984375, 3.64111328125, 4.218017578125, 4.794921875, 5.371826171875, 5.94873046875, 6.525634765625, 7.1025390625, 7.679443359375, 8.25634765625, 8.833251953125, 9.41015625, 9.987060546875, 10.56396484375, 11.140869140625, 11.7177734375, 12.294677734375, 12.87158203125, 13.448486328125, 14.025390625, 14.602294921875, 15.17919921875, 15.756103515625, 16.3330078125, 16.909912109375, 17.48681640625, 18.063720703125, 18.640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 10.0, 12.0, 17.0, 15.0, 25.0, 25.0, 28.0, 34.0, 33.0, 44.0, 52.0, 47.0, 51.0, 52.0, 53.0, 41.0, 60.0, 56.0, 41.0, 36.0, 40.0, 35.0, 51.0, 26.0, 22.0, 15.0, 16.0, 11.0, 8.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.50125503540039, -50.83865737915039, -49.17605972290039, -47.51346206665039, -45.850868225097656, -44.188270568847656, -42.525672912597656, -40.863075256347656, -39.200477600097656, -37.537879943847656, -35.875282287597656, -34.212684631347656, -32.550086975097656, -30.88749122619629, -29.224895477294922, -27.562297821044922, -25.899700164794922, -24.237102508544922, -22.574504852294922, -20.911909103393555, -19.249311447143555, -17.586713790893555, -15.924117088317871, -14.261520385742188, -12.598922729492188, -10.936325073242188, -9.273728370666504, -7.611131191253662, -5.94853401184082, -4.28593635559082, -2.6233396530151367, -0.9607429504394531, 0.7018585205078125, 2.3644556999206543, 4.027052879333496, 5.689650058746338, 7.35224723815918, 9.01484489440918, 10.677441596984863, 12.340038299560547, 14.002635955810547, 15.665233612060547, 17.327831268310547, 18.990427017211914, 20.653024673461914, 22.315622329711914, 23.97821807861328, 25.64081573486328, 27.30341339111328, 28.96601104736328, 30.62860870361328, 32.29120635986328, 33.95380401611328, 35.61640167236328, 37.278995513916016, 38.941593170166016, 40.604190826416016, 42.266788482666016, 43.929386138916016, 45.591983795166016, 47.25457763671875, 48.91717529296875, 50.57977294921875, 52.24237060546875, 53.90496826171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 9.0, 12.0, 10.0, 11.0, 12.0, 10.0, 20.0, 17.0, 21.0, 11.0, 22.0, 33.0, 29.0, 32.0, 28.0, 29.0, 36.0, 32.0, 43.0, 40.0, 27.0, 43.0, 36.0, 35.0, 42.0, 30.0, 30.0, 36.0, 26.0, 31.0, 32.0, 28.0, 19.0, 20.0, 20.0, 13.0, 19.0, 5.0, 10.0, 4.0, 10.0, 8.0, 5.0, 1.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-53.713653564453125, -52.21208953857422, -50.71052551269531, -49.208961486816406, -47.707393646240234, -46.20582962036133, -44.70426559448242, -43.202701568603516, -41.701133728027344, -40.19956970214844, -38.69800567626953, -37.196441650390625, -35.69487380981445, -34.19330978393555, -32.69174575805664, -31.190181732177734, -29.688617706298828, -28.187053680419922, -26.685487747192383, -25.183923721313477, -23.682357788085938, -22.18079376220703, -20.679229736328125, -19.17766571044922, -17.67609977722168, -16.174535751342773, -14.672969818115234, -13.171405792236328, -11.669840812683105, -10.168275833129883, -8.666711807250977, -7.165146827697754, -5.663585662841797, -4.162020683288574, -2.6604561805725098, -1.1588916778564453, 0.34267330169677734, 1.84423828125, 3.3458023071289062, 4.847367286682129, 6.348932266235352, 7.850497245788574, 9.352062225341797, 10.853626251220703, 12.355191230773926, 13.856756210327148, 15.358320236206055, 16.859886169433594, 18.3614501953125, 19.863014221191406, 21.364580154418945, 22.86614418029785, 24.36771011352539, 25.869274139404297, 27.370838165283203, 28.87240219116211, 30.37396812438965, 31.875532150268555, 33.377098083496094, 34.878662109375, 36.380226135253906, 37.88179016113281, 39.38335418701172, 40.88492202758789, 42.3864860534668]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 24.0, 37.0, 59.0, 95.0, 144.0, 216.0, 372.0, 548.0, 880.0, 1456.0, 2414.0, 3883.0, 6398.0, 10389.0, 17470.0, 30577.0, 54530.0, 96561.0, 163322.0, 222683.0, 180844.0, 109113.0, 61824.0, 34970.0, 19942.0, 11705.0, 7004.0, 4148.0, 2592.0, 1566.0, 1040.0, 617.0, 399.0, 235.0, 144.0, 117.0, 61.0, 54.0, 31.0, 21.0, 18.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8984375, -6.6868896484375, -6.475341796875, -6.2637939453125, -6.05224609375, -5.8406982421875, -5.629150390625, -5.4176025390625, -5.2060546875, -4.9945068359375, -4.782958984375, -4.5714111328125, -4.35986328125, -4.1483154296875, -3.936767578125, -3.7252197265625, -3.513671875, -3.3021240234375, -3.090576171875, -2.8790283203125, -2.66748046875, -2.4559326171875, -2.244384765625, -2.0328369140625, -1.8212890625, -1.6097412109375, -1.398193359375, -1.1866455078125, -0.97509765625, -0.7635498046875, -0.552001953125, -0.3404541015625, -0.12890625, 0.0826416015625, 0.294189453125, 0.5057373046875, 0.71728515625, 0.9288330078125, 1.140380859375, 1.3519287109375, 1.5634765625, 1.7750244140625, 1.986572265625, 2.1981201171875, 2.40966796875, 2.6212158203125, 2.832763671875, 3.0443115234375, 3.255859375, 3.4674072265625, 3.678955078125, 3.8905029296875, 4.10205078125, 4.3135986328125, 4.525146484375, 4.7366943359375, 4.9482421875, 5.1597900390625, 5.371337890625, 5.5828857421875, 5.79443359375, 6.0059814453125, 6.217529296875, 6.4290771484375, 6.640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 9.0, 12.0, 10.0, 12.0, 11.0, 10.0, 19.0, 17.0, 22.0, 11.0, 23.0, 31.0, 30.0, 33.0, 27.0, 30.0, 36.0, 32.0, 43.0, 39.0, 27.0, 44.0, 35.0, 36.0, 41.0, 30.0, 32.0, 35.0, 26.0, 30.0, 33.0, 28.0, 18.0, 21.0, 19.0, 14.0, 17.0, 7.0, 9.0, 5.0, 9.0, 9.0, 4.0, 1.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-53.875, -52.37255859375, -50.8701171875, -49.36767578125, -47.865234375, -46.36279296875, -44.8603515625, -43.35791015625, -41.85546875, -40.35302734375, -38.8505859375, -37.34814453125, -35.845703125, -34.34326171875, -32.8408203125, -31.33837890625, -29.8359375, -28.33349609375, -26.8310546875, -25.32861328125, -23.826171875, -22.32373046875, -20.8212890625, -19.31884765625, -17.81640625, -16.31396484375, -14.8115234375, -13.30908203125, -11.806640625, -10.30419921875, -8.8017578125, -7.29931640625, -5.796875, -4.29443359375, -2.7919921875, -1.28955078125, 0.212890625, 1.71533203125, 3.2177734375, 4.72021484375, 6.22265625, 7.72509765625, 9.2275390625, 10.72998046875, 12.232421875, 13.73486328125, 15.2373046875, 16.73974609375, 18.2421875, 19.74462890625, 21.2470703125, 22.74951171875, 24.251953125, 25.75439453125, 27.2568359375, 28.75927734375, 30.26171875, 31.76416015625, 33.2666015625, 34.76904296875, 36.271484375, 37.77392578125, 39.2763671875, 40.77880859375, 42.28125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 14.0, 18.0, 25.0, 27.0, 61.0, 59.0, 88.0, 137.0, 193.0, 267.0, 413.0, 577.0, 873.0, 1364.0, 2078.0, 3483.0, 5892.0, 10825.0, 20793.0, 43058.0, 95022.0, 220771.0, 328801.0, 168497.0, 72965.0, 33628.0, 16443.0, 8837.0, 4950.0, 2921.0, 1828.0, 1179.0, 737.0, 568.0, 349.0, 241.0, 168.0, 117.0, 74.0, 77.0, 47.0, 23.0, 24.0, 16.0, 9.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.83984375, -7.58966064453125, -7.3394775390625, -7.08929443359375, -6.839111328125, -6.58892822265625, -6.3387451171875, -6.08856201171875, -5.83837890625, -5.58819580078125, -5.3380126953125, -5.08782958984375, -4.837646484375, -4.58746337890625, -4.3372802734375, -4.08709716796875, -3.8369140625, -3.58673095703125, -3.3365478515625, -3.08636474609375, -2.836181640625, -2.58599853515625, -2.3358154296875, -2.08563232421875, -1.83544921875, -1.58526611328125, -1.3350830078125, -1.08489990234375, -0.834716796875, -0.58453369140625, -0.3343505859375, -0.08416748046875, 0.166015625, 0.41619873046875, 0.6663818359375, 0.91656494140625, 1.166748046875, 1.41693115234375, 1.6671142578125, 1.91729736328125, 2.16748046875, 2.41766357421875, 2.6678466796875, 2.91802978515625, 3.168212890625, 3.41839599609375, 3.6685791015625, 3.91876220703125, 4.1689453125, 4.41912841796875, 4.6693115234375, 4.91949462890625, 5.169677734375, 5.41986083984375, 5.6700439453125, 5.92022705078125, 6.17041015625, 6.42059326171875, 6.6707763671875, 6.92095947265625, 7.171142578125, 7.42132568359375, 7.6715087890625, 7.92169189453125, 8.171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 12.0, 7.0, 8.0, 17.0, 19.0, 16.0, 16.0, 18.0, 30.0, 31.0, 27.0, 33.0, 40.0, 37.0, 33.0, 39.0, 36.0, 38.0, 48.0, 41.0, 48.0, 29.0, 41.0, 42.0, 32.0, 36.0, 31.0, 32.0, 21.0, 19.0, 15.0, 13.0, 18.0, 22.0, 7.0, 11.0, 5.0, 9.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-35.46875, -34.457275390625, -33.44580078125, -32.434326171875, -31.4228515625, -30.411376953125, -29.39990234375, -28.388427734375, -27.376953125, -26.365478515625, -25.35400390625, -24.342529296875, -23.3310546875, -22.319580078125, -21.30810546875, -20.296630859375, -19.28515625, -18.273681640625, -17.26220703125, -16.250732421875, -15.2392578125, -14.227783203125, -13.21630859375, -12.204833984375, -11.193359375, -10.181884765625, -9.17041015625, -8.158935546875, -7.1474609375, -6.135986328125, -5.12451171875, -4.113037109375, -3.1015625, -2.090087890625, -1.07861328125, -0.067138671875, 0.9443359375, 1.955810546875, 2.96728515625, 3.978759765625, 4.990234375, 6.001708984375, 7.01318359375, 8.024658203125, 9.0361328125, 10.047607421875, 11.05908203125, 12.070556640625, 13.08203125, 14.093505859375, 15.10498046875, 16.116455078125, 17.1279296875, 18.139404296875, 19.15087890625, 20.162353515625, 21.173828125, 22.185302734375, 23.19677734375, 24.208251953125, 25.2197265625, 26.231201171875, 27.24267578125, 28.254150390625, 29.265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 8.0, 10.0, 6.0, 18.0, 23.0, 29.0, 46.0, 69.0, 88.0, 150.0, 256.0, 476.0, 901.0, 1995.0, 5474.0, 20491.0, 184290.0, 748059.0, 67623.0, 11789.0, 3581.0, 1516.0, 714.0, 322.0, 197.0, 123.0, 82.0, 58.0, 43.0, 22.0, 24.0, 13.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.1640625, -6.948974609375, -6.73388671875, -6.518798828125, -6.3037109375, -6.088623046875, -5.87353515625, -5.658447265625, -5.443359375, -5.228271484375, -5.01318359375, -4.798095703125, -4.5830078125, -4.367919921875, -4.15283203125, -3.937744140625, -3.72265625, -3.507568359375, -3.29248046875, -3.077392578125, -2.8623046875, -2.647216796875, -2.43212890625, -2.217041015625, -2.001953125, -1.786865234375, -1.57177734375, -1.356689453125, -1.1416015625, -0.926513671875, -0.71142578125, -0.496337890625, -0.28125, -0.066162109375, 0.14892578125, 0.364013671875, 0.5791015625, 0.794189453125, 1.00927734375, 1.224365234375, 1.439453125, 1.654541015625, 1.86962890625, 2.084716796875, 2.2998046875, 2.514892578125, 2.72998046875, 2.945068359375, 3.16015625, 3.375244140625, 3.59033203125, 3.805419921875, 4.0205078125, 4.235595703125, 4.45068359375, 4.665771484375, 4.880859375, 5.095947265625, 5.31103515625, 5.526123046875, 5.7412109375, 5.956298828125, 6.17138671875, 6.386474609375, 6.6015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 12.0, 8.0, 8.0, 14.0, 16.0, 26.0, 36.0, 70.0, 85.0, 108.0, 112.0, 120.0, 96.0, 62.0, 65.0, 42.0, 26.0, 19.0, 11.0, 10.0, 8.0, 7.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0003476142883300781, -0.00033862143754959106, -0.000329628586769104, -0.00032063573598861694, -0.0003116428852081299, -0.0003026500344276428, -0.00029365718364715576, -0.0002846643328666687, -0.00027567148208618164, -0.0002666786313056946, -0.0002576857805252075, -0.00024869292974472046, -0.0002397000789642334, -0.00023070722818374634, -0.00022171437740325928, -0.00021272152662277222, -0.00020372867584228516, -0.0001947358250617981, -0.00018574297428131104, -0.00017675012350082397, -0.00016775727272033691, -0.00015876442193984985, -0.0001497715711593628, -0.00014077872037887573, -0.00013178586959838867, -0.0001227930188179016, -0.00011380016803741455, -0.00010480731725692749, -9.581446647644043e-05, -8.682161569595337e-05, -7.782876491546631e-05, -6.883591413497925e-05, -5.984306335449219e-05, -5.085021257400513e-05, -4.1857361793518066e-05, -3.2864511013031006e-05, -2.3871660232543945e-05, -1.4878809452056885e-05, -5.885958671569824e-06, 3.1068921089172363e-06, 1.2099742889404297e-05, 2.1092593669891357e-05, 3.0085444450378418e-05, 3.907829523086548e-05, 4.807114601135254e-05, 5.70639967918396e-05, 6.605684757232666e-05, 7.504969835281372e-05, 8.404254913330078e-05, 9.303539991378784e-05, 0.0001020282506942749, 0.00011102110147476196, 0.00012001395225524902, 0.00012900680303573608, 0.00013799965381622314, 0.0001469925045967102, 0.00015598535537719727, 0.00016497820615768433, 0.0001739710569381714, 0.00018296390771865845, 0.0001919567584991455, 0.00020094960927963257, 0.00020994246006011963, 0.0002189353108406067, 0.00022792816162109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 13.0, 14.0, 14.0, 24.0, 29.0, 51.0, 55.0, 91.0, 124.0, 173.0, 218.0, 343.0, 498.0, 666.0, 1102.0, 1734.0, 3172.0, 6166.0, 13838.0, 34243.0, 94907.0, 274367.0, 374288.0, 150979.0, 52100.0, 20198.0, 8728.0, 4119.0, 2225.0, 1366.0, 816.0, 539.0, 422.0, 249.0, 178.0, 151.0, 112.0, 60.0, 48.0, 49.0, 29.0, 20.0, 16.0, 5.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.1044921875, -4.935546875, -4.7666015625, -4.59765625, -4.4287109375, -4.259765625, -4.0908203125, -3.921875, -3.7529296875, -3.583984375, -3.4150390625, -3.24609375, -3.0771484375, -2.908203125, -2.7392578125, -2.5703125, -2.4013671875, -2.232421875, -2.0634765625, -1.89453125, -1.7255859375, -1.556640625, -1.3876953125, -1.21875, -1.0498046875, -0.880859375, -0.7119140625, -0.54296875, -0.3740234375, -0.205078125, -0.0361328125, 0.1328125, 0.3017578125, 0.470703125, 0.6396484375, 0.80859375, 0.9775390625, 1.146484375, 1.3154296875, 1.484375, 1.6533203125, 1.822265625, 1.9912109375, 2.16015625, 2.3291015625, 2.498046875, 2.6669921875, 2.8359375, 3.0048828125, 3.173828125, 3.3427734375, 3.51171875, 3.6806640625, 3.849609375, 4.0185546875, 4.1875, 4.3564453125, 4.525390625, 4.6943359375, 4.86328125, 5.0322265625, 5.201171875, 5.3701171875, 5.5390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 7.0, 8.0, 6.0, 22.0, 19.0, 14.0, 26.0, 20.0, 33.0, 29.0, 58.0, 59.0, 72.0, 75.0, 84.0, 90.0, 55.0, 47.0, 39.0, 35.0, 24.0, 28.0, 23.0, 20.0, 12.0, 22.0, 14.0, 9.0, 8.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.271484375, -1.23211669921875, -1.1927490234375, -1.15338134765625, -1.114013671875, -1.07464599609375, -1.0352783203125, -0.99591064453125, -0.95654296875, -0.91717529296875, -0.8778076171875, -0.83843994140625, -0.799072265625, -0.75970458984375, -0.7203369140625, -0.68096923828125, -0.6416015625, -0.60223388671875, -0.5628662109375, -0.52349853515625, -0.484130859375, -0.44476318359375, -0.4053955078125, -0.36602783203125, -0.32666015625, -0.28729248046875, -0.2479248046875, -0.20855712890625, -0.169189453125, -0.12982177734375, -0.0904541015625, -0.05108642578125, -0.01171875, 0.02764892578125, 0.0670166015625, 0.10638427734375, 0.145751953125, 0.18511962890625, 0.2244873046875, 0.26385498046875, 0.30322265625, 0.34259033203125, 0.3819580078125, 0.42132568359375, 0.460693359375, 0.50006103515625, 0.5394287109375, 0.57879638671875, 0.6181640625, 0.65753173828125, 0.6968994140625, 0.73626708984375, 0.775634765625, 0.81500244140625, 0.8543701171875, 0.89373779296875, 0.93310546875, 0.97247314453125, 1.0118408203125, 1.05120849609375, 1.090576171875, 1.12994384765625, 1.1693115234375, 1.20867919921875, 1.248046875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 9.0, 2.0, 4.0, 12.0, 10.0, 16.0, 12.0, 15.0, 16.0, 33.0, 24.0, 29.0, 36.0, 40.0, 51.0, 52.0, 37.0, 54.0, 55.0, 57.0, 46.0, 59.0, 40.0, 43.0, 39.0, 38.0, 40.0, 37.0, 20.0, 18.0, 15.0, 17.0, 8.0, 6.0, 10.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84889602661133, -51.19302749633789, -49.53715896606445, -47.88129425048828, -46.225425720214844, -44.569557189941406, -42.91368865966797, -41.25782012939453, -39.601951599121094, -37.946083068847656, -36.29021453857422, -34.63434600830078, -32.97848129272461, -31.322612762451172, -29.666744232177734, -28.010875701904297, -26.355010986328125, -24.699142456054688, -23.043275833129883, -21.387407302856445, -19.73154067993164, -18.075672149658203, -16.419803619384766, -14.763936042785645, -13.108068466186523, -11.452200889587402, -9.796333312988281, -8.140464782714844, -6.484597206115723, -4.828729629516602, -3.172861099243164, -1.516993522644043, 0.13887405395507812, 1.7947418689727783, 3.4506096839904785, 5.106477737426758, 6.762345314025879, 8.418212890625, 10.074081420898438, 11.729948997497559, 13.38581657409668, 15.0416841506958, 16.697551727294922, 18.35342025756836, 20.009288787841797, 21.6651554107666, 23.32102394104004, 24.976890563964844, 26.63275909423828, 28.28862762451172, 29.944494247436523, 31.60036277770996, 33.256229400634766, 34.9120979309082, 36.56796646118164, 38.22383499145508, 39.87969970703125, 41.53556823730469, 43.191436767578125, 44.84730529785156, 46.503170013427734, 48.15903854370117, 49.81490707397461, 51.47077560424805, 53.126644134521484]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 2.0, 4.0, 4.0, 9.0, 10.0, 12.0, 15.0, 8.0, 8.0, 24.0, 16.0, 21.0, 10.0, 21.0, 34.0, 31.0, 34.0, 24.0, 28.0, 40.0, 33.0, 45.0, 35.0, 30.0, 43.0, 39.0, 37.0, 36.0, 34.0, 30.0, 32.0, 28.0, 30.0, 31.0, 26.0, 21.0, 20.0, 21.0, 15.0, 14.0, 7.0, 7.0, 6.0, 9.0, 10.0, 3.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-53.85544204711914, -52.34960174560547, -50.84375762939453, -49.33791732788086, -47.83207702636719, -46.32623291015625, -44.82039260864258, -43.314552307128906, -41.80870819091797, -40.3028678894043, -38.79702377319336, -37.29118347167969, -35.785343170166016, -34.279502868652344, -32.773658752441406, -31.267818450927734, -29.761978149414062, -28.256135940551758, -26.750295639038086, -25.24445343017578, -23.73861312866211, -22.232770919799805, -20.7269287109375, -19.221088409423828, -17.715246200561523, -16.20940399169922, -14.703563690185547, -13.197721481323242, -11.691880226135254, -10.186038970947266, -8.680196762084961, -7.174355506896973, -5.668510437011719, -4.1626691818237305, -2.656827449798584, -1.1509857177734375, 0.3548555374145508, 1.860696792602539, 3.3665390014648438, 4.872380256652832, 6.37822151184082, 7.884062767028809, 9.389904022216797, 10.895746231079102, 12.40158748626709, 13.907428741455078, 15.413270950317383, 16.919113159179688, 18.42495346069336, 19.930795669555664, 21.436635971069336, 22.94247817993164, 24.448318481445312, 25.954160690307617, 27.460002899169922, 28.965843200683594, 30.4716854095459, 31.977527618408203, 33.483367919921875, 34.98921203613281, 36.495052337646484, 38.000892639160156, 39.506736755371094, 41.012577056884766, 42.51841735839844]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 11.0, 24.0, 48.0, 64.0, 120.0, 176.0, 311.0, 490.0, 771.0, 1261.0, 2094.0, 3196.0, 5252.0, 8280.0, 12425.0, 18425.0, 26687.0, 36855.0, 50167.0, 64577.0, 78079.0, 90307.0, 98037.0, 99253.0, 95045.0, 85229.0, 72258.0, 57613.0, 43906.0, 32156.0, 22566.0, 15263.0, 10129.0, 6548.0, 4186.0, 2558.0, 1652.0, 966.0, 612.0, 409.0, 220.0, 145.0, 72.0, 50.0, 25.0, 16.0, 8.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0], "bins": [-25.65625, -24.907470703125, -24.15869140625, -23.409912109375, -22.6611328125, -21.912353515625, -21.16357421875, -20.414794921875, -19.666015625, -18.917236328125, -18.16845703125, -17.419677734375, -16.6708984375, -15.922119140625, -15.17333984375, -14.424560546875, -13.67578125, -12.927001953125, -12.17822265625, -11.429443359375, -10.6806640625, -9.931884765625, -9.18310546875, -8.434326171875, -7.685546875, -6.936767578125, -6.18798828125, -5.439208984375, -4.6904296875, -3.941650390625, -3.19287109375, -2.444091796875, -1.6953125, -0.946533203125, -0.19775390625, 0.551025390625, 1.2998046875, 2.048583984375, 2.79736328125, 3.546142578125, 4.294921875, 5.043701171875, 5.79248046875, 6.541259765625, 7.2900390625, 8.038818359375, 8.78759765625, 9.536376953125, 10.28515625, 11.033935546875, 11.78271484375, 12.531494140625, 13.2802734375, 14.029052734375, 14.77783203125, 15.526611328125, 16.275390625, 17.024169921875, 17.77294921875, 18.521728515625, 19.2705078125, 20.019287109375, 20.76806640625, 21.516845703125, 22.265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 10.0, 11.0, 12.0, 15.0, 8.0, 11.0, 22.0, 18.0, 19.0, 10.0, 23.0, 30.0, 34.0, 29.0, 26.0, 31.0, 38.0, 31.0, 48.0, 33.0, 33.0, 40.0, 39.0, 35.0, 34.0, 36.0, 30.0, 33.0, 26.0, 31.0, 30.0, 27.0, 20.0, 23.0, 19.0, 13.0, 15.0, 6.0, 10.0, 5.0, 10.0, 9.0, 3.0, 1.0, 5.0, 5.0, 0.0, 4.0, 1.0], "bins": [-52.5625, -51.091796875, -49.62109375, -48.150390625, -46.6796875, -45.208984375, -43.73828125, -42.267578125, -40.796875, -39.326171875, -37.85546875, -36.384765625, -34.9140625, -33.443359375, -31.97265625, -30.501953125, -29.03125, -27.560546875, -26.08984375, -24.619140625, -23.1484375, -21.677734375, -20.20703125, -18.736328125, -17.265625, -15.794921875, -14.32421875, -12.853515625, -11.3828125, -9.912109375, -8.44140625, -6.970703125, -5.5, -4.029296875, -2.55859375, -1.087890625, 0.3828125, 1.853515625, 3.32421875, 4.794921875, 6.265625, 7.736328125, 9.20703125, 10.677734375, 12.1484375, 13.619140625, 15.08984375, 16.560546875, 18.03125, 19.501953125, 20.97265625, 22.443359375, 23.9140625, 25.384765625, 26.85546875, 28.326171875, 29.796875, 31.267578125, 32.73828125, 34.208984375, 35.6796875, 37.150390625, 38.62109375, 40.091796875, 41.5625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 14.0, 36.0, 54.0, 91.0, 148.0, 196.0, 280.0, 470.0, 746.0, 1112.0, 1763.0, 2661.0, 3935.0, 5808.0, 8563.0, 12365.0, 17997.0, 24517.0, 33426.0, 44387.0, 55597.0, 68415.0, 79185.0, 87085.0, 91352.0, 90010.0, 84979.0, 75788.0, 63973.0, 51531.0, 40506.0, 30068.0, 22249.0, 15981.0, 10966.0, 7510.0, 4987.0, 3370.0, 2226.0, 1546.0, 942.0, 622.0, 389.0, 247.0, 171.0, 109.0, 66.0, 48.0, 22.0, 17.0, 13.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.240966796875, -20.52880859375, -19.816650390625, -19.1044921875, -18.392333984375, -17.68017578125, -16.968017578125, -16.255859375, -15.543701171875, -14.83154296875, -14.119384765625, -13.4072265625, -12.695068359375, -11.98291015625, -11.270751953125, -10.55859375, -9.846435546875, -9.13427734375, -8.422119140625, -7.7099609375, -6.997802734375, -6.28564453125, -5.573486328125, -4.861328125, -4.149169921875, -3.43701171875, -2.724853515625, -2.0126953125, -1.300537109375, -0.58837890625, 0.123779296875, 0.8359375, 1.548095703125, 2.26025390625, 2.972412109375, 3.6845703125, 4.396728515625, 5.10888671875, 5.821044921875, 6.533203125, 7.245361328125, 7.95751953125, 8.669677734375, 9.3818359375, 10.093994140625, 10.80615234375, 11.518310546875, 12.23046875, 12.942626953125, 13.65478515625, 14.366943359375, 15.0791015625, 15.791259765625, 16.50341796875, 17.215576171875, 17.927734375, 18.639892578125, 19.35205078125, 20.064208984375, 20.7763671875, 21.488525390625, 22.20068359375, 22.912841796875, 23.625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 12.0, 17.0, 8.0, 20.0, 13.0, 24.0, 23.0, 16.0, 30.0, 29.0, 37.0, 25.0, 34.0, 46.0, 34.0, 41.0, 38.0, 30.0, 40.0, 35.0, 41.0, 39.0, 34.0, 33.0, 33.0, 35.0, 31.0, 30.0, 21.0, 22.0, 21.0, 13.0, 9.0, 12.0, 11.0, 3.0, 12.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-35.9375, -34.921875, -33.90625, -32.890625, -31.875, -30.859375, -29.84375, -28.828125, -27.8125, -26.796875, -25.78125, -24.765625, -23.75, -22.734375, -21.71875, -20.703125, -19.6875, -18.671875, -17.65625, -16.640625, -15.625, -14.609375, -13.59375, -12.578125, -11.5625, -10.546875, -9.53125, -8.515625, -7.5, -6.484375, -5.46875, -4.453125, -3.4375, -2.421875, -1.40625, -0.390625, 0.625, 1.640625, 2.65625, 3.671875, 4.6875, 5.703125, 6.71875, 7.734375, 8.75, 9.765625, 10.78125, 11.796875, 12.8125, 13.828125, 14.84375, 15.859375, 16.875, 17.890625, 18.90625, 19.921875, 20.9375, 21.953125, 22.96875, 23.984375, 25.0, 26.015625, 27.03125, 28.046875, 29.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 9.0, 6.0, 13.0, 16.0, 28.0, 31.0, 56.0, 77.0, 98.0, 122.0, 208.0, 310.0, 398.0, 683.0, 1052.0, 1814.0, 3298.0, 6967.0, 15555.0, 35632.0, 76645.0, 141659.0, 202342.0, 213752.0, 164942.0, 96220.0, 47195.0, 20617.0, 8987.0, 4145.0, 2167.0, 1177.0, 763.0, 471.0, 326.0, 241.0, 168.0, 93.0, 74.0, 68.0, 36.0, 28.0, 18.0, 18.0, 11.0, 7.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-21.296875, -20.65478515625, -20.0126953125, -19.37060546875, -18.728515625, -18.08642578125, -17.4443359375, -16.80224609375, -16.16015625, -15.51806640625, -14.8759765625, -14.23388671875, -13.591796875, -12.94970703125, -12.3076171875, -11.66552734375, -11.0234375, -10.38134765625, -9.7392578125, -9.09716796875, -8.455078125, -7.81298828125, -7.1708984375, -6.52880859375, -5.88671875, -5.24462890625, -4.6025390625, -3.96044921875, -3.318359375, -2.67626953125, -2.0341796875, -1.39208984375, -0.75, -0.10791015625, 0.5341796875, 1.17626953125, 1.818359375, 2.46044921875, 3.1025390625, 3.74462890625, 4.38671875, 5.02880859375, 5.6708984375, 6.31298828125, 6.955078125, 7.59716796875, 8.2392578125, 8.88134765625, 9.5234375, 10.16552734375, 10.8076171875, 11.44970703125, 12.091796875, 12.73388671875, 13.3759765625, 14.01806640625, 14.66015625, 15.30224609375, 15.9443359375, 16.58642578125, 17.228515625, 17.87060546875, 18.5126953125, 19.15478515625, 19.796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 8.0, 10.0, 15.0, 19.0, 19.0, 30.0, 20.0, 37.0, 40.0, 35.0, 54.0, 51.0, 43.0, 55.0, 64.0, 53.0, 53.0, 61.0, 51.0, 46.0, 39.0, 31.0, 26.0, 28.0, 20.0, 19.0, 23.0, 6.0, 12.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013170242309570312, -0.0012707114219665527, -0.0012243986129760742, -0.0011780858039855957, -0.0011317729949951172, -0.0010854601860046387, -0.0010391473770141602, -0.0009928345680236816, -0.0009465217590332031, -0.0009002089500427246, -0.0008538961410522461, -0.0008075833320617676, -0.0007612705230712891, -0.0007149577140808105, -0.000668644905090332, -0.0006223320960998535, -0.000576019287109375, -0.0005297064781188965, -0.00048339366912841797, -0.00043708086013793945, -0.00039076805114746094, -0.0003444552421569824, -0.0002981424331665039, -0.0002518296241760254, -0.00020551681518554688, -0.00015920400619506836, -0.00011289119720458984, -6.657838821411133e-05, -2.0265579223632812e-05, 2.6047229766845703e-05, 7.236003875732422e-05, 0.00011867284774780273, 0.00016498565673828125, 0.00021129846572875977, 0.0002576112747192383, 0.0003039240837097168, 0.0003502368927001953, 0.00039654970169067383, 0.00044286251068115234, 0.0004891753196716309, 0.0005354881286621094, 0.0005818009376525879, 0.0006281137466430664, 0.0006744265556335449, 0.0007207393646240234, 0.000767052173614502, 0.0008133649826049805, 0.000859677791595459, 0.0009059906005859375, 0.000952303409576416, 0.0009986162185668945, 0.001044929027557373, 0.0010912418365478516, 0.00113755464553833, 0.0011838674545288086, 0.0012301802635192871, 0.0012764930725097656, 0.0013228058815002441, 0.0013691186904907227, 0.0014154314994812012, 0.0014617443084716797, 0.0015080571174621582, 0.0015543699264526367, 0.0016006827354431152, 0.0016469955444335938]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 18.0, 19.0, 34.0, 40.0, 55.0, 69.0, 85.0, 148.0, 185.0, 246.0, 390.0, 612.0, 910.0, 1437.0, 2320.0, 4167.0, 7627.0, 15389.0, 31685.0, 63587.0, 114856.0, 173616.0, 201202.0, 175957.0, 118901.0, 66418.0, 33220.0, 16229.0, 8132.0, 4141.0, 2376.0, 1526.0, 893.0, 597.0, 399.0, 269.0, 197.0, 149.0, 103.0, 82.0, 59.0, 46.0, 35.0, 21.0, 21.0, 15.0, 9.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-20.5625, -19.910400390625, -19.25830078125, -18.606201171875, -17.9541015625, -17.302001953125, -16.64990234375, -15.997802734375, -15.345703125, -14.693603515625, -14.04150390625, -13.389404296875, -12.7373046875, -12.085205078125, -11.43310546875, -10.781005859375, -10.12890625, -9.476806640625, -8.82470703125, -8.172607421875, -7.5205078125, -6.868408203125, -6.21630859375, -5.564208984375, -4.912109375, -4.260009765625, -3.60791015625, -2.955810546875, -2.3037109375, -1.651611328125, -0.99951171875, -0.347412109375, 0.3046875, 0.956787109375, 1.60888671875, 2.260986328125, 2.9130859375, 3.565185546875, 4.21728515625, 4.869384765625, 5.521484375, 6.173583984375, 6.82568359375, 7.477783203125, 8.1298828125, 8.781982421875, 9.43408203125, 10.086181640625, 10.73828125, 11.390380859375, 12.04248046875, 12.694580078125, 13.3466796875, 13.998779296875, 14.65087890625, 15.302978515625, 15.955078125, 16.607177734375, 17.25927734375, 17.911376953125, 18.5634765625, 19.215576171875, 19.86767578125, 20.519775390625, 21.171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 6.0, 12.0, 6.0, 12.0, 12.0, 18.0, 19.0, 26.0, 37.0, 32.0, 38.0, 49.0, 51.0, 55.0, 67.0, 60.0, 64.0, 52.0, 64.0, 57.0, 44.0, 42.0, 37.0, 28.0, 28.0, 17.0, 14.0, 9.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-8.7578125, -8.52984619140625, -8.3018798828125, -8.07391357421875, -7.845947265625, -7.61798095703125, -7.3900146484375, -7.16204833984375, -6.93408203125, -6.70611572265625, -6.4781494140625, -6.25018310546875, -6.022216796875, -5.79425048828125, -5.5662841796875, -5.33831787109375, -5.1103515625, -4.88238525390625, -4.6544189453125, -4.42645263671875, -4.198486328125, -3.97052001953125, -3.7425537109375, -3.51458740234375, -3.28662109375, -3.05865478515625, -2.8306884765625, -2.60272216796875, -2.374755859375, -2.14678955078125, -1.9188232421875, -1.69085693359375, -1.462890625, -1.23492431640625, -1.0069580078125, -0.77899169921875, -0.551025390625, -0.32305908203125, -0.0950927734375, 0.13287353515625, 0.36083984375, 0.58880615234375, 0.8167724609375, 1.04473876953125, 1.272705078125, 1.50067138671875, 1.7286376953125, 1.95660400390625, 2.1845703125, 2.41253662109375, 2.6405029296875, 2.86846923828125, 3.096435546875, 3.32440185546875, 3.5523681640625, 3.78033447265625, 4.00830078125, 4.23626708984375, 4.4642333984375, 4.69219970703125, 4.920166015625, 5.14813232421875, 5.3760986328125, 5.60406494140625, 5.83203125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 7.0, 13.0, 12.0, 15.0, 16.0, 21.0, 33.0, 16.0, 32.0, 41.0, 39.0, 38.0, 40.0, 51.0, 54.0, 55.0, 39.0, 42.0, 49.0, 53.0, 36.0, 38.0, 39.0, 43.0, 36.0, 31.0, 21.0, 15.0, 7.0, 17.0, 10.0, 9.0, 7.0, 7.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.55038833618164, -50.966552734375, -49.38271713256836, -47.79888153076172, -46.21504592895508, -44.63121032714844, -43.0473747253418, -41.463539123535156, -39.879703521728516, -38.295867919921875, -36.712032318115234, -35.128196716308594, -33.54436111450195, -31.960525512695312, -30.376689910888672, -28.79285430908203, -27.20901870727539, -25.62518310546875, -24.04134750366211, -22.45751190185547, -20.873676300048828, -19.289840698242188, -17.706005096435547, -16.122169494628906, -14.538333892822266, -12.954498291015625, -11.370662689208984, -9.786827087402344, -8.202991485595703, -6.6191558837890625, -5.035320281982422, -3.4514846801757812, -1.8676528930664062, -0.2838172912597656, 1.300018310546875, 2.8838539123535156, 4.467689514160156, 6.051525115966797, 7.6353607177734375, 9.219196319580078, 10.803031921386719, 12.38686752319336, 13.970703125, 15.55453872680664, 17.13837432861328, 18.722209930419922, 20.306045532226562, 21.889881134033203, 23.473716735839844, 25.057552337646484, 26.641387939453125, 28.225223541259766, 29.809059143066406, 31.392894744873047, 32.97673034667969, 34.56056594848633, 36.14440155029297, 37.72823715209961, 39.31207275390625, 40.89590835571289, 42.47974395751953, 44.06357955932617, 45.64741516113281, 47.23125076293945, 48.815086364746094]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 1.0, 7.0, 7.0, 6.0, 13.0, 11.0, 20.0, 21.0, 18.0, 19.0, 14.0, 23.0, 31.0, 23.0, 40.0, 33.0, 42.0, 41.0, 34.0, 39.0, 44.0, 45.0, 48.0, 37.0, 33.0, 38.0, 51.0, 29.0, 33.0, 31.0, 21.0, 23.0, 16.0, 23.0, 16.0, 10.0, 22.0, 8.0, 8.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.95321273803711, -54.19675827026367, -52.440303802490234, -50.6838493347168, -48.92739486694336, -47.17094039916992, -45.41448211669922, -43.65802764892578, -41.901573181152344, -40.145118713378906, -38.38866424560547, -36.63220977783203, -34.875755310058594, -33.119300842285156, -31.362844467163086, -29.60638999938965, -27.849937438964844, -26.093482971191406, -24.33702850341797, -22.58057403564453, -20.824119567871094, -19.067665100097656, -17.311208724975586, -15.554754257202148, -13.798299789428711, -12.041845321655273, -10.285390853881836, -8.528935432434082, -6.7724809646606445, -5.016026496887207, -3.259571075439453, -1.5031166076660156, 0.25333404541015625, 2.009788751602173, 3.7662434577941895, 5.522698402404785, 7.279152870178223, 9.03560733795166, 10.792062759399414, 12.548517227172852, 14.304971694946289, 16.061426162719727, 17.817880630493164, 19.574337005615234, 21.330791473388672, 23.08724594116211, 24.843700408935547, 26.600154876708984, 28.356609344482422, 30.11306381225586, 31.869518280029297, 33.625972747802734, 35.38242721557617, 37.13888168334961, 38.89533996582031, 40.65179443359375, 42.40824890136719, 44.164703369140625, 45.92115783691406, 47.6776123046875, 49.43406677246094, 51.190521240234375, 52.94697570800781, 54.70343017578125, 56.45988464355469]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 3.0, 11.0, 17.0, 29.0, 55.0, 110.0, 180.0, 287.0, 496.0, 831.0, 1459.0, 2298.0, 3733.0, 6149.0, 9794.0, 15011.0, 22972.0, 34176.0, 50806.0, 71543.0, 99305.0, 133676.0, 173647.0, 217803.0, 262955.0, 302769.0, 332441.0, 349552.0, 350054.0, 333763.0, 303300.0, 264438.0, 220588.0, 174918.0, 135276.0, 100305.0, 71669.0, 50341.0, 34353.0, 23241.0, 14749.0, 9586.0, 6028.0, 3773.0, 2349.0, 1430.0, 883.0, 482.0, 271.0, 177.0, 102.0, 47.0, 23.0, 12.0, 11.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-28.125, -27.218017578125, -26.31103515625, -25.404052734375, -24.4970703125, -23.590087890625, -22.68310546875, -21.776123046875, -20.869140625, -19.962158203125, -19.05517578125, -18.148193359375, -17.2412109375, -16.334228515625, -15.42724609375, -14.520263671875, -13.61328125, -12.706298828125, -11.79931640625, -10.892333984375, -9.9853515625, -9.078369140625, -8.17138671875, -7.264404296875, -6.357421875, -5.450439453125, -4.54345703125, -3.636474609375, -2.7294921875, -1.822509765625, -0.91552734375, -0.008544921875, 0.8984375, 1.805419921875, 2.71240234375, 3.619384765625, 4.5263671875, 5.433349609375, 6.34033203125, 7.247314453125, 8.154296875, 9.061279296875, 9.96826171875, 10.875244140625, 11.7822265625, 12.689208984375, 13.59619140625, 14.503173828125, 15.41015625, 16.317138671875, 17.22412109375, 18.131103515625, 19.0380859375, 19.945068359375, 20.85205078125, 21.759033203125, 22.666015625, 23.572998046875, 24.47998046875, 25.386962890625, 26.2939453125, 27.200927734375, 28.10791015625, 29.014892578125, 29.921875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 6.0, 8.0, 10.0, 13.0, 18.0, 19.0, 20.0, 23.0, 12.0, 26.0, 21.0, 27.0, 35.0, 37.0, 35.0, 39.0, 44.0, 31.0, 45.0, 44.0, 51.0, 41.0, 30.0, 39.0, 42.0, 42.0, 32.0, 26.0, 23.0, 25.0, 17.0, 20.0, 20.0, 14.0, 17.0, 11.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.96875, -47.44140625, -45.9140625, -44.38671875, -42.859375, -41.33203125, -39.8046875, -38.27734375, -36.75, -35.22265625, -33.6953125, -32.16796875, -30.640625, -29.11328125, -27.5859375, -26.05859375, -24.53125, -23.00390625, -21.4765625, -19.94921875, -18.421875, -16.89453125, -15.3671875, -13.83984375, -12.3125, -10.78515625, -9.2578125, -7.73046875, -6.203125, -4.67578125, -3.1484375, -1.62109375, -0.09375, 1.43359375, 2.9609375, 4.48828125, 6.015625, 7.54296875, 9.0703125, 10.59765625, 12.125, 13.65234375, 15.1796875, 16.70703125, 18.234375, 19.76171875, 21.2890625, 22.81640625, 24.34375, 25.87109375, 27.3984375, 28.92578125, 30.453125, 31.98046875, 33.5078125, 35.03515625, 36.5625, 38.08984375, 39.6171875, 41.14453125, 42.671875, 44.19921875, 45.7265625, 47.25390625, 48.78125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 12.0, 14.0, 25.0, 41.0, 62.0, 120.0, 258.0, 484.0, 736.0, 1333.0, 2300.0, 3858.0, 6330.0, 9996.0, 16013.0, 24392.0, 36534.0, 53172.0, 76026.0, 103795.0, 139149.0, 176918.0, 219422.0, 259528.0, 296401.0, 321917.0, 338015.0, 336925.0, 324070.0, 297040.0, 262051.0, 221247.0, 180569.0, 141552.0, 106473.0, 77420.0, 54584.0, 37358.0, 25126.0, 16567.0, 10447.0, 6428.0, 3979.0, 2356.0, 1373.0, 816.0, 457.0, 267.0, 143.0, 81.0, 54.0, 28.0, 15.0, 7.0, 6.0, 2.0, 2.0, 1.0], "bins": [-30.71875, -29.788818359375, -28.85888671875, -27.928955078125, -26.9990234375, -26.069091796875, -25.13916015625, -24.209228515625, -23.279296875, -22.349365234375, -21.41943359375, -20.489501953125, -19.5595703125, -18.629638671875, -17.69970703125, -16.769775390625, -15.83984375, -14.909912109375, -13.97998046875, -13.050048828125, -12.1201171875, -11.190185546875, -10.26025390625, -9.330322265625, -8.400390625, -7.470458984375, -6.54052734375, -5.610595703125, -4.6806640625, -3.750732421875, -2.82080078125, -1.890869140625, -0.9609375, -0.031005859375, 0.89892578125, 1.828857421875, 2.7587890625, 3.688720703125, 4.61865234375, 5.548583984375, 6.478515625, 7.408447265625, 8.33837890625, 9.268310546875, 10.1982421875, 11.128173828125, 12.05810546875, 12.988037109375, 13.91796875, 14.847900390625, 15.77783203125, 16.707763671875, 17.6376953125, 18.567626953125, 19.49755859375, 20.427490234375, 21.357421875, 22.287353515625, 23.21728515625, 24.147216796875, 25.0771484375, 26.007080078125, 26.93701171875, 27.866943359375, 28.796875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 7.0, 11.0, 12.0, 22.0, 23.0, 32.0, 36.0, 61.0, 70.0, 69.0, 91.0, 120.0, 147.0, 162.0, 151.0, 163.0, 204.0, 208.0, 197.0, 230.0, 218.0, 231.0, 222.0, 204.0, 179.0, 169.0, 143.0, 146.0, 84.0, 96.0, 78.0, 59.0, 56.0, 50.0, 32.0, 31.0, 14.0, 16.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.234375, -19.484375, -18.734375, -17.984375, -17.234375, -16.484375, -15.734375, -14.984375, -14.234375, -13.484375, -12.734375, -11.984375, -11.234375, -10.484375, -9.734375, -8.984375, -8.234375, -7.484375, -6.734375, -5.984375, -5.234375, -4.484375, -3.734375, -2.984375, -2.234375, -1.484375, -0.734375, 0.015625, 0.765625, 1.515625, 2.265625, 3.015625, 3.765625, 4.515625, 5.265625, 6.015625, 6.765625, 7.515625, 8.265625, 9.015625, 9.765625, 10.515625, 11.265625, 12.015625, 12.765625, 13.515625, 14.265625, 15.015625, 15.765625, 16.515625, 17.265625, 18.015625, 18.765625, 19.515625, 20.265625, 21.015625, 21.765625, 22.515625, 23.265625, 24.015625, 24.765625, 25.515625, 26.265625, 27.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 3.0, 3.0, 6.0, 6.0, 13.0, 15.0, 9.0, 18.0, 17.0, 16.0, 21.0, 22.0, 20.0, 23.0, 28.0, 28.0, 43.0, 38.0, 36.0, 40.0, 42.0, 42.0, 53.0, 43.0, 45.0, 27.0, 42.0, 43.0, 27.0, 31.0, 27.0, 29.0, 31.0, 18.0, 21.0, 16.0, 13.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.8953742980957, -43.49043273925781, -42.08549499511719, -40.6805534362793, -39.275611877441406, -37.87067413330078, -36.46573257446289, -35.060791015625, -33.655853271484375, -32.250911712646484, -30.84597396850586, -29.44103240966797, -28.03609275817871, -26.631153106689453, -25.226211547851562, -23.821271896362305, -22.416332244873047, -21.01139259338379, -19.60645294189453, -18.20151138305664, -16.796571731567383, -15.391632080078125, -13.98669147491455, -12.581750869750977, -11.176811218261719, -9.771871566772461, -8.366930961608887, -6.961990833282471, -5.557050704956055, -4.152110576629639, -2.7471704483032227, -1.3422298431396484, 0.06270599365234375, 1.4676461219787598, 2.872586250305176, 4.277526378631592, 5.682466506958008, 7.087406635284424, 8.49234676361084, 9.897287368774414, 11.302227020263672, 12.70716667175293, 14.112107276916504, 15.517047882080078, 16.921987533569336, 18.326927185058594, 19.731868743896484, 21.136808395385742, 22.541748046875, 23.946687698364258, 25.351627349853516, 26.756568908691406, 28.161508560180664, 29.566448211669922, 30.971389770507812, 32.37632751464844, 33.78126907348633, 35.18621063232422, 36.591148376464844, 37.996089935302734, 39.401031494140625, 40.80596923828125, 42.21091079711914, 43.61585235595703, 45.020790100097656]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 4.0, 8.0, 6.0, 8.0, 17.0, 13.0, 11.0, 16.0, 17.0, 19.0, 27.0, 25.0, 24.0, 31.0, 28.0, 34.0, 43.0, 39.0, 43.0, 29.0, 39.0, 37.0, 41.0, 45.0, 36.0, 35.0, 38.0, 30.0, 33.0, 25.0, 22.0, 18.0, 19.0, 27.0, 16.0, 18.0, 13.0, 9.0, 10.0, 9.0, 5.0, 3.0, 10.0, 8.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.34261703491211, -47.694156646728516, -46.04570007324219, -44.397239685058594, -42.748783111572266, -41.10032272338867, -39.451866149902344, -37.80340576171875, -36.154945373535156, -34.50648498535156, -32.858028411865234, -31.20956802368164, -29.561111450195312, -27.91265106201172, -26.264192581176758, -24.615734100341797, -22.96727752685547, -21.318819046020508, -19.670360565185547, -18.021900177001953, -16.373443603515625, -14.724984169006348, -13.07652473449707, -11.42806625366211, -9.779607772827148, -8.131149291992188, -6.482690334320068, -4.834231376647949, -3.1857728958129883, -1.5373144149780273, 0.11114501953125, 1.759603500366211, 3.408061981201172, 5.056520462036133, 6.704979419708252, 8.353438377380371, 10.001896858215332, 11.650355339050293, 13.29881477355957, 14.947273254394531, 16.595731735229492, 18.244190216064453, 19.892648696899414, 21.541107177734375, 23.18956756591797, 24.838024139404297, 26.48648452758789, 28.13494300842285, 29.783401489257812, 31.431859970092773, 33.080318450927734, 34.72877883911133, 36.377235412597656, 38.02569580078125, 39.674156188964844, 41.32261276245117, 42.9710693359375, 44.619529724121094, 46.26798629760742, 47.916446685791016, 49.564903259277344, 51.21336364746094, 52.86182403564453, 54.51028060913086, 56.15874099731445]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 12.0, 23.0, 27.0, 40.0, 75.0, 88.0, 141.0, 210.0, 345.0, 497.0, 733.0, 1076.0, 1561.0, 2315.0, 3674.0, 5398.0, 8105.0, 12369.0, 18811.0, 28409.0, 43097.0, 65267.0, 97917.0, 138983.0, 164861.0, 144818.0, 103976.0, 69962.0, 46044.0, 30367.0, 19957.0, 13323.0, 8745.0, 5696.0, 3844.0, 2513.0, 1767.0, 1103.0, 794.0, 546.0, 368.0, 241.0, 142.0, 103.0, 81.0, 41.0, 30.0, 25.0, 13.0, 6.0, 11.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.3984375, -4.2674560546875, -4.136474609375, -4.0054931640625, -3.87451171875, -3.7435302734375, -3.612548828125, -3.4815673828125, -3.3505859375, -3.2196044921875, -3.088623046875, -2.9576416015625, -2.82666015625, -2.6956787109375, -2.564697265625, -2.4337158203125, -2.302734375, -2.1717529296875, -2.040771484375, -1.9097900390625, -1.77880859375, -1.6478271484375, -1.516845703125, -1.3858642578125, -1.2548828125, -1.1239013671875, -0.992919921875, -0.8619384765625, -0.73095703125, -0.5999755859375, -0.468994140625, -0.3380126953125, -0.20703125, -0.0760498046875, 0.054931640625, 0.1859130859375, 0.31689453125, 0.4478759765625, 0.578857421875, 0.7098388671875, 0.8408203125, 0.9718017578125, 1.102783203125, 1.2337646484375, 1.36474609375, 1.4957275390625, 1.626708984375, 1.7576904296875, 1.888671875, 2.0196533203125, 2.150634765625, 2.2816162109375, 2.41259765625, 2.5435791015625, 2.674560546875, 2.8055419921875, 2.9365234375, 3.0675048828125, 3.198486328125, 3.3294677734375, 3.46044921875, 3.5914306640625, 3.722412109375, 3.8533935546875, 3.984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 17.0, 13.0, 11.0, 18.0, 15.0, 19.0, 28.0, 23.0, 25.0, 33.0, 26.0, 35.0, 42.0, 39.0, 43.0, 31.0, 38.0, 36.0, 42.0, 44.0, 37.0, 34.0, 39.0, 29.0, 31.0, 27.0, 22.0, 17.0, 21.0, 25.0, 17.0, 18.0, 10.0, 12.0, 10.0, 9.0, 5.0, 3.0, 8.0, 9.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.25, -47.60400390625, -45.9580078125, -44.31201171875, -42.666015625, -41.02001953125, -39.3740234375, -37.72802734375, -36.08203125, -34.43603515625, -32.7900390625, -31.14404296875, -29.498046875, -27.85205078125, -26.2060546875, -24.56005859375, -22.9140625, -21.26806640625, -19.6220703125, -17.97607421875, -16.330078125, -14.68408203125, -13.0380859375, -11.39208984375, -9.74609375, -8.10009765625, -6.4541015625, -4.80810546875, -3.162109375, -1.51611328125, 0.1298828125, 1.77587890625, 3.421875, 5.06787109375, 6.7138671875, 8.35986328125, 10.005859375, 11.65185546875, 13.2978515625, 14.94384765625, 16.58984375, 18.23583984375, 19.8818359375, 21.52783203125, 23.173828125, 24.81982421875, 26.4658203125, 28.11181640625, 29.7578125, 31.40380859375, 33.0498046875, 34.69580078125, 36.341796875, 37.98779296875, 39.6337890625, 41.27978515625, 42.92578125, 44.57177734375, 46.2177734375, 47.86376953125, 49.509765625, 51.15576171875, 52.8017578125, 54.44775390625, 56.09375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 15.0, 5.0, 7.0, 17.0, 19.0, 25.0, 49.0, 39.0, 60.0, 89.0, 117.0, 167.0, 238.0, 307.0, 446.0, 647.0, 946.0, 1384.0, 2112.0, 3381.0, 5265.0, 8725.0, 15243.0, 27097.0, 51273.0, 101064.0, 203066.0, 281052.0, 165907.0, 81734.0, 41896.0, 22814.0, 12902.0, 7523.0, 4465.0, 2776.0, 1847.0, 1174.0, 792.0, 518.0, 354.0, 271.0, 191.0, 144.0, 95.0, 76.0, 53.0, 40.0, 36.0, 25.0, 24.0, 12.0, 18.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0], "bins": [-6.4375, -6.232177734375, -6.02685546875, -5.821533203125, -5.6162109375, -5.410888671875, -5.20556640625, -5.000244140625, -4.794921875, -4.589599609375, -4.38427734375, -4.178955078125, -3.9736328125, -3.768310546875, -3.56298828125, -3.357666015625, -3.15234375, -2.947021484375, -2.74169921875, -2.536376953125, -2.3310546875, -2.125732421875, -1.92041015625, -1.715087890625, -1.509765625, -1.304443359375, -1.09912109375, -0.893798828125, -0.6884765625, -0.483154296875, -0.27783203125, -0.072509765625, 0.1328125, 0.338134765625, 0.54345703125, 0.748779296875, 0.9541015625, 1.159423828125, 1.36474609375, 1.570068359375, 1.775390625, 1.980712890625, 2.18603515625, 2.391357421875, 2.5966796875, 2.802001953125, 3.00732421875, 3.212646484375, 3.41796875, 3.623291015625, 3.82861328125, 4.033935546875, 4.2392578125, 4.444580078125, 4.64990234375, 4.855224609375, 5.060546875, 5.265869140625, 5.47119140625, 5.676513671875, 5.8818359375, 6.087158203125, 6.29248046875, 6.497802734375, 6.703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 14.0, 11.0, 12.0, 19.0, 20.0, 22.0, 18.0, 19.0, 20.0, 34.0, 29.0, 30.0, 37.0, 32.0, 43.0, 45.0, 38.0, 41.0, 44.0, 29.0, 30.0, 42.0, 40.0, 42.0, 31.0, 29.0, 23.0, 30.0, 23.0, 22.0, 23.0, 15.0, 11.0, 14.0, 13.0, 8.0, 10.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.3125, -32.20263671875, -31.0927734375, -29.98291015625, -28.873046875, -27.76318359375, -26.6533203125, -25.54345703125, -24.43359375, -23.32373046875, -22.2138671875, -21.10400390625, -19.994140625, -18.88427734375, -17.7744140625, -16.66455078125, -15.5546875, -14.44482421875, -13.3349609375, -12.22509765625, -11.115234375, -10.00537109375, -8.8955078125, -7.78564453125, -6.67578125, -5.56591796875, -4.4560546875, -3.34619140625, -2.236328125, -1.12646484375, -0.0166015625, 1.09326171875, 2.203125, 3.31298828125, 4.4228515625, 5.53271484375, 6.642578125, 7.75244140625, 8.8623046875, 9.97216796875, 11.08203125, 12.19189453125, 13.3017578125, 14.41162109375, 15.521484375, 16.63134765625, 17.7412109375, 18.85107421875, 19.9609375, 21.07080078125, 22.1806640625, 23.29052734375, 24.400390625, 25.51025390625, 26.6201171875, 27.72998046875, 28.83984375, 29.94970703125, 31.0595703125, 32.16943359375, 33.279296875, 34.38916015625, 35.4990234375, 36.60888671875, 37.71875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 13.0, 13.0, 15.0, 24.0, 50.0, 53.0, 103.0, 143.0, 228.0, 332.0, 587.0, 918.0, 1590.0, 2830.0, 5628.0, 12110.0, 32749.0, 123129.0, 495671.0, 274523.0, 61029.0, 19367.0, 8161.0, 3925.0, 2166.0, 1215.0, 703.0, 461.0, 290.0, 165.0, 99.0, 72.0, 50.0, 34.0, 19.0, 25.0, 17.0, 10.0, 11.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.42059326171875, -2.3392333984375, -2.25787353515625, -2.176513671875, -2.09515380859375, -2.0137939453125, -1.93243408203125, -1.85107421875, -1.76971435546875, -1.6883544921875, -1.60699462890625, -1.525634765625, -1.44427490234375, -1.3629150390625, -1.28155517578125, -1.2001953125, -1.11883544921875, -1.0374755859375, -0.95611572265625, -0.874755859375, -0.79339599609375, -0.7120361328125, -0.63067626953125, -0.54931640625, -0.46795654296875, -0.3865966796875, -0.30523681640625, -0.223876953125, -0.14251708984375, -0.0611572265625, 0.02020263671875, 0.1015625, 0.18292236328125, 0.2642822265625, 0.34564208984375, 0.427001953125, 0.50836181640625, 0.5897216796875, 0.67108154296875, 0.75244140625, 0.83380126953125, 0.9151611328125, 0.99652099609375, 1.077880859375, 1.15924072265625, 1.2406005859375, 1.32196044921875, 1.4033203125, 1.48468017578125, 1.5660400390625, 1.64739990234375, 1.728759765625, 1.81011962890625, 1.8914794921875, 1.97283935546875, 2.05419921875, 2.13555908203125, 2.2169189453125, 2.29827880859375, 2.379638671875, 2.46099853515625, 2.5423583984375, 2.62371826171875, 2.705078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 10.0, 19.0, 13.0, 6.0, 19.0, 29.0, 35.0, 35.0, 50.0, 39.0, 41.0, 48.0, 42.0, 45.0, 49.0, 67.0, 58.0, 42.0, 25.0, 46.0, 39.0, 34.0, 22.0, 36.0, 23.0, 20.0, 17.0, 13.0, 18.0, 6.0, 9.0, 4.0, 10.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00010859966278076172, -0.00010541081428527832, -0.00010222196578979492, -9.903311729431152e-05, -9.584426879882812e-05, -9.265542030334473e-05, -8.946657180786133e-05, -8.627772331237793e-05, -8.308887481689453e-05, -7.990002632141113e-05, -7.671117782592773e-05, -7.352232933044434e-05, -7.033348083496094e-05, -6.714463233947754e-05, -6.395578384399414e-05, -6.076693534851074e-05, -5.7578086853027344e-05, -5.4389238357543945e-05, -5.120038986206055e-05, -4.801154136657715e-05, -4.482269287109375e-05, -4.163384437561035e-05, -3.844499588012695e-05, -3.5256147384643555e-05, -3.2067298889160156e-05, -2.8878450393676758e-05, -2.568960189819336e-05, -2.250075340270996e-05, -1.9311904907226562e-05, -1.6123056411743164e-05, -1.2934207916259766e-05, -9.745359420776367e-06, -6.556510925292969e-06, -3.3676624298095703e-06, -1.7881393432617188e-07, 3.0100345611572266e-06, 6.198883056640625e-06, 9.387731552124023e-06, 1.2576580047607422e-05, 1.576542854309082e-05, 1.895427703857422e-05, 2.2143125534057617e-05, 2.5331974029541016e-05, 2.8520822525024414e-05, 3.170967102050781e-05, 3.489851951599121e-05, 3.808736801147461e-05, 4.127621650695801e-05, 4.4465065002441406e-05, 4.7653913497924805e-05, 5.08427619934082e-05, 5.40316104888916e-05, 5.7220458984375e-05, 6.04093074798584e-05, 6.35981559753418e-05, 6.67870044708252e-05, 6.99758529663086e-05, 7.316470146179199e-05, 7.635354995727539e-05, 7.954239845275879e-05, 8.273124694824219e-05, 8.592009544372559e-05, 8.910894393920898e-05, 9.229779243469238e-05, 9.548664093017578e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 14.0, 18.0, 25.0, 34.0, 31.0, 44.0, 57.0, 83.0, 109.0, 195.0, 283.0, 408.0, 698.0, 976.0, 1718.0, 2666.0, 4406.0, 7531.0, 13015.0, 23387.0, 42930.0, 81458.0, 152455.0, 239386.0, 212080.0, 121363.0, 63559.0, 34102.0, 18742.0, 10648.0, 6091.0, 3650.0, 2282.0, 1423.0, 904.0, 580.0, 393.0, 243.0, 160.0, 118.0, 83.0, 53.0, 53.0, 32.0, 22.0, 16.0, 7.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.307373046875, -2.22998046875, -2.152587890625, -2.0751953125, -1.997802734375, -1.92041015625, -1.843017578125, -1.765625, -1.688232421875, -1.61083984375, -1.533447265625, -1.4560546875, -1.378662109375, -1.30126953125, -1.223876953125, -1.146484375, -1.069091796875, -0.99169921875, -0.914306640625, -0.8369140625, -0.759521484375, -0.68212890625, -0.604736328125, -0.52734375, -0.449951171875, -0.37255859375, -0.295166015625, -0.2177734375, -0.140380859375, -0.06298828125, 0.014404296875, 0.091796875, 0.169189453125, 0.24658203125, 0.323974609375, 0.4013671875, 0.478759765625, 0.55615234375, 0.633544921875, 0.7109375, 0.788330078125, 0.86572265625, 0.943115234375, 1.0205078125, 1.097900390625, 1.17529296875, 1.252685546875, 1.330078125, 1.407470703125, 1.48486328125, 1.562255859375, 1.6396484375, 1.717041015625, 1.79443359375, 1.871826171875, 1.94921875, 2.026611328125, 2.10400390625, 2.181396484375, 2.2587890625, 2.336181640625, 2.41357421875, 2.490966796875, 2.568359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 12.0, 7.0, 13.0, 17.0, 15.0, 22.0, 35.0, 38.0, 30.0, 60.0, 60.0, 60.0, 89.0, 90.0, 71.0, 58.0, 46.0, 54.0, 35.0, 31.0, 16.0, 31.0, 16.0, 15.0, 12.0, 7.0, 6.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0263671875, -0.9969100952148438, -0.9674530029296875, -0.9379959106445312, -0.908538818359375, -0.8790817260742188, -0.8496246337890625, -0.8201675415039062, -0.79071044921875, -0.7612533569335938, -0.7317962646484375, -0.7023391723632812, -0.672882080078125, -0.6434249877929688, -0.6139678955078125, -0.5845108032226562, -0.5550537109375, -0.5255966186523438, -0.4961395263671875, -0.46668243408203125, -0.437225341796875, -0.40776824951171875, -0.3783111572265625, -0.34885406494140625, -0.31939697265625, -0.28993988037109375, -0.2604827880859375, -0.23102569580078125, -0.201568603515625, -0.17211151123046875, -0.1426544189453125, -0.11319732666015625, -0.083740234375, -0.05428314208984375, -0.0248260498046875, 0.00463104248046875, 0.034088134765625, 0.06354522705078125, 0.0930023193359375, 0.12245941162109375, 0.15191650390625, 0.18137359619140625, 0.2108306884765625, 0.24028778076171875, 0.269744873046875, 0.29920196533203125, 0.3286590576171875, 0.35811614990234375, 0.3875732421875, 0.41703033447265625, 0.4464874267578125, 0.47594451904296875, 0.505401611328125, 0.5348587036132812, 0.5643157958984375, 0.5937728881835938, 0.62322998046875, 0.6526870727539062, 0.6821441650390625, 0.7116012573242188, 0.741058349609375, 0.7705154418945312, 0.7999725341796875, 0.8294296264648438, 0.85888671875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 12.0, 11.0, 16.0, 18.0, 13.0, 23.0, 22.0, 21.0, 22.0, 22.0, 30.0, 43.0, 35.0, 41.0, 37.0, 42.0, 41.0, 50.0, 44.0, 42.0, 36.0, 40.0, 37.0, 35.0, 26.0, 29.0, 30.0, 28.0, 24.0, 20.0, 17.0, 16.0, 9.0, 8.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.01634216308594, -43.61651611328125, -42.2166862487793, -40.81686019897461, -39.41703414916992, -38.01720428466797, -36.61737823486328, -35.217552185058594, -33.817726135253906, -32.41790008544922, -31.0180721282959, -29.618244171142578, -28.21841812133789, -26.81859016418457, -25.41876220703125, -24.018936157226562, -22.61910629272461, -21.21927833557129, -19.8194522857666, -18.41962432861328, -17.019798278808594, -15.619970321655273, -14.220142364501953, -12.82031536102295, -11.420488357543945, -10.020661354064941, -8.620834350585938, -7.221006393432617, -5.821179389953613, -4.421352386474609, -3.021524429321289, -1.6216974258422852, -0.22187423706054688, 1.1779530048370361, 2.577780246734619, 3.9776077270507812, 5.377434730529785, 6.777261734008789, 8.17708969116211, 9.576916694641113, 10.976743698120117, 12.376570701599121, 13.776397705078125, 15.176225662231445, 16.576053619384766, 17.975879669189453, 19.375707626342773, 20.775535583496094, 22.17536163330078, 23.5751895904541, 24.97501564025879, 26.37484359741211, 27.774669647216797, 29.174497604370117, 30.574325561523438, 31.974151611328125, 33.37397766113281, 34.7738037109375, 36.17363357543945, 37.57345962524414, 38.97328567504883, 40.37311553955078, 41.77294158935547, 43.172767639160156, 44.57259750366211]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 4.0, 5.0, 4.0, 8.0, 6.0, 6.0, 19.0, 12.0, 11.0, 18.0, 15.0, 18.0, 28.0, 22.0, 28.0, 31.0, 28.0, 32.0, 42.0, 38.0, 41.0, 31.0, 40.0, 33.0, 47.0, 47.0, 33.0, 35.0, 36.0, 32.0, 28.0, 30.0, 25.0, 15.0, 22.0, 24.0, 17.0, 16.0, 12.0, 12.0, 9.0, 11.0, 5.0, 3.0, 11.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.528865814208984, -47.878231048583984, -46.227596282958984, -44.576961517333984, -42.92633056640625, -41.27569580078125, -39.62506103515625, -37.97442626953125, -36.32379150390625, -34.67315673828125, -33.02252197265625, -31.371889114379883, -29.721254348754883, -28.070619583129883, -26.419986724853516, -24.769351959228516, -23.118717193603516, -21.468082427978516, -19.817447662353516, -18.16681480407715, -16.51618003845215, -14.865545272827148, -13.214911460876465, -11.564277648925781, -9.913642883300781, -8.263008117675781, -6.612374305725098, -4.961740016937256, -3.311105728149414, -1.660470962524414, -0.009837150573730469, 1.6407966613769531, 3.291431427001953, 4.942065715789795, 6.592700004577637, 8.24333381652832, 9.89396858215332, 11.54460334777832, 13.195237159729004, 14.845870971679688, 16.496505737304688, 18.147140502929688, 19.797775268554688, 21.448408126831055, 23.099042892456055, 24.749677658081055, 26.400310516357422, 28.050945281982422, 29.701580047607422, 31.352214813232422, 33.00284957885742, 34.65348434448242, 36.304115295410156, 37.954750061035156, 39.605384826660156, 41.256019592285156, 42.906654357910156, 44.557289123535156, 46.207923889160156, 47.858558654785156, 49.509193420410156, 51.159828186035156, 52.81045913696289, 54.46109390258789, 56.11172866821289]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 10.0, 8.0, 22.0, 42.0, 52.0, 72.0, 126.0, 232.0, 403.0, 621.0, 945.0, 1547.0, 2567.0, 3889.0, 6067.0, 9222.0, 13839.0, 19896.0, 28091.0, 38887.0, 51081.0, 63924.0, 77225.0, 88153.0, 94525.0, 95765.0, 91133.0, 82967.0, 70808.0, 57282.0, 44069.0, 33245.0, 23486.0, 16718.0, 11187.0, 7403.0, 4804.0, 3003.0, 1949.0, 1248.0, 811.0, 458.0, 305.0, 169.0, 103.0, 89.0, 43.0, 26.0, 18.0, 11.0, 7.0, 3.0, 1.0, 2.0], "bins": [-26.015625, -25.27734375, -24.5390625, -23.80078125, -23.0625, -22.32421875, -21.5859375, -20.84765625, -20.109375, -19.37109375, -18.6328125, -17.89453125, -17.15625, -16.41796875, -15.6796875, -14.94140625, -14.203125, -13.46484375, -12.7265625, -11.98828125, -11.25, -10.51171875, -9.7734375, -9.03515625, -8.296875, -7.55859375, -6.8203125, -6.08203125, -5.34375, -4.60546875, -3.8671875, -3.12890625, -2.390625, -1.65234375, -0.9140625, -0.17578125, 0.5625, 1.30078125, 2.0390625, 2.77734375, 3.515625, 4.25390625, 4.9921875, 5.73046875, 6.46875, 7.20703125, 7.9453125, 8.68359375, 9.421875, 10.16015625, 10.8984375, 11.63671875, 12.375, 13.11328125, 13.8515625, 14.58984375, 15.328125, 16.06640625, 16.8046875, 17.54296875, 18.28125, 19.01953125, 19.7578125, 20.49609375, 21.234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 9.0, 3.0, 5.0, 3.0, 10.0, 5.0, 7.0, 19.0, 12.0, 10.0, 18.0, 14.0, 17.0, 26.0, 26.0, 25.0, 31.0, 29.0, 29.0, 43.0, 42.0, 39.0, 30.0, 39.0, 39.0, 38.0, 48.0, 35.0, 38.0, 31.0, 36.0, 27.0, 29.0, 24.0, 19.0, 18.0, 28.0, 15.0, 19.0, 11.0, 12.0, 12.0, 10.0, 3.0, 3.0, 10.0, 9.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.84375, -47.22216796875, -45.6005859375, -43.97900390625, -42.357421875, -40.73583984375, -39.1142578125, -37.49267578125, -35.87109375, -34.24951171875, -32.6279296875, -31.00634765625, -29.384765625, -27.76318359375, -26.1416015625, -24.52001953125, -22.8984375, -21.27685546875, -19.6552734375, -18.03369140625, -16.412109375, -14.79052734375, -13.1689453125, -11.54736328125, -9.92578125, -8.30419921875, -6.6826171875, -5.06103515625, -3.439453125, -1.81787109375, -0.1962890625, 1.42529296875, 3.046875, 4.66845703125, 6.2900390625, 7.91162109375, 9.533203125, 11.15478515625, 12.7763671875, 14.39794921875, 16.01953125, 17.64111328125, 19.2626953125, 20.88427734375, 22.505859375, 24.12744140625, 25.7490234375, 27.37060546875, 28.9921875, 30.61376953125, 32.2353515625, 33.85693359375, 35.478515625, 37.10009765625, 38.7216796875, 40.34326171875, 41.96484375, 43.58642578125, 45.2080078125, 46.82958984375, 48.451171875, 50.07275390625, 51.6943359375, 53.31591796875, 54.9375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 4.0, 11.0, 19.0, 38.0, 42.0, 78.0, 128.0, 195.0, 303.0, 399.0, 640.0, 945.0, 1430.0, 2036.0, 2976.0, 4347.0, 6405.0, 9110.0, 12948.0, 17647.0, 23769.0, 31592.0, 40298.0, 50019.0, 60613.0, 69429.0, 77429.0, 82154.0, 83129.0, 80653.0, 75235.0, 66941.0, 57398.0, 47196.0, 37618.0, 29300.0, 22025.0, 16080.0, 11434.0, 8496.0, 5723.0, 4035.0, 2707.0, 1852.0, 1306.0, 829.0, 535.0, 370.0, 245.0, 185.0, 96.0, 65.0, 32.0, 32.0, 20.0, 5.0, 10.0, 7.0, 0.0, 2.0], "bins": [-21.3125, -20.65380859375, -19.9951171875, -19.33642578125, -18.677734375, -18.01904296875, -17.3603515625, -16.70166015625, -16.04296875, -15.38427734375, -14.7255859375, -14.06689453125, -13.408203125, -12.74951171875, -12.0908203125, -11.43212890625, -10.7734375, -10.11474609375, -9.4560546875, -8.79736328125, -8.138671875, -7.47998046875, -6.8212890625, -6.16259765625, -5.50390625, -4.84521484375, -4.1865234375, -3.52783203125, -2.869140625, -2.21044921875, -1.5517578125, -0.89306640625, -0.234375, 0.42431640625, 1.0830078125, 1.74169921875, 2.400390625, 3.05908203125, 3.7177734375, 4.37646484375, 5.03515625, 5.69384765625, 6.3525390625, 7.01123046875, 7.669921875, 8.32861328125, 8.9873046875, 9.64599609375, 10.3046875, 10.96337890625, 11.6220703125, 12.28076171875, 12.939453125, 13.59814453125, 14.2568359375, 14.91552734375, 15.57421875, 16.23291015625, 16.8916015625, 17.55029296875, 18.208984375, 18.86767578125, 19.5263671875, 20.18505859375, 20.84375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 4.0, 4.0, 9.0, 15.0, 16.0, 20.0, 22.0, 14.0, 23.0, 30.0, 26.0, 28.0, 31.0, 32.0, 36.0, 42.0, 63.0, 39.0, 35.0, 39.0, 37.0, 43.0, 40.0, 47.0, 30.0, 36.0, 38.0, 27.0, 27.0, 19.0, 19.0, 12.0, 11.0, 19.0, 15.0, 16.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.21875, -37.0712890625, -35.923828125, -34.7763671875, -33.62890625, -32.4814453125, -31.333984375, -30.1865234375, -29.0390625, -27.8916015625, -26.744140625, -25.5966796875, -24.44921875, -23.3017578125, -22.154296875, -21.0068359375, -19.859375, -18.7119140625, -17.564453125, -16.4169921875, -15.26953125, -14.1220703125, -12.974609375, -11.8271484375, -10.6796875, -9.5322265625, -8.384765625, -7.2373046875, -6.08984375, -4.9423828125, -3.794921875, -2.6474609375, -1.5, -0.3525390625, 0.794921875, 1.9423828125, 3.08984375, 4.2373046875, 5.384765625, 6.5322265625, 7.6796875, 8.8271484375, 9.974609375, 11.1220703125, 12.26953125, 13.4169921875, 14.564453125, 15.7119140625, 16.859375, 18.0068359375, 19.154296875, 20.3017578125, 21.44921875, 22.5966796875, 23.744140625, 24.8916015625, 26.0390625, 27.1865234375, 28.333984375, 29.4814453125, 30.62890625, 31.7763671875, 32.923828125, 34.0712890625, 35.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 9.0, 11.0, 15.0, 24.0, 40.0, 70.0, 93.0, 149.0, 256.0, 407.0, 667.0, 1039.0, 1556.0, 2463.0, 3995.0, 6070.0, 9183.0, 13866.0, 20726.0, 29683.0, 40921.0, 54852.0, 69350.0, 82812.0, 93977.0, 99246.0, 99065.0, 91807.0, 80777.0, 67414.0, 52758.0, 39318.0, 28466.0, 19716.0, 13115.0, 8836.0, 5702.0, 3682.0, 2331.0, 1535.0, 872.0, 578.0, 399.0, 272.0, 155.0, 110.0, 61.0, 40.0, 31.0, 19.0, 6.0, 9.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6171875, -8.3193359375, -8.021484375, -7.7236328125, -7.42578125, -7.1279296875, -6.830078125, -6.5322265625, -6.234375, -5.9365234375, -5.638671875, -5.3408203125, -5.04296875, -4.7451171875, -4.447265625, -4.1494140625, -3.8515625, -3.5537109375, -3.255859375, -2.9580078125, -2.66015625, -2.3623046875, -2.064453125, -1.7666015625, -1.46875, -1.1708984375, -0.873046875, -0.5751953125, -0.27734375, 0.0205078125, 0.318359375, 0.6162109375, 0.9140625, 1.2119140625, 1.509765625, 1.8076171875, 2.10546875, 2.4033203125, 2.701171875, 2.9990234375, 3.296875, 3.5947265625, 3.892578125, 4.1904296875, 4.48828125, 4.7861328125, 5.083984375, 5.3818359375, 5.6796875, 5.9775390625, 6.275390625, 6.5732421875, 6.87109375, 7.1689453125, 7.466796875, 7.7646484375, 8.0625, 8.3603515625, 8.658203125, 8.9560546875, 9.25390625, 9.5517578125, 9.849609375, 10.1474609375, 10.4453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 2.0, 8.0, 4.0, 12.0, 7.0, 5.0, 12.0, 13.0, 16.0, 19.0, 12.0, 23.0, 24.0, 34.0, 31.0, 44.0, 39.0, 44.0, 41.0, 46.0, 51.0, 56.0, 44.0, 43.0, 39.0, 44.0, 43.0, 29.0, 34.0, 35.0, 24.0, 15.0, 24.0, 15.0, 15.0, 7.0, 13.0, 5.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0012493133544921875, -0.0012107938528060913, -0.0011722743511199951, -0.001133754849433899, -0.0010952353477478027, -0.0010567158460617065, -0.0010181963443756104, -0.0009796768426895142, -0.000941157341003418, -0.0009026378393173218, -0.0008641183376312256, -0.0008255988359451294, -0.0007870793342590332, -0.000748559832572937, -0.0007100403308868408, -0.0006715208292007446, -0.0006330013275146484, -0.0005944818258285522, -0.0005559623241424561, -0.0005174428224563599, -0.00047892332077026367, -0.0004404038190841675, -0.0004018843173980713, -0.0003633648157119751, -0.0003248453140258789, -0.0002863258123397827, -0.0002478063106536865, -0.00020928680896759033, -0.00017076730728149414, -0.00013224780559539795, -9.372830390930176e-05, -5.5208802223205566e-05, -1.6689300537109375e-05, 2.1830201148986816e-05, 6.034970283508301e-05, 9.88692045211792e-05, 0.0001373887062072754, 0.00017590820789337158, 0.00021442770957946777, 0.00025294721126556396, 0.00029146671295166016, 0.00032998621463775635, 0.00036850571632385254, 0.00040702521800994873, 0.0004455447196960449, 0.0004840642213821411, 0.0005225837230682373, 0.0005611032247543335, 0.0005996227264404297, 0.0006381422281265259, 0.0006766617298126221, 0.0007151812314987183, 0.0007537007331848145, 0.0007922202348709106, 0.0008307397365570068, 0.000869259238243103, 0.0009077787399291992, 0.0009462982416152954, 0.0009848177433013916, 0.0010233372449874878, 0.001061856746673584, 0.0011003762483596802, 0.0011388957500457764, 0.0011774152517318726, 0.0012159347534179688]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 10.0, 9.0, 26.0, 27.0, 45.0, 61.0, 83.0, 141.0, 234.0, 373.0, 545.0, 931.0, 1591.0, 2683.0, 4690.0, 8087.0, 13689.0, 23138.0, 36872.0, 56699.0, 79688.0, 103151.0, 122247.0, 128521.0, 122438.0, 105309.0, 81645.0, 57797.0, 38744.0, 24245.0, 14637.0, 8488.0, 4725.0, 2760.0, 1587.0, 973.0, 629.0, 388.0, 222.0, 143.0, 82.0, 56.0, 46.0, 27.0, 26.0, 10.0, 8.0, 11.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.078125, -12.64990234375, -12.2216796875, -11.79345703125, -11.365234375, -10.93701171875, -10.5087890625, -10.08056640625, -9.65234375, -9.22412109375, -8.7958984375, -8.36767578125, -7.939453125, -7.51123046875, -7.0830078125, -6.65478515625, -6.2265625, -5.79833984375, -5.3701171875, -4.94189453125, -4.513671875, -4.08544921875, -3.6572265625, -3.22900390625, -2.80078125, -2.37255859375, -1.9443359375, -1.51611328125, -1.087890625, -0.65966796875, -0.2314453125, 0.19677734375, 0.625, 1.05322265625, 1.4814453125, 1.90966796875, 2.337890625, 2.76611328125, 3.1943359375, 3.62255859375, 4.05078125, 4.47900390625, 4.9072265625, 5.33544921875, 5.763671875, 6.19189453125, 6.6201171875, 7.04833984375, 7.4765625, 7.90478515625, 8.3330078125, 8.76123046875, 9.189453125, 9.61767578125, 10.0458984375, 10.47412109375, 10.90234375, 11.33056640625, 11.7587890625, 12.18701171875, 12.615234375, 13.04345703125, 13.4716796875, 13.89990234375, 14.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 6.0, 3.0, 7.0, 10.0, 12.0, 14.0, 19.0, 13.0, 16.0, 22.0, 32.0, 26.0, 32.0, 39.0, 54.0, 37.0, 48.0, 47.0, 43.0, 51.0, 48.0, 46.0, 35.0, 36.0, 39.0, 41.0, 35.0, 23.0, 33.0, 20.0, 19.0, 15.0, 21.0, 12.0, 3.0, 8.0, 7.0, 5.0, 5.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.16015625, -5.975341796875, -5.79052734375, -5.605712890625, -5.4208984375, -5.236083984375, -5.05126953125, -4.866455078125, -4.681640625, -4.496826171875, -4.31201171875, -4.127197265625, -3.9423828125, -3.757568359375, -3.57275390625, -3.387939453125, -3.203125, -3.018310546875, -2.83349609375, -2.648681640625, -2.4638671875, -2.279052734375, -2.09423828125, -1.909423828125, -1.724609375, -1.539794921875, -1.35498046875, -1.170166015625, -0.9853515625, -0.800537109375, -0.61572265625, -0.430908203125, -0.24609375, -0.061279296875, 0.12353515625, 0.308349609375, 0.4931640625, 0.677978515625, 0.86279296875, 1.047607421875, 1.232421875, 1.417236328125, 1.60205078125, 1.786865234375, 1.9716796875, 2.156494140625, 2.34130859375, 2.526123046875, 2.7109375, 2.895751953125, 3.08056640625, 3.265380859375, 3.4501953125, 3.635009765625, 3.81982421875, 4.004638671875, 4.189453125, 4.374267578125, 4.55908203125, 4.743896484375, 4.9287109375, 5.113525390625, 5.29833984375, 5.483154296875, 5.66796875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 7.0, 10.0, 8.0, 9.0, 11.0, 5.0, 17.0, 17.0, 15.0, 14.0, 25.0, 22.0, 26.0, 23.0, 20.0, 35.0, 37.0, 40.0, 35.0, 37.0, 31.0, 48.0, 48.0, 43.0, 45.0, 41.0, 31.0, 36.0, 34.0, 33.0, 25.0, 25.0, 21.0, 19.0, 21.0, 15.0, 20.0, 13.0, 8.0, 3.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.47035598754883, -42.09918975830078, -40.728023529052734, -39.35685729980469, -37.985694885253906, -36.61452865600586, -35.24336242675781, -33.872196197509766, -32.50102996826172, -31.129863739013672, -29.758697509765625, -28.38753318786621, -27.016366958618164, -25.645200729370117, -24.274036407470703, -22.902870178222656, -21.53170394897461, -20.160537719726562, -18.789371490478516, -17.4182071685791, -16.047040939331055, -14.675874710083008, -13.304709434509277, -11.933544158935547, -10.5623779296875, -9.191211700439453, -7.820046424865723, -6.448880672454834, -5.077714920043945, -3.7065491676330566, -2.335383415222168, -0.9642181396484375, 0.40694427490234375, 1.7781100273132324, 3.149275779724121, 4.52044153213501, 5.891607284545898, 7.262773036956787, 8.633938789367676, 10.005104064941406, 11.376270294189453, 12.7474365234375, 14.11860179901123, 15.489767074584961, 16.860933303833008, 18.232099533081055, 19.60326385498047, 20.974430084228516, 22.345596313476562, 23.71676254272461, 25.087928771972656, 26.45909309387207, 27.830259323120117, 29.201425552368164, 30.572589874267578, 31.943756103515625, 33.31492233276367, 34.68608856201172, 36.057254791259766, 37.42842102050781, 38.799583435058594, 40.17074966430664, 41.54191589355469, 42.913082122802734, 44.28424835205078]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 5.0, 8.0, 10.0, 10.0, 11.0, 7.0, 12.0, 25.0, 26.0, 22.0, 24.0, 32.0, 21.0, 32.0, 36.0, 33.0, 32.0, 42.0, 49.0, 43.0, 39.0, 38.0, 35.0, 38.0, 41.0, 40.0, 34.0, 32.0, 27.0, 27.0, 16.0, 28.0, 19.0, 21.0, 22.0, 10.0, 15.0, 6.0, 6.0, 3.0, 6.0, 5.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.04576873779297, -50.14818572998047, -48.25060272216797, -46.35301971435547, -44.45543670654297, -42.55785369873047, -40.66027069091797, -38.762691497802734, -36.865108489990234, -34.967525482177734, -33.069942474365234, -31.172359466552734, -29.274778366088867, -27.377195358276367, -25.479612350463867, -23.58203125, -21.684446334838867, -19.786863327026367, -17.889280319213867, -15.991698265075684, -14.0941162109375, -12.196533203125, -10.2989501953125, -8.401368141174316, -6.503785133361816, -4.606202602386475, -2.7086198329925537, -0.8110370635986328, 1.086545467376709, 2.984127998352051, 4.881711006164551, 6.779293060302734, 8.676876068115234, 10.574459075927734, 12.472041130065918, 14.369624137878418, 16.2672061920166, 18.1647891998291, 20.0623722076416, 21.95995330810547, 23.85753631591797, 25.75511932373047, 27.65270233154297, 29.55028533935547, 31.447866439819336, 33.34545135498047, 35.24303436279297, 37.1406135559082, 39.03820037841797, 40.93578338623047, 42.83336639404297, 44.73094940185547, 46.62853240966797, 48.52611541748047, 50.42369842529297, 52.3212776184082, 54.2188606262207, 56.1164436340332, 58.0140266418457, 59.9116096496582, 61.8091926574707, 63.70677185058594, 65.60435485839844, 67.50193786621094, 69.39952087402344]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [6.0, 6.0, 3.0, 17.0, 36.0, 62.0, 102.0, 181.0, 388.0, 578.0, 978.0, 1763.0, 2953.0, 4642.0, 7629.0, 12214.0, 19456.0, 29679.0, 43768.0, 63786.0, 90185.0, 122514.0, 161381.0, 205810.0, 252152.0, 293506.0, 328889.0, 349266.0, 355243.0, 341888.0, 315823.0, 276764.0, 233772.0, 187811.0, 145518.0, 108232.0, 78905.0, 54359.0, 37205.0, 24638.0, 16112.0, 10190.0, 6385.0, 3870.0, 2327.0, 1381.0, 843.0, 475.0, 284.0, 144.0, 85.0, 44.0, 31.0, 14.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.875, -27.8544921875, -26.833984375, -25.8134765625, -24.79296875, -23.7724609375, -22.751953125, -21.7314453125, -20.7109375, -19.6904296875, -18.669921875, -17.6494140625, -16.62890625, -15.6083984375, -14.587890625, -13.5673828125, -12.546875, -11.5263671875, -10.505859375, -9.4853515625, -8.46484375, -7.4443359375, -6.423828125, -5.4033203125, -4.3828125, -3.3623046875, -2.341796875, -1.3212890625, -0.30078125, 0.7197265625, 1.740234375, 2.7607421875, 3.78125, 4.8017578125, 5.822265625, 6.8427734375, 7.86328125, 8.8837890625, 9.904296875, 10.9248046875, 11.9453125, 12.9658203125, 13.986328125, 15.0068359375, 16.02734375, 17.0478515625, 18.068359375, 19.0888671875, 20.109375, 21.1298828125, 22.150390625, 23.1708984375, 24.19140625, 25.2119140625, 26.232421875, 27.2529296875, 28.2734375, 29.2939453125, 30.314453125, 31.3349609375, 32.35546875, 33.3759765625, 34.396484375, 35.4169921875, 36.4375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 8.0, 8.0, 10.0, 10.0, 11.0, 8.0, 24.0, 26.0, 25.0, 20.0, 27.0, 26.0, 30.0, 35.0, 31.0, 37.0, 41.0, 42.0, 47.0, 45.0, 38.0, 28.0, 47.0, 36.0, 46.0, 31.0, 32.0, 25.0, 29.0, 18.0, 25.0, 20.0, 24.0, 20.0, 13.0, 14.0, 9.0, 4.0, 3.0, 6.0, 5.0, 8.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.4375, -45.7138671875, -43.990234375, -42.2666015625, -40.54296875, -38.8193359375, -37.095703125, -35.3720703125, -33.6484375, -31.9248046875, -30.201171875, -28.4775390625, -26.75390625, -25.0302734375, -23.306640625, -21.5830078125, -19.859375, -18.1357421875, -16.412109375, -14.6884765625, -12.96484375, -11.2412109375, -9.517578125, -7.7939453125, -6.0703125, -4.3466796875, -2.623046875, -0.8994140625, 0.82421875, 2.5478515625, 4.271484375, 5.9951171875, 7.71875, 9.4423828125, 11.166015625, 12.8896484375, 14.61328125, 16.3369140625, 18.060546875, 19.7841796875, 21.5078125, 23.2314453125, 24.955078125, 26.6787109375, 28.40234375, 30.1259765625, 31.849609375, 33.5732421875, 35.296875, 37.0205078125, 38.744140625, 40.4677734375, 42.19140625, 43.9150390625, 45.638671875, 47.3623046875, 49.0859375, 50.8095703125, 52.533203125, 54.2568359375, 55.98046875, 57.7041015625, 59.427734375, 61.1513671875, 62.875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 7.0, 15.0, 30.0, 50.0, 90.0, 173.0, 270.0, 500.0, 835.0, 1367.0, 2248.0, 3804.0, 6023.0, 9470.0, 14992.0, 22448.0, 33319.0, 48237.0, 67797.0, 92166.0, 121360.0, 156483.0, 193474.0, 231841.0, 267630.0, 296775.0, 317028.0, 324172.0, 319505.0, 303895.0, 276147.0, 242584.0, 204449.0, 167397.0, 132152.0, 100677.0, 73761.0, 53378.0, 36923.0, 25243.0, 16886.0, 10912.0, 6960.0, 4315.0, 2595.0, 1657.0, 922.0, 579.0, 324.0, 189.0, 114.0, 47.0, 29.0, 22.0, 10.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-31.390625, -30.398681640625, -29.40673828125, -28.414794921875, -27.4228515625, -26.430908203125, -25.43896484375, -24.447021484375, -23.455078125, -22.463134765625, -21.47119140625, -20.479248046875, -19.4873046875, -18.495361328125, -17.50341796875, -16.511474609375, -15.51953125, -14.527587890625, -13.53564453125, -12.543701171875, -11.5517578125, -10.559814453125, -9.56787109375, -8.575927734375, -7.583984375, -6.592041015625, -5.60009765625, -4.608154296875, -3.6162109375, -2.624267578125, -1.63232421875, -0.640380859375, 0.3515625, 1.343505859375, 2.33544921875, 3.327392578125, 4.3193359375, 5.311279296875, 6.30322265625, 7.295166015625, 8.287109375, 9.279052734375, 10.27099609375, 11.262939453125, 12.2548828125, 13.246826171875, 14.23876953125, 15.230712890625, 16.22265625, 17.214599609375, 18.20654296875, 19.198486328125, 20.1904296875, 21.182373046875, 22.17431640625, 23.166259765625, 24.158203125, 25.150146484375, 26.14208984375, 27.134033203125, 28.1259765625, 29.117919921875, 30.10986328125, 31.101806640625, 32.09375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 19.0, 24.0, 35.0, 43.0, 46.0, 53.0, 71.0, 98.0, 102.0, 115.0, 125.0, 146.0, 163.0, 182.0, 200.0, 229.0, 196.0, 194.0, 193.0, 195.0, 205.0, 188.0, 180.0, 142.0, 160.0, 140.0, 118.0, 117.0, 85.0, 79.0, 39.0, 32.0, 38.0, 32.0, 20.0, 13.0, 11.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.984375, -24.1728515625, -23.361328125, -22.5498046875, -21.73828125, -20.9267578125, -20.115234375, -19.3037109375, -18.4921875, -17.6806640625, -16.869140625, -16.0576171875, -15.24609375, -14.4345703125, -13.623046875, -12.8115234375, -12.0, -11.1884765625, -10.376953125, -9.5654296875, -8.75390625, -7.9423828125, -7.130859375, -6.3193359375, -5.5078125, -4.6962890625, -3.884765625, -3.0732421875, -2.26171875, -1.4501953125, -0.638671875, 0.1728515625, 0.984375, 1.7958984375, 2.607421875, 3.4189453125, 4.23046875, 5.0419921875, 5.853515625, 6.6650390625, 7.4765625, 8.2880859375, 9.099609375, 9.9111328125, 10.72265625, 11.5341796875, 12.345703125, 13.1572265625, 13.96875, 14.7802734375, 15.591796875, 16.4033203125, 17.21484375, 18.0263671875, 18.837890625, 19.6494140625, 20.4609375, 21.2724609375, 22.083984375, 22.8955078125, 23.70703125, 24.5185546875, 25.330078125, 26.1416015625, 26.953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 11.0, 21.0, 9.0, 18.0, 15.0, 28.0, 29.0, 33.0, 32.0, 27.0, 18.0, 44.0, 43.0, 47.0, 40.0, 40.0, 33.0, 39.0, 46.0, 28.0, 48.0, 31.0, 47.0, 29.0, 32.0, 31.0, 25.0, 23.0, 22.0, 11.0, 12.0, 15.0, 5.0, 10.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.22359085083008, -51.573123931884766, -49.92266082763672, -48.272193908691406, -46.62173080444336, -44.97126388549805, -43.32080078125, -41.67033386230469, -40.019866943359375, -38.36940002441406, -36.718936920166016, -35.0684700012207, -33.418006896972656, -31.767539978027344, -30.117074966430664, -28.466609954833984, -26.816146850585938, -25.165681838989258, -23.515216827392578, -21.864749908447266, -20.21428680419922, -18.563819885253906, -16.913354873657227, -15.262889862060547, -13.612424850463867, -11.961959838867188, -10.311494827270508, -8.661028861999512, -7.010563850402832, -5.360098838806152, -3.7096328735351562, -2.0591678619384766, -0.40869903564453125, 1.2417662143707275, 2.8922314643859863, 4.542696952819824, 6.193161964416504, 7.843626976013184, 9.49409294128418, 11.14455795288086, 12.795022964477539, 14.445487976074219, 16.0959529876709, 17.746417999267578, 19.39688491821289, 21.047348022460938, 22.69781494140625, 24.34827995300293, 25.99874496459961, 27.64920997619629, 29.29967498779297, 30.95014190673828, 32.60060501098633, 34.25107192993164, 35.90153503417969, 37.552001953125, 39.20246887207031, 40.852935791015625, 42.50339889526367, 44.153865814208984, 45.80432891845703, 47.454795837402344, 49.105262756347656, 50.7557258605957, 52.40618896484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 8.0, 8.0, 13.0, 12.0, 16.0, 15.0, 14.0, 18.0, 25.0, 43.0, 42.0, 30.0, 36.0, 32.0, 38.0, 43.0, 38.0, 45.0, 32.0, 43.0, 52.0, 45.0, 53.0, 36.0, 42.0, 30.0, 23.0, 24.0, 16.0, 18.0, 25.0, 15.0, 13.0, 13.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.381290435791016, -55.19485855102539, -53.00843048095703, -50.821998596191406, -48.63557052612305, -46.44913864135742, -44.26271057128906, -42.07627868652344, -39.88984680175781, -37.70341491699219, -35.51698684692383, -33.3305549621582, -31.144126892089844, -28.95769500732422, -26.771265029907227, -24.584835052490234, -22.398406982421875, -20.211977005004883, -18.02554702758789, -15.839116096496582, -13.65268611907959, -11.466256141662598, -9.279825210571289, -7.093395233154297, -4.906965255737305, -2.7205350399017334, -0.5341048240661621, 1.6523256301879883, 3.8387556076049805, 6.025185585021973, 8.211616516113281, 10.398046493530273, 12.58447265625, 14.770902633666992, 16.957332611083984, 19.14376449584961, 21.33019256591797, 23.516624450683594, 25.703054428100586, 27.889484405517578, 30.07591438293457, 32.26234436035156, 34.44877624511719, 36.63520431518555, 38.82163619995117, 41.00806427001953, 43.194496154785156, 45.38092803955078, 47.56735610961914, 49.753787994384766, 51.940216064453125, 54.12664794921875, 56.31307601928711, 58.499507904052734, 60.685935974121094, 62.87236785888672, 65.05879974365234, 67.24523162841797, 69.4316635131836, 71.61808776855469, 73.80451965332031, 75.99095153808594, 78.17738342285156, 80.36381530761719, 82.55023956298828]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 12.0, 25.0, 29.0, 43.0, 76.0, 85.0, 130.0, 239.0, 362.0, 515.0, 811.0, 1285.0, 2101.0, 3359.0, 5382.0, 8807.0, 14376.0, 24194.0, 39479.0, 64423.0, 104589.0, 158100.0, 193130.0, 158069.0, 103814.0, 64255.0, 39401.0, 23922.0, 14604.0, 8495.0, 5362.0, 3353.0, 2013.0, 1350.0, 821.0, 569.0, 300.0, 217.0, 140.0, 93.0, 74.0, 48.0, 37.0, 24.0, 15.0, 8.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-6.27734375, -6.08416748046875, -5.8909912109375, -5.69781494140625, -5.504638671875, -5.31146240234375, -5.1182861328125, -4.92510986328125, -4.73193359375, -4.53875732421875, -4.3455810546875, -4.15240478515625, -3.959228515625, -3.76605224609375, -3.5728759765625, -3.37969970703125, -3.1865234375, -2.99334716796875, -2.8001708984375, -2.60699462890625, -2.413818359375, -2.22064208984375, -2.0274658203125, -1.83428955078125, -1.64111328125, -1.44793701171875, -1.2547607421875, -1.06158447265625, -0.868408203125, -0.67523193359375, -0.4820556640625, -0.28887939453125, -0.095703125, 0.09747314453125, 0.2906494140625, 0.48382568359375, 0.677001953125, 0.87017822265625, 1.0633544921875, 1.25653076171875, 1.44970703125, 1.64288330078125, 1.8360595703125, 2.02923583984375, 2.222412109375, 2.41558837890625, 2.6087646484375, 2.80194091796875, 2.9951171875, 3.18829345703125, 3.3814697265625, 3.57464599609375, 3.767822265625, 3.96099853515625, 4.1541748046875, 4.34735107421875, 4.54052734375, 4.73370361328125, 4.9268798828125, 5.12005615234375, 5.313232421875, 5.50640869140625, 5.6995849609375, 5.89276123046875, 6.0859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 7.0, 7.0, 8.0, 13.0, 12.0, 15.0, 15.0, 15.0, 18.0, 25.0, 41.0, 44.0, 31.0, 34.0, 33.0, 39.0, 43.0, 37.0, 45.0, 33.0, 42.0, 53.0, 44.0, 52.0, 37.0, 41.0, 31.0, 23.0, 23.0, 17.0, 18.0, 25.0, 15.0, 12.0, 14.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.28125, -55.09521484375, -52.9091796875, -50.72314453125, -48.537109375, -46.35107421875, -44.1650390625, -41.97900390625, -39.79296875, -37.60693359375, -35.4208984375, -33.23486328125, -31.048828125, -28.86279296875, -26.6767578125, -24.49072265625, -22.3046875, -20.11865234375, -17.9326171875, -15.74658203125, -13.560546875, -11.37451171875, -9.1884765625, -7.00244140625, -4.81640625, -2.63037109375, -0.4443359375, 1.74169921875, 3.927734375, 6.11376953125, 8.2998046875, 10.48583984375, 12.671875, 14.85791015625, 17.0439453125, 19.22998046875, 21.416015625, 23.60205078125, 25.7880859375, 27.97412109375, 30.16015625, 32.34619140625, 34.5322265625, 36.71826171875, 38.904296875, 41.09033203125, 43.2763671875, 45.46240234375, 47.6484375, 49.83447265625, 52.0205078125, 54.20654296875, 56.392578125, 58.57861328125, 60.7646484375, 62.95068359375, 65.13671875, 67.32275390625, 69.5087890625, 71.69482421875, 73.880859375, 76.06689453125, 78.2529296875, 80.43896484375, 82.625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 11.0, 20.0, 24.0, 29.0, 38.0, 65.0, 92.0, 122.0, 153.0, 254.0, 342.0, 479.0, 670.0, 1026.0, 1682.0, 2692.0, 4563.0, 7774.0, 14641.0, 28105.0, 57246.0, 123798.0, 266997.0, 279075.0, 131732.0, 60922.0, 29743.0, 15293.0, 8331.0, 4813.0, 2737.0, 1740.0, 1108.0, 675.0, 463.0, 323.0, 214.0, 157.0, 100.0, 78.0, 51.0, 49.0, 31.0, 18.0, 15.0, 13.0, 9.0, 11.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-9.0625, -8.7796630859375, -8.496826171875, -8.2139892578125, -7.93115234375, -7.6483154296875, -7.365478515625, -7.0826416015625, -6.7998046875, -6.5169677734375, -6.234130859375, -5.9512939453125, -5.66845703125, -5.3856201171875, -5.102783203125, -4.8199462890625, -4.537109375, -4.2542724609375, -3.971435546875, -3.6885986328125, -3.40576171875, -3.1229248046875, -2.840087890625, -2.5572509765625, -2.2744140625, -1.9915771484375, -1.708740234375, -1.4259033203125, -1.14306640625, -0.8602294921875, -0.577392578125, -0.2945556640625, -0.01171875, 0.2711181640625, 0.553955078125, 0.8367919921875, 1.11962890625, 1.4024658203125, 1.685302734375, 1.9681396484375, 2.2509765625, 2.5338134765625, 2.816650390625, 3.0994873046875, 3.38232421875, 3.6651611328125, 3.947998046875, 4.2308349609375, 4.513671875, 4.7965087890625, 5.079345703125, 5.3621826171875, 5.64501953125, 5.9278564453125, 6.210693359375, 6.4935302734375, 6.7763671875, 7.0592041015625, 7.342041015625, 7.6248779296875, 7.90771484375, 8.1905517578125, 8.473388671875, 8.7562255859375, 9.0390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 8.0, 10.0, 5.0, 16.0, 7.0, 14.0, 15.0, 26.0, 18.0, 16.0, 15.0, 30.0, 29.0, 32.0, 33.0, 44.0, 38.0, 32.0, 42.0, 36.0, 41.0, 42.0, 42.0, 41.0, 33.0, 29.0, 37.0, 29.0, 25.0, 22.0, 24.0, 28.0, 18.0, 16.0, 11.0, 13.0, 14.0, 11.0, 9.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-39.78125, -38.587890625, -37.39453125, -36.201171875, -35.0078125, -33.814453125, -32.62109375, -31.427734375, -30.234375, -29.041015625, -27.84765625, -26.654296875, -25.4609375, -24.267578125, -23.07421875, -21.880859375, -20.6875, -19.494140625, -18.30078125, -17.107421875, -15.9140625, -14.720703125, -13.52734375, -12.333984375, -11.140625, -9.947265625, -8.75390625, -7.560546875, -6.3671875, -5.173828125, -3.98046875, -2.787109375, -1.59375, -0.400390625, 0.79296875, 1.986328125, 3.1796875, 4.373046875, 5.56640625, 6.759765625, 7.953125, 9.146484375, 10.33984375, 11.533203125, 12.7265625, 13.919921875, 15.11328125, 16.306640625, 17.5, 18.693359375, 19.88671875, 21.080078125, 22.2734375, 23.466796875, 24.66015625, 25.853515625, 27.046875, 28.240234375, 29.43359375, 30.626953125, 31.8203125, 33.013671875, 34.20703125, 35.400390625, 36.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 0.0, 3.0, 4.0, 10.0, 9.0, 13.0, 23.0, 32.0, 34.0, 51.0, 58.0, 87.0, 139.0, 156.0, 257.0, 362.0, 521.0, 781.0, 1176.0, 1887.0, 2944.0, 4897.0, 8731.0, 16587.0, 37036.0, 93162.0, 257914.0, 362526.0, 150277.0, 55839.0, 24071.0, 11901.0, 6454.0, 3696.0, 2390.0, 1527.0, 926.0, 577.0, 470.0, 314.0, 210.0, 154.0, 101.0, 71.0, 58.0, 30.0, 31.0, 13.0, 24.0, 11.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.79388427734375, -1.7303466796875, -1.66680908203125, -1.603271484375, -1.53973388671875, -1.4761962890625, -1.41265869140625, -1.34912109375, -1.28558349609375, -1.2220458984375, -1.15850830078125, -1.094970703125, -1.03143310546875, -0.9678955078125, -0.90435791015625, -0.8408203125, -0.77728271484375, -0.7137451171875, -0.65020751953125, -0.586669921875, -0.52313232421875, -0.4595947265625, -0.39605712890625, -0.33251953125, -0.26898193359375, -0.2054443359375, -0.14190673828125, -0.078369140625, -0.01483154296875, 0.0487060546875, 0.11224365234375, 0.17578125, 0.23931884765625, 0.3028564453125, 0.36639404296875, 0.429931640625, 0.49346923828125, 0.5570068359375, 0.62054443359375, 0.68408203125, 0.74761962890625, 0.8111572265625, 0.87469482421875, 0.938232421875, 1.00177001953125, 1.0653076171875, 1.12884521484375, 1.1923828125, 1.25592041015625, 1.3194580078125, 1.38299560546875, 1.446533203125, 1.51007080078125, 1.5736083984375, 1.63714599609375, 1.70068359375, 1.76422119140625, 1.8277587890625, 1.89129638671875, 1.954833984375, 2.01837158203125, 2.0819091796875, 2.14544677734375, 2.208984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 6.0, 13.0, 8.0, 5.0, 22.0, 29.0, 24.0, 39.0, 29.0, 33.0, 38.0, 40.0, 49.0, 49.0, 46.0, 66.0, 51.0, 56.0, 42.0, 41.0, 40.0, 35.0, 20.0, 36.0, 31.0, 29.0, 22.0, 17.0, 16.0, 12.0, 9.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.00011962652206420898, -0.00011610239744186401, -0.00011257827281951904, -0.00010905414819717407, -0.0001055300235748291, -0.00010200589895248413, -9.848177433013916e-05, -9.495764970779419e-05, -9.143352508544922e-05, -8.790940046310425e-05, -8.438527584075928e-05, -8.08611512184143e-05, -7.733702659606934e-05, -7.381290197372437e-05, -7.02887773513794e-05, -6.676465272903442e-05, -6.324052810668945e-05, -5.971640348434448e-05, -5.619227886199951e-05, -5.266815423965454e-05, -4.914402961730957e-05, -4.56199049949646e-05, -4.209578037261963e-05, -3.857165575027466e-05, -3.504753112792969e-05, -3.152340650558472e-05, -2.7999281883239746e-05, -2.4475157260894775e-05, -2.0951032638549805e-05, -1.7426908016204834e-05, -1.3902783393859863e-05, -1.0378658771514893e-05, -6.854534149169922e-06, -3.330409526824951e-06, 1.9371509552001953e-07, 3.7178397178649902e-06, 7.241964340209961e-06, 1.0766088962554932e-05, 1.4290213584899902e-05, 1.7814338207244873e-05, 2.1338462829589844e-05, 2.4862587451934814e-05, 2.8386712074279785e-05, 3.1910836696624756e-05, 3.5434961318969727e-05, 3.89590859413147e-05, 4.248321056365967e-05, 4.600733518600464e-05, 4.953145980834961e-05, 5.305558443069458e-05, 5.657970905303955e-05, 6.010383367538452e-05, 6.362795829772949e-05, 6.715208292007446e-05, 7.067620754241943e-05, 7.42003321647644e-05, 7.772445678710938e-05, 8.124858140945435e-05, 8.477270603179932e-05, 8.829683065414429e-05, 9.182095527648926e-05, 9.534507989883423e-05, 9.88692045211792e-05, 0.00010239332914352417, 0.00010591745376586914]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 28.0, 33.0, 41.0, 77.0, 87.0, 116.0, 190.0, 259.0, 398.0, 555.0, 865.0, 1409.0, 2023.0, 3303.0, 5189.0, 8890.0, 15104.0, 25798.0, 45341.0, 79398.0, 136958.0, 206254.0, 202552.0, 131393.0, 76499.0, 43394.0, 25245.0, 14417.0, 8462.0, 5347.0, 3043.0, 1968.0, 1280.0, 869.0, 539.0, 365.0, 280.0, 177.0, 125.0, 82.0, 46.0, 54.0, 29.0, 20.0, 6.0, 11.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.470703125, -2.395751953125, -2.32080078125, -2.245849609375, -2.1708984375, -2.095947265625, -2.02099609375, -1.946044921875, -1.87109375, -1.796142578125, -1.72119140625, -1.646240234375, -1.5712890625, -1.496337890625, -1.42138671875, -1.346435546875, -1.271484375, -1.196533203125, -1.12158203125, -1.046630859375, -0.9716796875, -0.896728515625, -0.82177734375, -0.746826171875, -0.671875, -0.596923828125, -0.52197265625, -0.447021484375, -0.3720703125, -0.297119140625, -0.22216796875, -0.147216796875, -0.072265625, 0.002685546875, 0.07763671875, 0.152587890625, 0.2275390625, 0.302490234375, 0.37744140625, 0.452392578125, 0.52734375, 0.602294921875, 0.67724609375, 0.752197265625, 0.8271484375, 0.902099609375, 0.97705078125, 1.052001953125, 1.126953125, 1.201904296875, 1.27685546875, 1.351806640625, 1.4267578125, 1.501708984375, 1.57666015625, 1.651611328125, 1.7265625, 1.801513671875, 1.87646484375, 1.951416015625, 2.0263671875, 2.101318359375, 2.17626953125, 2.251220703125, 2.326171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 11.0, 7.0, 12.0, 11.0, 18.0, 13.0, 24.0, 26.0, 34.0, 31.0, 44.0, 39.0, 46.0, 58.0, 70.0, 53.0, 62.0, 59.0, 52.0, 45.0, 52.0, 37.0, 27.0, 34.0, 31.0, 16.0, 12.0, 18.0, 12.0, 5.0, 11.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1240234375, -1.0911636352539062, -1.0583038330078125, -1.0254440307617188, -0.992584228515625, -0.9597244262695312, -0.9268646240234375, -0.8940048217773438, -0.86114501953125, -0.8282852172851562, -0.7954254150390625, -0.7625656127929688, -0.729705810546875, -0.6968460083007812, -0.6639862060546875, -0.6311264038085938, -0.5982666015625, -0.5654067993164062, -0.5325469970703125, -0.49968719482421875, -0.466827392578125, -0.43396759033203125, -0.4011077880859375, -0.36824798583984375, -0.33538818359375, -0.30252838134765625, -0.2696685791015625, -0.23680877685546875, -0.203948974609375, -0.17108917236328125, -0.1382293701171875, -0.10536956787109375, -0.072509765625, -0.03964996337890625, -0.0067901611328125, 0.02606964111328125, 0.058929443359375, 0.09178924560546875, 0.1246490478515625, 0.15750885009765625, 0.19036865234375, 0.22322845458984375, 0.2560882568359375, 0.28894805908203125, 0.321807861328125, 0.35466766357421875, 0.3875274658203125, 0.42038726806640625, 0.4532470703125, 0.48610687255859375, 0.5189666748046875, 0.5518264770507812, 0.584686279296875, 0.6175460815429688, 0.6504058837890625, 0.6832656860351562, 0.71612548828125, 0.7489852905273438, 0.7818450927734375, 0.8147048950195312, 0.847564697265625, 0.8804244995117188, 0.9132843017578125, 0.9461441040039062, 0.97900390625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 16.0, 11.0, 23.0, 11.0, 13.0, 18.0, 30.0, 24.0, 32.0, 27.0, 29.0, 23.0, 44.0, 43.0, 46.0, 41.0, 41.0, 30.0, 37.0, 44.0, 35.0, 42.0, 39.0, 39.0, 30.0, 27.0, 32.0, 31.0, 21.0, 21.0, 17.0, 11.0, 13.0, 7.0, 9.0, 8.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.032127380371094, -51.3890495300293, -49.745975494384766, -48.10289764404297, -46.45981979370117, -44.816741943359375, -43.173667907714844, -41.53059005737305, -39.88751220703125, -38.24443435668945, -36.60136032104492, -34.958282470703125, -33.31520462036133, -31.672128677368164, -30.029052734375, -28.385974884033203, -26.742900848388672, -25.099824905395508, -23.45674705505371, -21.813671112060547, -20.17059326171875, -18.527517318725586, -16.884441375732422, -15.241364479064941, -13.598287582397461, -11.95521068572998, -10.3121337890625, -8.669057846069336, -7.0259809494018555, -5.382904052734375, -3.739828109741211, -2.0967512130737305, -0.4536781311035156, 1.1893985271453857, 2.832475185394287, 4.475551605224609, 6.11862850189209, 7.76170539855957, 9.404781341552734, 11.047858238220215, 12.690935134887695, 14.334012031555176, 15.977088928222656, 17.62016487121582, 19.263240814208984, 20.90631866455078, 22.549394607543945, 24.19247055053711, 25.835548400878906, 27.47862434387207, 29.121702194213867, 30.76477813720703, 32.40785598754883, 34.050933837890625, 35.694007873535156, 37.33708572387695, 38.98016357421875, 40.62324142456055, 42.26631546020508, 43.909393310546875, 45.55247116088867, 47.19554901123047, 48.838623046875, 50.4817008972168, 52.12477493286133]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 2.0, 5.0, 8.0, 9.0, 13.0, 13.0, 14.0, 16.0, 12.0, 19.0, 25.0, 37.0, 46.0, 35.0, 33.0, 30.0, 39.0, 42.0, 42.0, 44.0, 33.0, 42.0, 51.0, 45.0, 53.0, 36.0, 44.0, 30.0, 20.0, 23.0, 18.0, 19.0, 25.0, 14.0, 13.0, 15.0, 8.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.3848876953125, -55.198753356933594, -53.01261520385742, -50.826480865478516, -48.64034652709961, -46.45420837402344, -44.26807403564453, -42.081939697265625, -39.89580535888672, -37.70967102050781, -35.52353286743164, -33.337398529052734, -31.151264190673828, -28.96512794494629, -26.77899169921875, -24.592857360839844, -22.406719207763672, -20.220582962036133, -18.034448623657227, -15.848312377929688, -13.662177085876465, -11.476041793823242, -9.289905548095703, -7.1037702560424805, -4.917634963989258, -2.731499433517456, -0.5453639030456543, 1.6407718658447266, 3.826907157897949, 6.013042449951172, 8.199178695678711, 10.385313987731934, 12.571449279785156, 14.757584571838379, 16.9437198638916, 19.12985610961914, 21.315990447998047, 23.502126693725586, 25.688262939453125, 27.87439727783203, 30.06053352355957, 32.24666976928711, 34.432804107666016, 36.61894226074219, 38.805076599121094, 40.9912109375, 43.177345275878906, 45.36348342895508, 47.549617767333984, 49.73575210571289, 51.92189025878906, 54.10802459716797, 56.294158935546875, 58.48029327392578, 60.66643142700195, 62.85256576538086, 65.03870391845703, 67.22483825683594, 69.41097259521484, 71.59710693359375, 73.78324890136719, 75.9693832397461, 78.155517578125, 80.3416519165039, 82.52778625488281]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 12.0, 18.0, 42.0, 56.0, 85.0, 179.0, 268.0, 418.0, 685.0, 1106.0, 1721.0, 2884.0, 4422.0, 6494.0, 10032.0, 14454.0, 20804.0, 28682.0, 38728.0, 50079.0, 61978.0, 73934.0, 83404.0, 89589.0, 91116.0, 88618.0, 81276.0, 70978.0, 59035.0, 47099.0, 36027.0, 26710.0, 18964.0, 13237.0, 9060.0, 5945.0, 3902.0, 2510.0, 1500.0, 958.0, 614.0, 407.0, 217.0, 139.0, 60.0, 45.0, 27.0, 21.0, 4.0, 6.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.453125, -21.688720703125, -20.92431640625, -20.159912109375, -19.3955078125, -18.631103515625, -17.86669921875, -17.102294921875, -16.337890625, -15.573486328125, -14.80908203125, -14.044677734375, -13.2802734375, -12.515869140625, -11.75146484375, -10.987060546875, -10.22265625, -9.458251953125, -8.69384765625, -7.929443359375, -7.1650390625, -6.400634765625, -5.63623046875, -4.871826171875, -4.107421875, -3.343017578125, -2.57861328125, -1.814208984375, -1.0498046875, -0.285400390625, 0.47900390625, 1.243408203125, 2.0078125, 2.772216796875, 3.53662109375, 4.301025390625, 5.0654296875, 5.829833984375, 6.59423828125, 7.358642578125, 8.123046875, 8.887451171875, 9.65185546875, 10.416259765625, 11.1806640625, 11.945068359375, 12.70947265625, 13.473876953125, 14.23828125, 15.002685546875, 15.76708984375, 16.531494140625, 17.2958984375, 18.060302734375, 18.82470703125, 19.589111328125, 20.353515625, 21.117919921875, 21.88232421875, 22.646728515625, 23.4111328125, 24.175537109375, 24.93994140625, 25.704345703125, 26.46875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 2.0, 5.0, 8.0, 9.0, 12.0, 13.0, 15.0, 14.0, 14.0, 18.0, 26.0, 34.0, 47.0, 32.0, 34.0, 32.0, 39.0, 42.0, 38.0, 48.0, 28.0, 45.0, 52.0, 45.0, 52.0, 38.0, 42.0, 32.0, 20.0, 24.0, 18.0, 18.0, 26.0, 15.0, 13.0, 13.0, 10.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.71875, -54.56298828125, -52.4072265625, -50.25146484375, -48.095703125, -45.93994140625, -43.7841796875, -41.62841796875, -39.47265625, -37.31689453125, -35.1611328125, -33.00537109375, -30.849609375, -28.69384765625, -26.5380859375, -24.38232421875, -22.2265625, -20.07080078125, -17.9150390625, -15.75927734375, -13.603515625, -11.44775390625, -9.2919921875, -7.13623046875, -4.98046875, -2.82470703125, -0.6689453125, 1.48681640625, 3.642578125, 5.79833984375, 7.9541015625, 10.10986328125, 12.265625, 14.42138671875, 16.5771484375, 18.73291015625, 20.888671875, 23.04443359375, 25.2001953125, 27.35595703125, 29.51171875, 31.66748046875, 33.8232421875, 35.97900390625, 38.134765625, 40.29052734375, 42.4462890625, 44.60205078125, 46.7578125, 48.91357421875, 51.0693359375, 53.22509765625, 55.380859375, 57.53662109375, 59.6923828125, 61.84814453125, 64.00390625, 66.15966796875, 68.3154296875, 70.47119140625, 72.626953125, 74.78271484375, 76.9384765625, 79.09423828125, 81.25]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 8.0, 6.0, 19.0, 22.0, 28.0, 61.0, 75.0, 136.0, 212.0, 332.0, 525.0, 772.0, 1343.0, 2112.0, 3156.0, 4894.0, 7515.0, 11291.0, 16562.0, 23617.0, 32451.0, 43643.0, 56101.0, 69275.0, 80743.0, 90256.0, 93470.0, 93318.0, 87039.0, 77372.0, 64868.0, 52607.0, 39958.0, 29875.0, 21298.0, 14744.0, 10110.0, 6729.0, 4418.0, 2796.0, 1790.0, 1148.0, 728.0, 418.0, 283.0, 166.0, 89.0, 58.0, 43.0, 24.0, 18.0, 10.0, 10.0, 5.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.1875, -23.377197265625, -22.56689453125, -21.756591796875, -20.9462890625, -20.135986328125, -19.32568359375, -18.515380859375, -17.705078125, -16.894775390625, -16.08447265625, -15.274169921875, -14.4638671875, -13.653564453125, -12.84326171875, -12.032958984375, -11.22265625, -10.412353515625, -9.60205078125, -8.791748046875, -7.9814453125, -7.171142578125, -6.36083984375, -5.550537109375, -4.740234375, -3.929931640625, -3.11962890625, -2.309326171875, -1.4990234375, -0.688720703125, 0.12158203125, 0.931884765625, 1.7421875, 2.552490234375, 3.36279296875, 4.173095703125, 4.9833984375, 5.793701171875, 6.60400390625, 7.414306640625, 8.224609375, 9.034912109375, 9.84521484375, 10.655517578125, 11.4658203125, 12.276123046875, 13.08642578125, 13.896728515625, 14.70703125, 15.517333984375, 16.32763671875, 17.137939453125, 17.9482421875, 18.758544921875, 19.56884765625, 20.379150390625, 21.189453125, 21.999755859375, 22.81005859375, 23.620361328125, 24.4306640625, 25.240966796875, 26.05126953125, 26.861572265625, 27.671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 13.0, 11.0, 15.0, 16.0, 20.0, 10.0, 21.0, 19.0, 32.0, 33.0, 39.0, 28.0, 32.0, 38.0, 47.0, 32.0, 41.0, 48.0, 51.0, 53.0, 43.0, 45.0, 36.0, 44.0, 35.0, 16.0, 25.0, 30.0, 24.0, 18.0, 17.0, 14.0, 4.0, 9.0, 14.0, 6.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-46.96875, -45.611328125, -44.25390625, -42.896484375, -41.5390625, -40.181640625, -38.82421875, -37.466796875, -36.109375, -34.751953125, -33.39453125, -32.037109375, -30.6796875, -29.322265625, -27.96484375, -26.607421875, -25.25, -23.892578125, -22.53515625, -21.177734375, -19.8203125, -18.462890625, -17.10546875, -15.748046875, -14.390625, -13.033203125, -11.67578125, -10.318359375, -8.9609375, -7.603515625, -6.24609375, -4.888671875, -3.53125, -2.173828125, -0.81640625, 0.541015625, 1.8984375, 3.255859375, 4.61328125, 5.970703125, 7.328125, 8.685546875, 10.04296875, 11.400390625, 12.7578125, 14.115234375, 15.47265625, 16.830078125, 18.1875, 19.544921875, 20.90234375, 22.259765625, 23.6171875, 24.974609375, 26.33203125, 27.689453125, 29.046875, 30.404296875, 31.76171875, 33.119140625, 34.4765625, 35.833984375, 37.19140625, 38.548828125, 39.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 18.0, 24.0, 26.0, 63.0, 123.0, 122.0, 242.0, 415.0, 648.0, 1068.0, 1625.0, 2601.0, 4110.0, 6418.0, 9844.0, 14903.0, 21652.0, 30484.0, 42000.0, 55514.0, 68844.0, 82264.0, 91803.0, 97010.0, 96420.0, 90209.0, 80216.0, 66781.0, 53149.0, 40588.0, 29343.0, 20506.0, 13754.0, 9301.0, 5954.0, 3937.0, 2476.0, 1546.0, 945.0, 611.0, 365.0, 227.0, 138.0, 106.0, 56.0, 44.0, 19.0, 14.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.016845703125, -9.68212890625, -9.347412109375, -9.0126953125, -8.677978515625, -8.34326171875, -8.008544921875, -7.673828125, -7.339111328125, -7.00439453125, -6.669677734375, -6.3349609375, -6.000244140625, -5.66552734375, -5.330810546875, -4.99609375, -4.661376953125, -4.32666015625, -3.991943359375, -3.6572265625, -3.322509765625, -2.98779296875, -2.653076171875, -2.318359375, -1.983642578125, -1.64892578125, -1.314208984375, -0.9794921875, -0.644775390625, -0.31005859375, 0.024658203125, 0.359375, 0.694091796875, 1.02880859375, 1.363525390625, 1.6982421875, 2.032958984375, 2.36767578125, 2.702392578125, 3.037109375, 3.371826171875, 3.70654296875, 4.041259765625, 4.3759765625, 4.710693359375, 5.04541015625, 5.380126953125, 5.71484375, 6.049560546875, 6.38427734375, 6.718994140625, 7.0537109375, 7.388427734375, 7.72314453125, 8.057861328125, 8.392578125, 8.727294921875, 9.06201171875, 9.396728515625, 9.7314453125, 10.066162109375, 10.40087890625, 10.735595703125, 11.0703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 5.0, 2.0, 7.0, 7.0, 9.0, 16.0, 12.0, 13.0, 13.0, 17.0, 22.0, 29.0, 30.0, 27.0, 31.0, 32.0, 34.0, 44.0, 31.0, 48.0, 41.0, 39.0, 36.0, 43.0, 34.0, 36.0, 38.0, 31.0, 30.0, 25.0, 38.0, 19.0, 23.0, 27.0, 14.0, 10.0, 10.0, 13.0, 13.0, 6.0, 5.0, 10.0, 9.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.001354217529296875, -0.001314699649810791, -0.001275181770324707, -0.001235663890838623, -0.001196146011352539, -0.001156628131866455, -0.001117110252380371, -0.0010775923728942871, -0.0010380744934082031, -0.0009985566139221191, -0.0009590387344360352, -0.0009195208549499512, -0.0008800029754638672, -0.0008404850959777832, -0.0008009672164916992, -0.0007614493370056152, -0.0007219314575195312, -0.0006824135780334473, -0.0006428956985473633, -0.0006033778190612793, -0.0005638599395751953, -0.0005243420600891113, -0.00048482418060302734, -0.00044530630111694336, -0.0004057884216308594, -0.0003662705421447754, -0.0003267526626586914, -0.0002872347831726074, -0.00024771690368652344, -0.00020819902420043945, -0.00016868114471435547, -0.00012916326522827148, -8.96453857421875e-05, -5.0127506256103516e-05, -1.0609626770019531e-05, 2.8908252716064453e-05, 6.842613220214844e-05, 0.00010794401168823242, 0.0001474618911743164, 0.0001869797706604004, 0.00022649765014648438, 0.00026601552963256836, 0.00030553340911865234, 0.00034505128860473633, 0.0003845691680908203, 0.0004240870475769043, 0.0004636049270629883, 0.0005031228065490723, 0.0005426406860351562, 0.0005821585655212402, 0.0006216764450073242, 0.0006611943244934082, 0.0007007122039794922, 0.0007402300834655762, 0.0007797479629516602, 0.0008192658424377441, 0.0008587837219238281, 0.0008983016014099121, 0.0009378194808959961, 0.00097733736038208, 0.001016855239868164, 0.001056373119354248, 0.001095890998840332, 0.001135408878326416, 0.0011749267578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 31.0, 33.0, 48.0, 76.0, 112.0, 162.0, 278.0, 415.0, 701.0, 1157.0, 1683.0, 2777.0, 4308.0, 6672.0, 10182.0, 15364.0, 22846.0, 32895.0, 45333.0, 59031.0, 74013.0, 87041.0, 97033.0, 100889.0, 98336.0, 89701.0, 77218.0, 63052.0, 47957.0, 35301.0, 24727.0, 17292.0, 11474.0, 7449.0, 4705.0, 3066.0, 1946.0, 1232.0, 717.0, 473.0, 297.0, 172.0, 130.0, 88.0, 45.0, 44.0, 11.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-11.921875, -11.5447998046875, -11.167724609375, -10.7906494140625, -10.41357421875, -10.0364990234375, -9.659423828125, -9.2823486328125, -8.9052734375, -8.5281982421875, -8.151123046875, -7.7740478515625, -7.39697265625, -7.0198974609375, -6.642822265625, -6.2657470703125, -5.888671875, -5.5115966796875, -5.134521484375, -4.7574462890625, -4.38037109375, -4.0032958984375, -3.626220703125, -3.2491455078125, -2.8720703125, -2.4949951171875, -2.117919921875, -1.7408447265625, -1.36376953125, -0.9866943359375, -0.609619140625, -0.2325439453125, 0.14453125, 0.5216064453125, 0.898681640625, 1.2757568359375, 1.65283203125, 2.0299072265625, 2.406982421875, 2.7840576171875, 3.1611328125, 3.5382080078125, 3.915283203125, 4.2923583984375, 4.66943359375, 5.0465087890625, 5.423583984375, 5.8006591796875, 6.177734375, 6.5548095703125, 6.931884765625, 7.3089599609375, 7.68603515625, 8.0631103515625, 8.440185546875, 8.8172607421875, 9.1943359375, 9.5714111328125, 9.948486328125, 10.3255615234375, 10.70263671875, 11.0797119140625, 11.456787109375, 11.8338623046875, 12.2109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 14.0, 12.0, 12.0, 12.0, 14.0, 29.0, 25.0, 29.0, 33.0, 38.0, 33.0, 42.0, 53.0, 51.0, 39.0, 48.0, 47.0, 40.0, 42.0, 45.0, 50.0, 30.0, 29.0, 24.0, 20.0, 29.0, 22.0, 16.0, 21.0, 11.0, 22.0, 11.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-7.0859375, -6.87652587890625, -6.6671142578125, -6.45770263671875, -6.248291015625, -6.03887939453125, -5.8294677734375, -5.62005615234375, -5.41064453125, -5.20123291015625, -4.9918212890625, -4.78240966796875, -4.572998046875, -4.36358642578125, -4.1541748046875, -3.94476318359375, -3.7353515625, -3.52593994140625, -3.3165283203125, -3.10711669921875, -2.897705078125, -2.68829345703125, -2.4788818359375, -2.26947021484375, -2.06005859375, -1.85064697265625, -1.6412353515625, -1.43182373046875, -1.222412109375, -1.01300048828125, -0.8035888671875, -0.59417724609375, -0.384765625, -0.17535400390625, 0.0340576171875, 0.24346923828125, 0.452880859375, 0.66229248046875, 0.8717041015625, 1.08111572265625, 1.29052734375, 1.49993896484375, 1.7093505859375, 1.91876220703125, 2.128173828125, 2.33758544921875, 2.5469970703125, 2.75640869140625, 2.9658203125, 3.17523193359375, 3.3846435546875, 3.59405517578125, 3.803466796875, 4.01287841796875, 4.2222900390625, 4.43170166015625, 4.64111328125, 4.85052490234375, 5.0599365234375, 5.26934814453125, 5.478759765625, 5.68817138671875, 5.8975830078125, 6.10699462890625, 6.31640625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 5.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 17.0, 18.0, 24.0, 23.0, 19.0, 21.0, 23.0, 26.0, 33.0, 38.0, 42.0, 31.0, 39.0, 40.0, 32.0, 37.0, 40.0, 40.0, 39.0, 49.0, 35.0, 37.0, 31.0, 29.0, 27.0, 34.0, 18.0, 17.0, 20.0, 19.0, 9.0, 5.0, 13.0, 7.0, 5.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.5462532043457, -50.931087493896484, -49.31591796875, -47.70075225830078, -46.08558654785156, -44.470420837402344, -42.85525131225586, -41.24008560180664, -39.62491989135742, -38.0097541809082, -36.39458465576172, -34.7794189453125, -33.16425323486328, -31.54908561706543, -29.933917999267578, -28.31875228881836, -26.703584671020508, -25.088417053222656, -23.473251342773438, -21.858083724975586, -20.242918014526367, -18.627750396728516, -17.012584686279297, -15.397417068481445, -13.78225040435791, -12.167083740234375, -10.55191707611084, -8.936750411987305, -7.321583271026611, -5.706416130065918, -4.091249465942383, -2.4760828018188477, -0.8609161376953125, 0.7542506456375122, 2.369417428970337, 3.984584331512451, 5.599750995635986, 7.21491813659668, 8.830084800720215, 10.44525146484375, 12.060418128967285, 13.67558479309082, 15.290751457214355, 16.90591812133789, 18.521085739135742, 20.136253356933594, 21.751419067382812, 23.36658477783203, 24.981752395629883, 26.596920013427734, 28.212085723876953, 29.827253341674805, 31.442419052124023, 33.057586669921875, 34.672752380371094, 36.28791809082031, 37.9030876159668, 39.518253326416016, 41.1334228515625, 42.74858856201172, 44.36375427246094, 45.978919982910156, 47.59408950805664, 49.20925521850586, 50.82442092895508]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 9.0, 6.0, 12.0, 8.0, 10.0, 9.0, 14.0, 24.0, 16.0, 21.0, 22.0, 30.0, 25.0, 24.0, 39.0, 41.0, 43.0, 34.0, 43.0, 40.0, 43.0, 36.0, 40.0, 46.0, 47.0, 42.0, 29.0, 33.0, 35.0, 26.0, 22.0, 14.0, 23.0, 16.0, 15.0, 16.0, 14.0, 12.0, 6.0, 5.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.82920837402344, -61.526241302490234, -59.22327423095703, -56.92030715942383, -54.617340087890625, -52.31437683105469, -50.011409759521484, -47.70844268798828, -45.40547561645508, -43.102508544921875, -40.79954147338867, -38.49657440185547, -36.19361114501953, -33.89064025878906, -31.587677001953125, -29.284709930419922, -26.98174285888672, -24.678775787353516, -22.375808715820312, -20.072843551635742, -17.76987648010254, -15.466909408569336, -13.16394329071045, -10.860977172851562, -8.55801010131836, -6.2550435066223145, -3.9520769119262695, -1.6491103172302246, 0.6538562774658203, 2.9568233489990234, 5.25978946685791, 7.562755584716797, 9.865730285644531, 12.168697357177734, 14.471663475036621, 16.774629592895508, 19.07759666442871, 21.380563735961914, 23.683528900146484, 25.986495971679688, 28.28946304321289, 30.592430114746094, 32.8953971862793, 35.1983642578125, 37.50132751464844, 39.804298400878906, 42.107261657714844, 44.41022872924805, 46.71319580078125, 49.01616287231445, 51.319129943847656, 53.62209701538086, 55.92506408691406, 58.22802734375, 60.5309944152832, 62.833961486816406, 65.13693237304688, 67.43989562988281, 69.74286651611328, 72.04582977294922, 74.34880065917969, 76.65176391601562, 78.9547348022461, 81.25769805908203, 83.56066131591797]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 12.0, 18.0, 36.0, 74.0, 112.0, 214.0, 320.0, 604.0, 1027.0, 1800.0, 2953.0, 4897.0, 7773.0, 12406.0, 19553.0, 29981.0, 44907.0, 65381.0, 92458.0, 127206.0, 167993.0, 213889.0, 262978.0, 305511.0, 339857.0, 360023.0, 361250.0, 346623.0, 313400.0, 270297.0, 224168.0, 177017.0, 134366.0, 98022.0, 69838.0, 48456.0, 32209.0, 21187.0, 13514.0, 8394.0, 5284.0, 3291.0, 1936.0, 1247.0, 747.0, 437.0, 263.0, 156.0, 89.0, 37.0, 40.0, 15.0, 16.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.4130859375, -36.169921875, -34.9267578125, -33.68359375, -32.4404296875, -31.197265625, -29.9541015625, -28.7109375, -27.4677734375, -26.224609375, -24.9814453125, -23.73828125, -22.4951171875, -21.251953125, -20.0087890625, -18.765625, -17.5224609375, -16.279296875, -15.0361328125, -13.79296875, -12.5498046875, -11.306640625, -10.0634765625, -8.8203125, -7.5771484375, -6.333984375, -5.0908203125, -3.84765625, -2.6044921875, -1.361328125, -0.1181640625, 1.125, 2.3681640625, 3.611328125, 4.8544921875, 6.09765625, 7.3408203125, 8.583984375, 9.8271484375, 11.0703125, 12.3134765625, 13.556640625, 14.7998046875, 16.04296875, 17.2861328125, 18.529296875, 19.7724609375, 21.015625, 22.2587890625, 23.501953125, 24.7451171875, 25.98828125, 27.2314453125, 28.474609375, 29.7177734375, 30.9609375, 32.2041015625, 33.447265625, 34.6904296875, 35.93359375, 37.1767578125, 38.419921875, 39.6630859375, 40.90625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 10.0, 8.0, 11.0, 9.0, 8.0, 12.0, 16.0, 21.0, 19.0, 22.0, 17.0, 35.0, 24.0, 25.0, 44.0, 40.0, 42.0, 41.0, 38.0, 44.0, 32.0, 41.0, 47.0, 40.0, 48.0, 37.0, 31.0, 34.0, 33.0, 25.0, 17.0, 21.0, 18.0, 15.0, 15.0, 18.0, 13.0, 10.0, 7.0, 7.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.625, -58.412109375, -56.19921875, -53.986328125, -51.7734375, -49.560546875, -47.34765625, -45.134765625, -42.921875, -40.708984375, -38.49609375, -36.283203125, -34.0703125, -31.857421875, -29.64453125, -27.431640625, -25.21875, -23.005859375, -20.79296875, -18.580078125, -16.3671875, -14.154296875, -11.94140625, -9.728515625, -7.515625, -5.302734375, -3.08984375, -0.876953125, 1.3359375, 3.548828125, 5.76171875, 7.974609375, 10.1875, 12.400390625, 14.61328125, 16.826171875, 19.0390625, 21.251953125, 23.46484375, 25.677734375, 27.890625, 30.103515625, 32.31640625, 34.529296875, 36.7421875, 38.955078125, 41.16796875, 43.380859375, 45.59375, 47.806640625, 50.01953125, 52.232421875, 54.4453125, 56.658203125, 58.87109375, 61.083984375, 63.296875, 65.509765625, 67.72265625, 69.935546875, 72.1484375, 74.361328125, 76.57421875, 78.787109375, 81.0]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 15.0, 36.0, 57.0, 86.0, 167.0, 272.0, 479.0, 779.0, 1302.0, 2220.0, 3590.0, 5632.0, 8853.0, 13948.0, 21089.0, 30862.0, 44715.0, 62279.0, 86316.0, 115240.0, 148996.0, 185139.0, 223764.0, 259530.0, 290317.0, 313029.0, 325071.0, 321785.0, 307877.0, 282133.0, 250635.0, 212595.0, 174595.0, 138329.0, 106876.0, 79111.0, 56983.0, 40309.0, 27467.0, 18630.0, 12096.0, 7940.0, 5170.0, 3140.0, 1918.0, 1188.0, 716.0, 417.0, 235.0, 157.0, 82.0, 52.0, 26.0, 17.0, 11.0, 7.0, 1.0, 3.0], "bins": [-39.53125, -38.328125, -37.125, -35.921875, -34.71875, -33.515625, -32.3125, -31.109375, -29.90625, -28.703125, -27.5, -26.296875, -25.09375, -23.890625, -22.6875, -21.484375, -20.28125, -19.078125, -17.875, -16.671875, -15.46875, -14.265625, -13.0625, -11.859375, -10.65625, -9.453125, -8.25, -7.046875, -5.84375, -4.640625, -3.4375, -2.234375, -1.03125, 0.171875, 1.375, 2.578125, 3.78125, 4.984375, 6.1875, 7.390625, 8.59375, 9.796875, 11.0, 12.203125, 13.40625, 14.609375, 15.8125, 17.015625, 18.21875, 19.421875, 20.625, 21.828125, 23.03125, 24.234375, 25.4375, 26.640625, 27.84375, 29.046875, 30.25, 31.453125, 32.65625, 33.859375, 35.0625, 36.265625, 37.46875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 9.0, 18.0, 12.0, 25.0, 26.0, 43.0, 39.0, 58.0, 51.0, 76.0, 86.0, 109.0, 107.0, 124.0, 136.0, 152.0, 187.0, 174.0, 186.0, 192.0, 199.0, 196.0, 186.0, 206.0, 174.0, 181.0, 136.0, 166.0, 150.0, 124.0, 103.0, 90.0, 67.0, 55.0, 57.0, 39.0, 32.0, 22.0, 23.0, 17.0, 10.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.015625, -30.07958984375, -29.1435546875, -28.20751953125, -27.271484375, -26.33544921875, -25.3994140625, -24.46337890625, -23.52734375, -22.59130859375, -21.6552734375, -20.71923828125, -19.783203125, -18.84716796875, -17.9111328125, -16.97509765625, -16.0390625, -15.10302734375, -14.1669921875, -13.23095703125, -12.294921875, -11.35888671875, -10.4228515625, -9.48681640625, -8.55078125, -7.61474609375, -6.6787109375, -5.74267578125, -4.806640625, -3.87060546875, -2.9345703125, -1.99853515625, -1.0625, -0.12646484375, 0.8095703125, 1.74560546875, 2.681640625, 3.61767578125, 4.5537109375, 5.48974609375, 6.42578125, 7.36181640625, 8.2978515625, 9.23388671875, 10.169921875, 11.10595703125, 12.0419921875, 12.97802734375, 13.9140625, 14.85009765625, 15.7861328125, 16.72216796875, 17.658203125, 18.59423828125, 19.5302734375, 20.46630859375, 21.40234375, 22.33837890625, 23.2744140625, 24.21044921875, 25.146484375, 26.08251953125, 27.0185546875, 27.95458984375, 28.890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 4.0, 4.0, 10.0, 9.0, 12.0, 15.0, 23.0, 27.0, 33.0, 31.0, 29.0, 31.0, 27.0, 25.0, 34.0, 45.0, 34.0, 48.0, 49.0, 42.0, 50.0, 39.0, 37.0, 42.0, 32.0, 37.0, 25.0, 25.0, 23.0, 21.0, 20.0, 15.0, 13.0, 15.0, 12.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-65.73580169677734, -63.70317840576172, -61.67055892944336, -59.637935638427734, -57.605316162109375, -55.57269287109375, -53.540069580078125, -51.507450103759766, -49.474830627441406, -47.44220733642578, -45.40958786010742, -43.3769645690918, -41.34434509277344, -39.31172180175781, -37.27909851074219, -35.24647903442383, -33.2138557434082, -31.18123435974121, -29.14861297607422, -27.115989685058594, -25.083370208740234, -23.05074691772461, -21.018125534057617, -18.985504150390625, -16.952882766723633, -14.92026138305664, -12.887639999389648, -10.85501766204834, -8.822396278381348, -6.7897748947143555, -4.757152557373047, -2.7245311737060547, -0.6919097900390625, 1.3407118320465088, 3.37333345413208, 5.4059553146362305, 7.438576698303223, 9.471198081970215, 11.503820419311523, 13.536441802978516, 15.569063186645508, 17.6016845703125, 19.634305953979492, 21.666927337646484, 23.69955062866211, 25.73217010498047, 27.764793395996094, 29.797414779663086, 31.830036163330078, 33.8626594543457, 35.89527893066406, 37.92790222167969, 39.96052169799805, 41.99314498901367, 44.02576446533203, 46.058387756347656, 48.09101104736328, 50.123634338378906, 52.156253814697266, 54.18887710571289, 56.22149658203125, 58.254119873046875, 60.2867431640625, 62.31936264038086, 64.35198211669922]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 9.0, 9.0, 10.0, 13.0, 7.0, 13.0, 16.0, 18.0, 25.0, 31.0, 23.0, 28.0, 29.0, 37.0, 37.0, 52.0, 43.0, 38.0, 40.0, 35.0, 29.0, 29.0, 38.0, 48.0, 37.0, 36.0, 21.0, 16.0, 14.0, 28.0, 32.0, 25.0, 25.0, 12.0, 16.0, 21.0, 17.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.78849029541016, -66.302001953125, -63.81550979614258, -61.329017639160156, -58.842529296875, -56.356040954589844, -53.86954879760742, -51.383056640625, -48.896568298339844, -46.41007995605469, -43.923587799072266, -41.437095642089844, -38.95060729980469, -36.46411895751953, -33.97762680053711, -31.49113655090332, -29.00464630126953, -26.518156051635742, -24.031665802001953, -21.545175552368164, -19.058685302734375, -16.572195053100586, -14.085704803466797, -11.599214553833008, -9.112724304199219, -6.62623405456543, -4.139743804931641, -1.6532535552978516, 0.8332366943359375, 3.3197269439697266, 5.806217193603516, 8.292707443237305, 10.779190063476562, 13.265680313110352, 15.75217056274414, 18.23866081237793, 20.72515106201172, 23.211641311645508, 25.698131561279297, 28.184621810913086, 30.671112060546875, 33.15760040283203, 35.64409255981445, 38.130584716796875, 40.61707305908203, 43.10356140136719, 45.59005355834961, 48.07654571533203, 50.56303405761719, 53.049522399902344, 55.536014556884766, 58.02250671386719, 60.508995056152344, 62.9954833984375, 65.48197937011719, 67.96846771240234, 70.4549560546875, 72.94144439697266, 75.42793273925781, 77.9144287109375, 80.40091705322266, 82.88740539550781, 85.3739013671875, 87.86038970947266, 90.34687805175781]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 22.0, 34.0, 50.0, 65.0, 87.0, 101.0, 184.0, 247.0, 373.0, 626.0, 991.0, 1623.0, 2675.0, 4709.0, 8486.0, 15829.0, 29230.0, 55067.0, 104322.0, 187944.0, 247227.0, 177624.0, 98161.0, 51583.0, 27612.0, 14672.0, 8006.0, 4365.0, 2487.0, 1516.0, 858.0, 565.0, 383.0, 269.0, 180.0, 101.0, 54.0, 53.0, 51.0, 31.0, 14.0, 23.0, 5.0, 12.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0859375, -10.7333984375, -10.380859375, -10.0283203125, -9.67578125, -9.3232421875, -8.970703125, -8.6181640625, -8.265625, -7.9130859375, -7.560546875, -7.2080078125, -6.85546875, -6.5029296875, -6.150390625, -5.7978515625, -5.4453125, -5.0927734375, -4.740234375, -4.3876953125, -4.03515625, -3.6826171875, -3.330078125, -2.9775390625, -2.625, -2.2724609375, -1.919921875, -1.5673828125, -1.21484375, -0.8623046875, -0.509765625, -0.1572265625, 0.1953125, 0.5478515625, 0.900390625, 1.2529296875, 1.60546875, 1.9580078125, 2.310546875, 2.6630859375, 3.015625, 3.3681640625, 3.720703125, 4.0732421875, 4.42578125, 4.7783203125, 5.130859375, 5.4833984375, 5.8359375, 6.1884765625, 6.541015625, 6.8935546875, 7.24609375, 7.5986328125, 7.951171875, 8.3037109375, 8.65625, 9.0087890625, 9.361328125, 9.7138671875, 10.06640625, 10.4189453125, 10.771484375, 11.1240234375, 11.4765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 8.0, 10.0, 14.0, 7.0, 12.0, 16.0, 19.0, 26.0, 31.0, 22.0, 29.0, 26.0, 39.0, 37.0, 52.0, 43.0, 39.0, 39.0, 34.0, 30.0, 33.0, 35.0, 47.0, 42.0, 31.0, 22.0, 15.0, 15.0, 28.0, 32.0, 26.0, 24.0, 12.0, 16.0, 22.0, 16.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.9375, -66.44140625, -63.9453125, -61.44921875, -58.953125, -56.45703125, -53.9609375, -51.46484375, -48.96875, -46.47265625, -43.9765625, -41.48046875, -38.984375, -36.48828125, -33.9921875, -31.49609375, -29.0, -26.50390625, -24.0078125, -21.51171875, -19.015625, -16.51953125, -14.0234375, -11.52734375, -9.03125, -6.53515625, -4.0390625, -1.54296875, 0.953125, 3.44921875, 5.9453125, 8.44140625, 10.9375, 13.43359375, 15.9296875, 18.42578125, 20.921875, 23.41796875, 25.9140625, 28.41015625, 30.90625, 33.40234375, 35.8984375, 38.39453125, 40.890625, 43.38671875, 45.8828125, 48.37890625, 50.875, 53.37109375, 55.8671875, 58.36328125, 60.859375, 63.35546875, 65.8515625, 68.34765625, 70.84375, 73.33984375, 75.8359375, 78.33203125, 80.828125, 83.32421875, 85.8203125, 88.31640625, 90.8125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 8.0, 14.0, 13.0, 20.0, 25.0, 35.0, 45.0, 64.0, 87.0, 133.0, 214.0, 336.0, 486.0, 749.0, 1214.0, 2146.0, 3970.0, 7540.0, 15510.0, 34836.0, 85397.0, 230347.0, 377658.0, 170252.0, 64026.0, 26771.0, 12442.0, 6104.0, 3258.0, 1801.0, 1087.0, 638.0, 399.0, 287.0, 190.0, 130.0, 83.0, 70.0, 38.0, 38.0, 24.0, 18.0, 11.0, 8.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.6953125, -14.2265625, -13.7578125, -13.2890625, -12.8203125, -12.3515625, -11.8828125, -11.4140625, -10.9453125, -10.4765625, -10.0078125, -9.5390625, -9.0703125, -8.6015625, -8.1328125, -7.6640625, -7.1953125, -6.7265625, -6.2578125, -5.7890625, -5.3203125, -4.8515625, -4.3828125, -3.9140625, -3.4453125, -2.9765625, -2.5078125, -2.0390625, -1.5703125, -1.1015625, -0.6328125, -0.1640625, 0.3046875, 0.7734375, 1.2421875, 1.7109375, 2.1796875, 2.6484375, 3.1171875, 3.5859375, 4.0546875, 4.5234375, 4.9921875, 5.4609375, 5.9296875, 6.3984375, 6.8671875, 7.3359375, 7.8046875, 8.2734375, 8.7421875, 9.2109375, 9.6796875, 10.1484375, 10.6171875, 11.0859375, 11.5546875, 12.0234375, 12.4921875, 12.9609375, 13.4296875, 13.8984375, 14.3671875, 14.8359375, 15.3046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 11.0, 4.0, 12.0, 9.0, 11.0, 19.0, 24.0, 23.0, 22.0, 18.0, 14.0, 30.0, 27.0, 40.0, 30.0, 34.0, 34.0, 49.0, 52.0, 32.0, 37.0, 37.0, 39.0, 46.0, 40.0, 31.0, 25.0, 36.0, 29.0, 25.0, 35.0, 20.0, 21.0, 14.0, 10.0, 5.0, 7.0, 11.0, 8.0, 5.0, 4.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46875, -44.75537109375, -43.0419921875, -41.32861328125, -39.615234375, -37.90185546875, -36.1884765625, -34.47509765625, -32.76171875, -31.04833984375, -29.3349609375, -27.62158203125, -25.908203125, -24.19482421875, -22.4814453125, -20.76806640625, -19.0546875, -17.34130859375, -15.6279296875, -13.91455078125, -12.201171875, -10.48779296875, -8.7744140625, -7.06103515625, -5.34765625, -3.63427734375, -1.9208984375, -0.20751953125, 1.505859375, 3.21923828125, 4.9326171875, 6.64599609375, 8.359375, 10.07275390625, 11.7861328125, 13.49951171875, 15.212890625, 16.92626953125, 18.6396484375, 20.35302734375, 22.06640625, 23.77978515625, 25.4931640625, 27.20654296875, 28.919921875, 30.63330078125, 32.3466796875, 34.06005859375, 35.7734375, 37.48681640625, 39.2001953125, 40.91357421875, 42.626953125, 44.34033203125, 46.0537109375, 47.76708984375, 49.48046875, 51.19384765625, 52.9072265625, 54.62060546875, 56.333984375, 58.04736328125, 59.7607421875, 61.47412109375, 63.1875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 5.0, 7.0, 14.0, 12.0, 17.0, 22.0, 17.0, 44.0, 58.0, 81.0, 132.0, 193.0, 290.0, 401.0, 622.0, 924.0, 1514.0, 2394.0, 4363.0, 7789.0, 16334.0, 39317.0, 120465.0, 409259.0, 302158.0, 83788.0, 29732.0, 12888.0, 6474.0, 3573.0, 2048.0, 1209.0, 796.0, 498.0, 376.0, 219.0, 149.0, 125.0, 76.0, 53.0, 28.0, 22.0, 22.0, 13.0, 9.0, 6.0, 11.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.701171875, -3.581207275390625, -3.46124267578125, -3.341278076171875, -3.2213134765625, -3.101348876953125, -2.98138427734375, -2.861419677734375, -2.741455078125, -2.621490478515625, -2.50152587890625, -2.381561279296875, -2.2615966796875, -2.141632080078125, -2.02166748046875, -1.901702880859375, -1.78173828125, -1.661773681640625, -1.54180908203125, -1.421844482421875, -1.3018798828125, -1.181915283203125, -1.06195068359375, -0.941986083984375, -0.822021484375, -0.702056884765625, -0.58209228515625, -0.462127685546875, -0.3421630859375, -0.222198486328125, -0.10223388671875, 0.017730712890625, 0.1376953125, 0.257659912109375, 0.37762451171875, 0.497589111328125, 0.6175537109375, 0.737518310546875, 0.85748291015625, 0.977447509765625, 1.097412109375, 1.217376708984375, 1.33734130859375, 1.457305908203125, 1.5772705078125, 1.697235107421875, 1.81719970703125, 1.937164306640625, 2.05712890625, 2.177093505859375, 2.29705810546875, 2.417022705078125, 2.5369873046875, 2.656951904296875, 2.77691650390625, 2.896881103515625, 3.016845703125, 3.136810302734375, 3.25677490234375, 3.376739501953125, 3.4967041015625, 3.616668701171875, 3.73663330078125, 3.856597900390625, 3.9765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 15.0, 22.0, 20.0, 17.0, 30.0, 35.0, 27.0, 47.0, 46.0, 51.0, 43.0, 55.0, 58.0, 62.0, 56.0, 57.0, 44.0, 55.0, 32.0, 41.0, 31.0, 27.0, 19.0, 17.0, 11.0, 11.0, 10.0, 5.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.00024199485778808594, -0.00023564323782920837, -0.0002292916178703308, -0.00022293999791145325, -0.00021658837795257568, -0.00021023675799369812, -0.00020388513803482056, -0.000197533518075943, -0.00019118189811706543, -0.00018483027815818787, -0.0001784786581993103, -0.00017212703824043274, -0.00016577541828155518, -0.0001594237983226776, -0.00015307217836380005, -0.00014672055840492249, -0.00014036893844604492, -0.00013401731848716736, -0.0001276656985282898, -0.00012131407856941223, -0.00011496245861053467, -0.0001086108386516571, -0.00010225921869277954, -9.590759873390198e-05, -8.955597877502441e-05, -8.320435881614685e-05, -7.685273885726929e-05, -7.050111889839172e-05, -6.414949893951416e-05, -5.77978789806366e-05, -5.144625902175903e-05, -4.509463906288147e-05, -3.8743019104003906e-05, -3.239139914512634e-05, -2.603977918624878e-05, -1.9688159227371216e-05, -1.3336539268493652e-05, -6.984919309616089e-06, -6.332993507385254e-07, 5.718320608139038e-06, 1.2069940567016602e-05, 1.8421560525894165e-05, 2.477318048477173e-05, 3.112480044364929e-05, 3.7476420402526855e-05, 4.382804036140442e-05, 5.017966032028198e-05, 5.6531280279159546e-05, 6.288290023803711e-05, 6.923452019691467e-05, 7.558614015579224e-05, 8.19377601146698e-05, 8.828938007354736e-05, 9.464100003242493e-05, 0.00010099261999130249, 0.00010734423995018005, 0.00011369585990905762, 0.00012004747986793518, 0.00012639909982681274, 0.0001327507197856903, 0.00013910233974456787, 0.00014545395970344543, 0.000151805579662323, 0.00015815719962120056, 0.00016450881958007812]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 15.0, 12.0, 23.0, 39.0, 47.0, 90.0, 87.0, 152.0, 195.0, 274.0, 356.0, 480.0, 728.0, 1052.0, 1660.0, 2342.0, 3702.0, 5882.0, 9583.0, 16098.0, 28219.0, 49801.0, 90929.0, 165838.0, 245253.0, 186196.0, 103694.0, 56007.0, 31963.0, 18336.0, 10777.0, 6445.0, 3986.0, 2644.0, 1671.0, 1137.0, 852.0, 569.0, 432.0, 309.0, 215.0, 144.0, 101.0, 70.0, 49.0, 37.0, 16.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0], "bins": [-4.10546875, -3.983306884765625, -3.86114501953125, -3.738983154296875, -3.6168212890625, -3.494659423828125, -3.37249755859375, -3.250335693359375, -3.128173828125, -3.006011962890625, -2.88385009765625, -2.761688232421875, -2.6395263671875, -2.517364501953125, -2.39520263671875, -2.273040771484375, -2.15087890625, -2.028717041015625, -1.90655517578125, -1.784393310546875, -1.6622314453125, -1.540069580078125, -1.41790771484375, -1.295745849609375, -1.173583984375, -1.051422119140625, -0.92926025390625, -0.807098388671875, -0.6849365234375, -0.562774658203125, -0.44061279296875, -0.318450927734375, -0.1962890625, -0.074127197265625, 0.04803466796875, 0.170196533203125, 0.2923583984375, 0.414520263671875, 0.53668212890625, 0.658843994140625, 0.781005859375, 0.903167724609375, 1.02532958984375, 1.147491455078125, 1.2696533203125, 1.391815185546875, 1.51397705078125, 1.636138916015625, 1.75830078125, 1.880462646484375, 2.00262451171875, 2.124786376953125, 2.2469482421875, 2.369110107421875, 2.49127197265625, 2.613433837890625, 2.735595703125, 2.857757568359375, 2.97991943359375, 3.102081298828125, 3.2242431640625, 3.346405029296875, 3.46856689453125, 3.590728759765625, 3.712890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 6.0, 3.0, 9.0, 10.0, 13.0, 13.0, 14.0, 29.0, 35.0, 57.0, 96.0, 127.0, 175.0, 129.0, 76.0, 58.0, 34.0, 22.0, 18.0, 13.0, 13.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.14227294921875, -4.0150146484375, -3.88775634765625, -3.760498046875, -3.63323974609375, -3.5059814453125, -3.37872314453125, -3.25146484375, -3.12420654296875, -2.9969482421875, -2.86968994140625, -2.742431640625, -2.61517333984375, -2.4879150390625, -2.36065673828125, -2.2333984375, -2.10614013671875, -1.9788818359375, -1.85162353515625, -1.724365234375, -1.59710693359375, -1.4698486328125, -1.34259033203125, -1.21533203125, -1.08807373046875, -0.9608154296875, -0.83355712890625, -0.706298828125, -0.57904052734375, -0.4517822265625, -0.32452392578125, -0.197265625, -0.07000732421875, 0.0572509765625, 0.18450927734375, 0.311767578125, 0.43902587890625, 0.5662841796875, 0.69354248046875, 0.82080078125, 0.94805908203125, 1.0753173828125, 1.20257568359375, 1.329833984375, 1.45709228515625, 1.5843505859375, 1.71160888671875, 1.8388671875, 1.96612548828125, 2.0933837890625, 2.22064208984375, 2.347900390625, 2.47515869140625, 2.6024169921875, 2.72967529296875, 2.85693359375, 2.98419189453125, 3.1114501953125, 3.23870849609375, 3.365966796875, 3.49322509765625, 3.6204833984375, 3.74774169921875, 3.875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 7.0, 3.0, 2.0, 6.0, 6.0, 6.0, 3.0, 4.0, 10.0, 10.0, 12.0, 15.0, 17.0, 40.0, 26.0, 30.0, 31.0, 31.0, 26.0, 29.0, 41.0, 36.0, 41.0, 42.0, 50.0, 43.0, 43.0, 48.0, 44.0, 30.0, 29.0, 42.0, 30.0, 17.0, 26.0, 20.0, 18.0, 15.0, 14.0, 14.0, 9.0, 7.0, 9.0, 8.0, 0.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-65.58109283447266, -63.537105560302734, -61.49312210083008, -59.449134826660156, -57.4051513671875, -55.36116409301758, -53.317176818847656, -51.273193359375, -49.229209899902344, -47.18522262573242, -45.141239166259766, -43.097251892089844, -41.05326843261719, -39.009281158447266, -36.965293884277344, -34.92131042480469, -32.877323150634766, -30.833337783813477, -28.789352416992188, -26.745365142822266, -24.70138168334961, -22.657394409179688, -20.6134090423584, -18.56942367553711, -16.52543830871582, -14.481452941894531, -12.437467575073242, -10.393481254577637, -8.349495887756348, -6.305510520935059, -4.261524200439453, -2.217538833618164, -0.173553466796875, 1.8704321384429932, 3.9144177436828613, 5.958403587341309, 8.002388954162598, 10.046374320983887, 12.090360641479492, 14.134346008300781, 16.17833137512207, 18.22231674194336, 20.26630210876465, 22.310287475585938, 24.35427474975586, 26.398258209228516, 28.442245483398438, 30.486230850219727, 32.530216217041016, 34.57420349121094, 36.618186950683594, 38.662174224853516, 40.70615768432617, 42.750144958496094, 44.79412841796875, 46.83811569213867, 48.882102966308594, 50.926090240478516, 52.97007369995117, 55.014060974121094, 57.05804443359375, 59.10203170776367, 61.146018981933594, 63.19000244140625, 65.2339859008789]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 10.0, 8.0, 13.0, 11.0, 7.0, 18.0, 11.0, 26.0, 32.0, 22.0, 26.0, 28.0, 38.0, 31.0, 45.0, 57.0, 33.0, 43.0, 36.0, 32.0, 35.0, 30.0, 47.0, 43.0, 37.0, 25.0, 16.0, 16.0, 22.0, 32.0, 29.0, 25.0, 13.0, 19.0, 19.0, 13.0, 13.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.00120544433594, -68.47046661376953, -65.93972778320312, -63.40898132324219, -60.87824249267578, -58.347503662109375, -55.8167610168457, -53.28601837158203, -50.755279541015625, -48.22454071044922, -45.69379806518555, -43.163055419921875, -40.63231658935547, -38.10157775878906, -35.57083511352539, -33.04009246826172, -30.509353637695312, -27.978612899780273, -25.447872161865234, -22.917131423950195, -20.386390686035156, -17.855649948120117, -15.324909210205078, -12.794168472290039, -10.263427734375, -7.732686996459961, -5.201946258544922, -2.671205520629883, -0.14046478271484375, 2.3902759552001953, 4.921016693115234, 7.451757431030273, 9.982498168945312, 12.513238906860352, 15.04397964477539, 17.57472038269043, 20.10546112060547, 22.636201858520508, 25.166942596435547, 27.697683334350586, 30.228424072265625, 32.75916290283203, 35.2899055480957, 37.820648193359375, 40.35138702392578, 42.88212585449219, 45.41286849975586, 47.94361114501953, 50.47434997558594, 53.005088806152344, 55.535831451416016, 58.06657409667969, 60.597312927246094, 63.1280517578125, 65.65879821777344, 68.18953704833984, 70.72027587890625, 73.25101470947266, 75.78175354003906, 78.3125, 80.8432388305664, 83.37397766113281, 85.90472412109375, 88.43546295166016, 90.96620178222656]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 13.0, 12.0, 33.0, 45.0, 48.0, 98.0, 138.0, 221.0, 359.0, 563.0, 902.0, 1481.0, 2628.0, 4351.0, 7403.0, 12356.0, 20591.0, 32709.0, 49522.0, 71373.0, 94656.0, 114484.0, 126217.0, 123884.0, 110439.0, 89238.0, 65739.0, 44464.0, 29236.0, 18173.0, 11061.0, 6502.0, 3881.0, 2134.0, 1374.0, 845.0, 518.0, 312.0, 179.0, 114.0, 90.0, 63.0, 34.0, 20.0, 15.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-45.15625, -43.78271484375, -42.4091796875, -41.03564453125, -39.662109375, -38.28857421875, -36.9150390625, -35.54150390625, -34.16796875, -32.79443359375, -31.4208984375, -30.04736328125, -28.673828125, -27.30029296875, -25.9267578125, -24.55322265625, -23.1796875, -21.80615234375, -20.4326171875, -19.05908203125, -17.685546875, -16.31201171875, -14.9384765625, -13.56494140625, -12.19140625, -10.81787109375, -9.4443359375, -8.07080078125, -6.697265625, -5.32373046875, -3.9501953125, -2.57666015625, -1.203125, 0.17041015625, 1.5439453125, 2.91748046875, 4.291015625, 5.66455078125, 7.0380859375, 8.41162109375, 9.78515625, 11.15869140625, 12.5322265625, 13.90576171875, 15.279296875, 16.65283203125, 18.0263671875, 19.39990234375, 20.7734375, 22.14697265625, 23.5205078125, 24.89404296875, 26.267578125, 27.64111328125, 29.0146484375, 30.38818359375, 31.76171875, 33.13525390625, 34.5087890625, 35.88232421875, 37.255859375, 38.62939453125, 40.0029296875, 41.37646484375, 42.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 8.0, 9.0, 7.0, 15.0, 10.0, 9.0, 17.0, 9.0, 28.0, 31.0, 23.0, 27.0, 28.0, 37.0, 36.0, 42.0, 52.0, 38.0, 40.0, 36.0, 33.0, 35.0, 32.0, 45.0, 42.0, 38.0, 26.0, 16.0, 17.0, 21.0, 29.0, 33.0, 24.0, 13.0, 17.0, 21.0, 13.0, 13.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.5, -68.9501953125, -66.400390625, -63.8505859375, -61.30078125, -58.7509765625, -56.201171875, -53.6513671875, -51.1015625, -48.5517578125, -46.001953125, -43.4521484375, -40.90234375, -38.3525390625, -35.802734375, -33.2529296875, -30.703125, -28.1533203125, -25.603515625, -23.0537109375, -20.50390625, -17.9541015625, -15.404296875, -12.8544921875, -10.3046875, -7.7548828125, -5.205078125, -2.6552734375, -0.10546875, 2.4443359375, 4.994140625, 7.5439453125, 10.09375, 12.6435546875, 15.193359375, 17.7431640625, 20.29296875, 22.8427734375, 25.392578125, 27.9423828125, 30.4921875, 33.0419921875, 35.591796875, 38.1416015625, 40.69140625, 43.2412109375, 45.791015625, 48.3408203125, 50.890625, 53.4404296875, 55.990234375, 58.5400390625, 61.08984375, 63.6396484375, 66.189453125, 68.7392578125, 71.2890625, 73.8388671875, 76.388671875, 78.9384765625, 81.48828125, 84.0380859375, 86.587890625, 89.1376953125, 91.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 6.0, 17.0, 15.0, 28.0, 40.0, 49.0, 85.0, 119.0, 225.0, 299.0, 444.0, 709.0, 1222.0, 1931.0, 3054.0, 5009.0, 8557.0, 14081.0, 23385.0, 37519.0, 57642.0, 82977.0, 110530.0, 129649.0, 135878.0, 125448.0, 102008.0, 74333.0, 50583.0, 32624.0, 19924.0, 11784.0, 7258.0, 4146.0, 2506.0, 1620.0, 1006.0, 664.0, 397.0, 265.0, 176.0, 114.0, 75.0, 37.0, 54.0, 24.0, 11.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0], "bins": [-60.125, -58.3740234375, -56.623046875, -54.8720703125, -53.12109375, -51.3701171875, -49.619140625, -47.8681640625, -46.1171875, -44.3662109375, -42.615234375, -40.8642578125, -39.11328125, -37.3623046875, -35.611328125, -33.8603515625, -32.109375, -30.3583984375, -28.607421875, -26.8564453125, -25.10546875, -23.3544921875, -21.603515625, -19.8525390625, -18.1015625, -16.3505859375, -14.599609375, -12.8486328125, -11.09765625, -9.3466796875, -7.595703125, -5.8447265625, -4.09375, -2.3427734375, -0.591796875, 1.1591796875, 2.91015625, 4.6611328125, 6.412109375, 8.1630859375, 9.9140625, 11.6650390625, 13.416015625, 15.1669921875, 16.91796875, 18.6689453125, 20.419921875, 22.1708984375, 23.921875, 25.6728515625, 27.423828125, 29.1748046875, 30.92578125, 32.6767578125, 34.427734375, 36.1787109375, 37.9296875, 39.6806640625, 41.431640625, 43.1826171875, 44.93359375, 46.6845703125, 48.435546875, 50.1865234375, 51.9375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 3.0, 10.0, 13.0, 6.0, 12.0, 17.0, 19.0, 24.0, 23.0, 28.0, 28.0, 23.0, 39.0, 38.0, 39.0, 44.0, 50.0, 44.0, 44.0, 49.0, 42.0, 47.0, 35.0, 39.0, 28.0, 33.0, 31.0, 34.0, 21.0, 29.0, 28.0, 16.0, 14.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.46875, -50.59521484375, -48.7216796875, -46.84814453125, -44.974609375, -43.10107421875, -41.2275390625, -39.35400390625, -37.48046875, -35.60693359375, -33.7333984375, -31.85986328125, -29.986328125, -28.11279296875, -26.2392578125, -24.36572265625, -22.4921875, -20.61865234375, -18.7451171875, -16.87158203125, -14.998046875, -13.12451171875, -11.2509765625, -9.37744140625, -7.50390625, -5.63037109375, -3.7568359375, -1.88330078125, -0.009765625, 1.86376953125, 3.7373046875, 5.61083984375, 7.484375, 9.35791015625, 11.2314453125, 13.10498046875, 14.978515625, 16.85205078125, 18.7255859375, 20.59912109375, 22.47265625, 24.34619140625, 26.2197265625, 28.09326171875, 29.966796875, 31.84033203125, 33.7138671875, 35.58740234375, 37.4609375, 39.33447265625, 41.2080078125, 43.08154296875, 44.955078125, 46.82861328125, 48.7021484375, 50.57568359375, 52.44921875, 54.32275390625, 56.1962890625, 58.06982421875, 59.943359375, 61.81689453125, 63.6904296875, 65.56396484375, 67.4375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 8.0, 14.0, 22.0, 29.0, 45.0, 60.0, 104.0, 115.0, 185.0, 256.0, 343.0, 422.0, 552.0, 819.0, 1188.0, 1768.0, 2750.0, 4525.0, 8067.0, 14480.0, 25776.0, 44645.0, 70426.0, 101646.0, 129883.0, 145100.0, 140798.0, 119603.0, 89118.0, 59810.0, 36370.0, 20544.0, 11576.0, 6371.0, 3710.0, 2270.0, 1477.0, 957.0, 757.0, 538.0, 425.0, 281.0, 216.0, 132.0, 123.0, 88.0, 58.0, 28.0, 38.0, 14.0, 7.0, 11.0, 3.0, 1.0, 5.0, 1.0, 2.0], "bins": [-20.40625, -19.7841796875, -19.162109375, -18.5400390625, -17.91796875, -17.2958984375, -16.673828125, -16.0517578125, -15.4296875, -14.8076171875, -14.185546875, -13.5634765625, -12.94140625, -12.3193359375, -11.697265625, -11.0751953125, -10.453125, -9.8310546875, -9.208984375, -8.5869140625, -7.96484375, -7.3427734375, -6.720703125, -6.0986328125, -5.4765625, -4.8544921875, -4.232421875, -3.6103515625, -2.98828125, -2.3662109375, -1.744140625, -1.1220703125, -0.5, 0.1220703125, 0.744140625, 1.3662109375, 1.98828125, 2.6103515625, 3.232421875, 3.8544921875, 4.4765625, 5.0986328125, 5.720703125, 6.3427734375, 6.96484375, 7.5869140625, 8.208984375, 8.8310546875, 9.453125, 10.0751953125, 10.697265625, 11.3193359375, 11.94140625, 12.5634765625, 13.185546875, 13.8076171875, 14.4296875, 15.0517578125, 15.673828125, 16.2958984375, 16.91796875, 17.5400390625, 18.162109375, 18.7841796875, 19.40625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 11.0, 13.0, 19.0, 19.0, 37.0, 54.0, 46.0, 60.0, 65.0, 80.0, 69.0, 62.0, 67.0, 64.0, 61.0, 64.0, 47.0, 35.0, 39.0, 23.0, 14.0, 13.0, 10.0, 4.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033588409423828125, -0.003268897533416748, -0.0031789541244506836, -0.003089010715484619, -0.0029990673065185547, -0.0029091238975524902, -0.0028191804885864258, -0.0027292370796203613, -0.002639293670654297, -0.0025493502616882324, -0.002459406852722168, -0.0023694634437561035, -0.002279520034790039, -0.0021895766258239746, -0.00209963321685791, -0.0020096898078918457, -0.0019197463989257812, -0.0018298029899597168, -0.0017398595809936523, -0.0016499161720275879, -0.0015599727630615234, -0.001470029354095459, -0.0013800859451293945, -0.00129014253616333, -0.0012001991271972656, -0.0011102557182312012, -0.0010203123092651367, -0.0009303689002990723, -0.0008404254913330078, -0.0007504820823669434, -0.0006605386734008789, -0.0005705952644348145, -0.00048065185546875, -0.00039070844650268555, -0.0003007650375366211, -0.00021082162857055664, -0.00012087821960449219, -3.0934810638427734e-05, 5.900859832763672e-05, 0.00014895200729370117, 0.00023889541625976562, 0.0003288388252258301, 0.00041878223419189453, 0.000508725643157959, 0.0005986690521240234, 0.0006886124610900879, 0.0007785558700561523, 0.0008684992790222168, 0.0009584426879882812, 0.0010483860969543457, 0.0011383295059204102, 0.0012282729148864746, 0.001318216323852539, 0.0014081597328186035, 0.001498103141784668, 0.0015880465507507324, 0.0016779899597167969, 0.0017679333686828613, 0.0018578767776489258, 0.0019478201866149902, 0.0020377635955810547, 0.002127707004547119, 0.0022176504135131836, 0.002307593822479248, 0.0023975372314453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 6.0, 3.0, 8.0, 22.0, 21.0, 48.0, 42.0, 72.0, 118.0, 162.0, 212.0, 348.0, 457.0, 604.0, 835.0, 1198.0, 1779.0, 2735.0, 4547.0, 7862.0, 13970.0, 24339.0, 40737.0, 63415.0, 90683.0, 116942.0, 135087.0, 136913.0, 122947.0, 98024.0, 70005.0, 45761.0, 28256.0, 16326.0, 9271.0, 5308.0, 3087.0, 1902.0, 1352.0, 881.0, 648.0, 481.0, 345.0, 239.0, 164.0, 130.0, 89.0, 64.0, 43.0, 27.0, 11.0, 19.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-18.515625, -17.901123046875, -17.28662109375, -16.672119140625, -16.0576171875, -15.443115234375, -14.82861328125, -14.214111328125, -13.599609375, -12.985107421875, -12.37060546875, -11.756103515625, -11.1416015625, -10.527099609375, -9.91259765625, -9.298095703125, -8.68359375, -8.069091796875, -7.45458984375, -6.840087890625, -6.2255859375, -5.611083984375, -4.99658203125, -4.382080078125, -3.767578125, -3.153076171875, -2.53857421875, -1.924072265625, -1.3095703125, -0.695068359375, -0.08056640625, 0.533935546875, 1.1484375, 1.762939453125, 2.37744140625, 2.991943359375, 3.6064453125, 4.220947265625, 4.83544921875, 5.449951171875, 6.064453125, 6.678955078125, 7.29345703125, 7.907958984375, 8.5224609375, 9.136962890625, 9.75146484375, 10.365966796875, 10.98046875, 11.594970703125, 12.20947265625, 12.823974609375, 13.4384765625, 14.052978515625, 14.66748046875, 15.281982421875, 15.896484375, 16.510986328125, 17.12548828125, 17.739990234375, 18.3544921875, 18.968994140625, 19.58349609375, 20.197998046875, 20.8125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 4.0, 8.0, 7.0, 8.0, 13.0, 11.0, 23.0, 20.0, 25.0, 29.0, 39.0, 34.0, 45.0, 40.0, 64.0, 48.0, 58.0, 57.0, 43.0, 54.0, 67.0, 35.0, 44.0, 37.0, 40.0, 16.0, 24.0, 21.0, 14.0, 13.0, 18.0, 10.0, 10.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8431396484375, -9.545654296875, -9.2481689453125, -8.95068359375, -8.6531982421875, -8.355712890625, -8.0582275390625, -7.7607421875, -7.4632568359375, -7.165771484375, -6.8682861328125, -6.57080078125, -6.2733154296875, -5.975830078125, -5.6783447265625, -5.380859375, -5.0833740234375, -4.785888671875, -4.4884033203125, -4.19091796875, -3.8934326171875, -3.595947265625, -3.2984619140625, -3.0009765625, -2.7034912109375, -2.406005859375, -2.1085205078125, -1.81103515625, -1.5135498046875, -1.216064453125, -0.9185791015625, -0.62109375, -0.3236083984375, -0.026123046875, 0.2713623046875, 0.56884765625, 0.8663330078125, 1.163818359375, 1.4613037109375, 1.7587890625, 2.0562744140625, 2.353759765625, 2.6512451171875, 2.94873046875, 3.2462158203125, 3.543701171875, 3.8411865234375, 4.138671875, 4.4361572265625, 4.733642578125, 5.0311279296875, 5.32861328125, 5.6260986328125, 5.923583984375, 6.2210693359375, 6.5185546875, 6.8160400390625, 7.113525390625, 7.4110107421875, 7.70849609375, 8.0059814453125, 8.303466796875, 8.6009521484375, 8.8984375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 3.0, 4.0, 3.0, 10.0, 4.0, 15.0, 12.0, 18.0, 17.0, 32.0, 25.0, 25.0, 26.0, 22.0, 39.0, 34.0, 38.0, 36.0, 38.0, 36.0, 43.0, 51.0, 59.0, 47.0, 32.0, 44.0, 43.0, 24.0, 35.0, 19.0, 26.0, 16.0, 21.0, 23.0, 14.0, 10.0, 12.0, 9.0, 5.0, 2.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.5282211303711, -69.32811737060547, -67.12801361083984, -64.92790985107422, -62.727806091308594, -60.52770233154297, -58.32760238647461, -56.127498626708984, -53.92739486694336, -51.727291107177734, -49.52718734741211, -47.327083587646484, -45.126983642578125, -42.9268798828125, -40.726776123046875, -38.52667236328125, -36.326568603515625, -34.12646484375, -31.926361083984375, -29.726259231567383, -27.526155471801758, -25.326051712036133, -23.12594985961914, -20.925846099853516, -18.72574234008789, -16.525638580322266, -14.325535774230957, -12.125432968139648, -9.925329208374023, -7.725225448608398, -5.52512264251709, -3.3250198364257812, -1.124908447265625, 1.0751948356628418, 3.2752981185913086, 5.475401401519775, 7.675504684448242, 9.875608444213867, 12.075711250305176, 14.275814056396484, 16.47591781616211, 18.676021575927734, 20.87612533569336, 23.07622718811035, 25.276330947875977, 27.4764347076416, 29.676536560058594, 31.87664031982422, 34.076744079589844, 36.27684783935547, 38.476951599121094, 40.67705535888672, 42.877159118652344, 45.07726287841797, 47.27736282348633, 49.47746658325195, 51.67757034301758, 53.8776741027832, 56.07777786254883, 58.27788162231445, 60.47798156738281, 62.67808532714844, 64.87818908691406, 67.07829284667969, 69.27839660644531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 9.0, 7.0, 9.0, 9.0, 16.0, 11.0, 19.0, 18.0, 22.0, 21.0, 30.0, 30.0, 39.0, 40.0, 36.0, 35.0, 49.0, 40.0, 34.0, 49.0, 38.0, 35.0, 33.0, 34.0, 28.0, 24.0, 32.0, 32.0, 33.0, 23.0, 22.0, 24.0, 21.0, 20.0, 13.0, 17.0, 12.0, 9.0, 7.0, 1.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-84.74928283691406, -81.69412231445312, -78.63896179199219, -75.58380126953125, -72.52863311767578, -69.47347259521484, -66.4183120727539, -63.36315155029297, -60.307987213134766, -57.25282669067383, -54.197662353515625, -51.14250183105469, -48.08734130859375, -45.03217697143555, -41.97701644897461, -38.921852111816406, -35.86669158935547, -32.81153106689453, -29.756366729736328, -26.70120620727539, -23.64604377746582, -20.59088134765625, -17.535720825195312, -14.480558395385742, -11.425395965576172, -8.370233535766602, -5.315072059631348, -2.2599105834960938, 0.7952518463134766, 3.850414276123047, 6.905574798583984, 9.960737228393555, 13.015907287597656, 16.071069717407227, 19.126232147216797, 22.181392669677734, 25.236555099487305, 28.291717529296875, 31.346878051757812, 34.40203857421875, 37.45720291137695, 40.51236343383789, 43.567527770996094, 46.62268829345703, 49.67784881591797, 52.73301315307617, 55.78817367553711, 58.84333801269531, 61.89849853515625, 64.95365905761719, 68.00881958007812, 71.06398010253906, 74.11914825439453, 77.17430877685547, 80.2294692993164, 83.28462982177734, 86.33979797363281, 89.39495849609375, 92.45011901855469, 95.50527954101562, 98.5604476928711, 101.61560821533203, 104.67076873779297, 107.7259292602539, 110.78108978271484]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 11.0, 15.0, 26.0, 41.0, 44.0, 82.0, 99.0, 124.0, 180.0, 242.0, 325.0, 436.0, 473.0, 701.0, 847.0, 1029.0, 1242.0, 1570.0, 1938.0, 2288.0, 2747.0, 3371.0, 4249.0, 5641.0, 994596.0, 5891.0, 4286.0, 3387.0, 2785.0, 2266.0, 1922.0, 1615.0, 1260.0, 1129.0, 852.0, 712.0, 557.0, 414.0, 313.0, 239.0, 173.0, 152.0, 87.0, 73.0, 55.0, 28.0, 26.0, 20.0, 14.0, 9.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-495.8624267578125, -480.1423645019531, -464.42230224609375, -448.70220947265625, -432.9821472167969, -417.2620849609375, -401.5420227050781, -385.82196044921875, -370.10186767578125, -354.3818054199219, -338.6617431640625, -322.941650390625, -307.2215881347656, -291.50152587890625, -275.7814636230469, -260.0614013671875, -244.34133911132812, -228.62127685546875, -212.9011993408203, -197.18113708496094, -181.4610595703125, -165.74099731445312, -150.02093505859375, -134.30087280273438, -118.58079528808594, -102.86072540283203, -87.14065551757812, -71.42059326171875, -55.700523376464844, -39.98045349121094, -24.260391235351562, -8.540321350097656, 7.179779052734375, 22.89984703063965, 38.61991500854492, 54.33998107910156, 70.06005096435547, 85.78012084960938, 101.50018310546875, 117.22025299072266, 132.94032287597656, 148.66038513183594, 164.38046264648438, 180.10052490234375, 195.82058715820312, 211.54066467285156, 227.26072692871094, 242.98080444335938, 258.70086669921875, 274.4209289550781, 290.1409912109375, 305.861083984375, 321.5811462402344, 337.30120849609375, 353.0212707519531, 368.7413330078125, 384.46142578125, 400.1814880371094, 415.90155029296875, 431.62164306640625, 447.3417053222656, 463.061767578125, 478.7818298339844, 494.50189208984375, 510.2219543457031]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 18.0, 20.0, 34.0, 50.0, 59.0, 73.0, 124.0, 164.0, 245.0, 346.0, 487.0, 820.0, 1239.0, 1885.0, 3142.0, 4977.0, 7765.0, 12327.0, 18030.0, 26170.0, 42549.0, 51196552.0, 66107.0, 28966.0, 20532.0, 13690.0, 9011.0, 5837.0, 3585.0, 2292.0, 1424.0, 918.0, 627.0, 396.0, 292.0, 180.0, 129.0, 70.0, 66.0, 49.0, 38.0, 23.0, 11.0, 7.0, 9.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-599.434326171875, -579.8804321289062, -560.3265380859375, -540.772705078125, -521.2188110351562, -501.6649169921875, -482.11102294921875, -462.5571594238281, -443.0032958984375, -423.44940185546875, -403.8955383300781, -384.3416442871094, -364.78778076171875, -345.23388671875, -325.67999267578125, -306.1261291503906, -286.5722351074219, -267.0183410644531, -247.4644775390625, -227.91058349609375, -208.35671997070312, -188.80282592773438, -169.2489471435547, -149.695068359375, -130.1411895751953, -110.58731079101562, -91.03343200683594, -71.47954559326172, -51.92566680908203, -32.371788024902344, -12.817901611328125, 6.7359771728515625, 26.28985595703125, 45.84373474121094, 65.39761352539062, 84.95149993896484, 104.50537872314453, 124.05925750732422, 143.61314392089844, 163.16702270507812, 182.7209014892578, 202.2747802734375, 221.8286590576172, 241.38253784179688, 260.9364318847656, 280.49029541015625, 300.044189453125, 319.59808349609375, 339.1519470214844, 358.7058410644531, 378.25970458984375, 397.8135986328125, 417.3674621582031, 436.9213562011719, 456.4752197265625, 476.02911376953125, 495.5830078125, 515.1369018554688, 534.6907958984375, 554.24462890625, 573.7985229492188, 593.3524169921875, 612.9063110351562, 632.460205078125, 652.0140380859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 7.0, 1.0, 1.0, 8.0, 10.0, 11.0, 20.0, 24.0, 48.0, 69.0, 108.0, 173.0, 284.0, 431.0, 735.0, 1091.0, 1750.0, 2858.0, 4618.0, 8526.0, 17308.0, 39639.0, 110908.0, 411868.0, 3793350.0, 1497197.0, 261097.0, 78517.0, 29888.0, 13573.0, 6803.0, 3982.0, 2352.0, 1507.0, 986.0, 653.0, 368.0, 226.0, 162.0, 102.0, 60.0, 41.0, 28.0, 13.0, 5.0, 5.0, 11.0, 3.0, 3.0, 0.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-40.78125, -39.458984375, -38.13671875, -36.814453125, -35.4921875, -34.169921875, -32.84765625, -31.525390625, -30.203125, -28.880859375, -27.55859375, -26.236328125, -24.9140625, -23.591796875, -22.26953125, -20.947265625, -19.625, -18.302734375, -16.98046875, -15.658203125, -14.3359375, -13.013671875, -11.69140625, -10.369140625, -9.046875, -7.724609375, -6.40234375, -5.080078125, -3.7578125, -2.435546875, -1.11328125, 0.208984375, 1.53125, 2.853515625, 4.17578125, 5.498046875, 6.8203125, 8.142578125, 9.46484375, 10.787109375, 12.109375, 13.431640625, 14.75390625, 16.076171875, 17.3984375, 18.720703125, 20.04296875, 21.365234375, 22.6875, 24.009765625, 25.33203125, 26.654296875, 27.9765625, 29.298828125, 30.62109375, 31.943359375, 33.265625, 34.587890625, 35.91015625, 37.232421875, 38.5546875, 39.876953125, 41.19921875, 42.521484375, 43.84375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 12.0, 11.0, 21.0, 20.0, 29.0, 31.0, 34.0, 48.0, 61.0, 74.0, 105.0, 505.0, 612.0, 70.0, 52.0, 64.0, 56.0, 35.0, 45.0, 23.0, 18.0, 24.0, 14.0, 9.0, 4.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-90.625, -87.89453125, -85.1640625, -82.43359375, -79.703125, -76.97265625, -74.2421875, -71.51171875, -68.78125, -66.05078125, -63.3203125, -60.58984375, -57.859375, -55.12890625, -52.3984375, -49.66796875, -46.9375, -44.20703125, -41.4765625, -38.74609375, -36.015625, -33.28515625, -30.5546875, -27.82421875, -25.09375, -22.36328125, -19.6328125, -16.90234375, -14.171875, -11.44140625, -8.7109375, -5.98046875, -3.25, -0.51953125, 2.2109375, 4.94140625, 7.671875, 10.40234375, 13.1328125, 15.86328125, 18.59375, 21.32421875, 24.0546875, 26.78515625, 29.515625, 32.24609375, 34.9765625, 37.70703125, 40.4375, 43.16796875, 45.8984375, 48.62890625, 51.359375, 54.08984375, 56.8203125, 59.55078125, 62.28125, 65.01171875, 67.7421875, 70.47265625, 73.203125, 75.93359375, 78.6640625, 81.39453125, 84.125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 16.0, 17.0, 9.0, 20.0, 39.0, 33.0, 74.0, 142.0, 167.0, 249.0, 389.0, 589.0, 862.0, 1364.0, 2196.0, 3572.0, 6028.0, 10366.0, 19822.0, 39430.0, 96816.0, 305577.0, 3329677.0, 2035878.0, 271290.0, 87153.0, 36944.0, 17849.0, 9913.0, 5460.0, 3437.0, 2107.0, 1398.0, 891.0, 543.0, 324.0, 270.0, 140.0, 110.0, 82.0, 59.0, 36.0, 32.0, 11.0, 13.0, 19.0, 10.0, 1.0, 8.0, 1.0, 0.0, 3.0], "bins": [-50.65625, -49.20703125, -47.7578125, -46.30859375, -44.859375, -43.41015625, -41.9609375, -40.51171875, -39.0625, -37.61328125, -36.1640625, -34.71484375, -33.265625, -31.81640625, -30.3671875, -28.91796875, -27.46875, -26.01953125, -24.5703125, -23.12109375, -21.671875, -20.22265625, -18.7734375, -17.32421875, -15.875, -14.42578125, -12.9765625, -11.52734375, -10.078125, -8.62890625, -7.1796875, -5.73046875, -4.28125, -2.83203125, -1.3828125, 0.06640625, 1.515625, 2.96484375, 4.4140625, 5.86328125, 7.3125, 8.76171875, 10.2109375, 11.66015625, 13.109375, 14.55859375, 16.0078125, 17.45703125, 18.90625, 20.35546875, 21.8046875, 23.25390625, 24.703125, 26.15234375, 27.6015625, 29.05078125, 30.5, 31.94921875, 33.3984375, 34.84765625, 36.296875, 37.74609375, 39.1953125, 40.64453125, 42.09375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 6.0, 6.0, 8.0, 24.0, 27.0, 34.0, 44.0, 50.0, 74.0, 144.0, 303.0, 772.0, 98.0, 65.0, 66.0, 52.0, 42.0, 41.0, 34.0, 20.0, 18.0, 14.0, 10.0, 7.0, 4.0, 5.0, 3.0, 8.0, 2.0, 5.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-114.0625, -111.1025390625, -108.142578125, -105.1826171875, -102.22265625, -99.2626953125, -96.302734375, -93.3427734375, -90.3828125, -87.4228515625, -84.462890625, -81.5029296875, -78.54296875, -75.5830078125, -72.623046875, -69.6630859375, -66.703125, -63.7431640625, -60.783203125, -57.8232421875, -54.86328125, -51.9033203125, -48.943359375, -45.9833984375, -43.0234375, -40.0634765625, -37.103515625, -34.1435546875, -31.18359375, -28.2236328125, -25.263671875, -22.3037109375, -19.34375, -16.3837890625, -13.423828125, -10.4638671875, -7.50390625, -4.5439453125, -1.583984375, 1.3759765625, 4.3359375, 7.2958984375, 10.255859375, 13.2158203125, 16.17578125, 19.1357421875, 22.095703125, 25.0556640625, 28.015625, 30.9755859375, 33.935546875, 36.8955078125, 39.85546875, 42.8154296875, 45.775390625, 48.7353515625, 51.6953125, 54.6552734375, 57.615234375, 60.5751953125, 63.53515625, 66.4951171875, 69.455078125, 72.4150390625, 75.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 4.0, 8.0, 9.0, 2.0, 15.0, 29.0, 27.0, 55.0, 55.0, 61.0, 91.0, 113.0, 141.0, 236.0, 310.0, 407.0, 548.0, 948.0, 1373.0, 2738.0, 5470.0, 12728.0, 42875.0, 6003571.0, 174487.0, 25552.0, 9242.0, 4272.0, 2240.0, 1236.0, 738.0, 488.0, 338.0, 255.0, 183.0, 165.0, 111.0, 95.0, 46.0, 45.0, 41.0, 19.0, 26.0, 14.0, 16.0, 9.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 7.0], "bins": [-422.0, -409.51953125, -397.0390625, -384.55859375, -372.078125, -359.59765625, -347.1171875, -334.63671875, -322.15625, -309.67578125, -297.1953125, -284.71484375, -272.234375, -259.75390625, -247.2734375, -234.79296875, -222.3125, -209.83203125, -197.3515625, -184.87109375, -172.390625, -159.91015625, -147.4296875, -134.94921875, -122.46875, -109.98828125, -97.5078125, -85.02734375, -72.546875, -60.06640625, -47.5859375, -35.10546875, -22.625, -10.14453125, 2.3359375, 14.81640625, 27.296875, 39.77734375, 52.2578125, 64.73828125, 77.21875, 89.69921875, 102.1796875, 114.66015625, 127.140625, 139.62109375, 152.1015625, 164.58203125, 177.0625, 189.54296875, 202.0234375, 214.50390625, 226.984375, 239.46484375, 251.9453125, 264.42578125, 276.90625, 289.38671875, 301.8671875, 314.34765625, 326.828125, 339.30859375, 351.7890625, 364.26953125, 376.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 5.0, 4.0, 5.0, 10.0, 7.0, 14.0, 19.0, 23.0, 32.0, 54.0, 48.0, 118.0, 257.0, 852.0, 181.0, 85.0, 58.0, 48.0, 34.0, 33.0, 23.0, 16.0, 11.0, 12.0, 15.0, 9.0, 6.0, 3.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.875, -144.45703125, -140.0390625, -135.62109375, -131.203125, -126.78515625, -122.3671875, -117.94921875, -113.53125, -109.11328125, -104.6953125, -100.27734375, -95.859375, -91.44140625, -87.0234375, -82.60546875, -78.1875, -73.76953125, -69.3515625, -64.93359375, -60.515625, -56.09765625, -51.6796875, -47.26171875, -42.84375, -38.42578125, -34.0078125, -29.58984375, -25.171875, -20.75390625, -16.3359375, -11.91796875, -7.5, -3.08203125, 1.3359375, 5.75390625, 10.171875, 14.58984375, 19.0078125, 23.42578125, 27.84375, 32.26171875, 36.6796875, 41.09765625, 45.515625, 49.93359375, 54.3515625, 58.76953125, 63.1875, 67.60546875, 72.0234375, 76.44140625, 80.859375, 85.27734375, 89.6953125, 94.11328125, 98.53125, 102.94921875, 107.3671875, 111.78515625, 116.203125, 120.62109375, 125.0390625, 129.45703125, 133.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 9.0, 17.0, 42.0, 861.0, 67.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3959.149169921875, -3884.03173828125, -3808.91455078125, -3733.797119140625, -3658.6796875, -3583.5625, -3508.445068359375, -3433.32763671875, -3358.21044921875, -3283.093017578125, -3207.975830078125, -3132.8583984375, -3057.740966796875, -2982.62353515625, -2907.50634765625, -2832.388916015625, -2757.271484375, -2682.154052734375, -2607.036865234375, -2531.91943359375, -2456.802001953125, -2381.6845703125, -2306.5673828125, -2231.449951171875, -2156.33251953125, -2081.215087890625, -2006.0977783203125, -1930.98046875, -1855.863037109375, -1780.7457275390625, -1705.62841796875, -1630.510986328125, -1555.39404296875, -1480.2767333984375, -1405.1593017578125, -1330.0419921875, -1254.924560546875, -1179.8072509765625, -1104.68994140625, -1029.572509765625, -954.4552001953125, -879.3378295898438, -804.220458984375, -729.1031494140625, -653.9857788085938, -578.868408203125, -503.7510681152344, -428.63372802734375, -353.516357421875, -278.39898681640625, -203.28164672851562, -128.16429138183594, -53.04693603515625, 22.0704345703125, 97.18777465820312, 172.30511474609375, 247.4224853515625, 322.53985595703125, 397.6571960449219, 472.7745361328125, 547.8919067382812, 623.00927734375, 698.1265869140625, 773.2439575195312, 848.361328125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 27.0, 51.0, 688.0, 151.0, 39.0, 15.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2278.950927734375, -2220.281494140625, -2161.6123046875, -2102.94287109375, -2044.2735595703125, -1985.604248046875, -1926.9349365234375, -1868.265625, -1809.5963134765625, -1750.927001953125, -1692.2576904296875, -1633.58837890625, -1574.9189453125, -1516.2496337890625, -1457.580322265625, -1398.9110107421875, -1340.24169921875, -1281.5723876953125, -1222.903076171875, -1164.233642578125, -1105.5643310546875, -1046.89501953125, -988.2257080078125, -929.556396484375, -870.886962890625, -812.2176513671875, -753.5482788085938, -694.8789672851562, -636.2096557617188, -577.540283203125, -518.8709716796875, -460.20166015625, -401.5323486328125, -342.8630065917969, -284.1936950683594, -225.52435302734375, -166.8550262451172, -108.18569946289062, -49.516357421875, 9.1529541015625, 67.82229614257812, 126.49162292480469, 185.16094970703125, 243.83029174804688, 302.4996337890625, 361.1689453125, 419.8382873535156, 478.5075988769531, 537.1769409179688, 595.8462524414062, 654.515625, 713.1849365234375, 771.854248046875, 830.5235595703125, 889.1929321289062, 947.8622436523438, 1006.5316162109375, 1065.200927734375, 1123.8702392578125, 1182.53955078125, 1241.208984375, 1299.8782958984375, 1358.547607421875, 1417.2169189453125, 1475.88623046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 17.0, 24.0, 23.0, 44.0, 64.0, 88.0, 127.0, 225.0, 359.0, 659.0, 1198.0, 2312.0, 5002.0, 11945.0, 40487.0, 1291569.0, 2767123.0, 47157.0, 13679.0, 5673.0, 2648.0, 1379.0, 757.0, 522.0, 312.0, 211.0, 145.0, 117.0, 93.0, 62.0, 55.0, 36.0, 38.0, 32.0, 21.0, 10.0, 11.0, 11.0, 11.0, 9.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.02508544921875, -3.8704833984375, -3.71588134765625, -3.561279296875, -3.40667724609375, -3.2520751953125, -3.09747314453125, -2.94287109375, -2.78826904296875, -2.6336669921875, -2.47906494140625, -2.324462890625, -2.16986083984375, -2.0152587890625, -1.86065673828125, -1.7060546875, -1.55145263671875, -1.3968505859375, -1.24224853515625, -1.087646484375, -0.93304443359375, -0.7784423828125, -0.62384033203125, -0.46923828125, -0.31463623046875, -0.1600341796875, -0.00543212890625, 0.149169921875, 0.30377197265625, 0.4583740234375, 0.61297607421875, 0.767578125, 0.92218017578125, 1.0767822265625, 1.23138427734375, 1.385986328125, 1.54058837890625, 1.6951904296875, 1.84979248046875, 2.00439453125, 2.15899658203125, 2.3135986328125, 2.46820068359375, 2.622802734375, 2.77740478515625, 2.9320068359375, 3.08660888671875, 3.2412109375, 3.39581298828125, 3.5504150390625, 3.70501708984375, 3.859619140625, 4.01422119140625, 4.1688232421875, 4.32342529296875, 4.47802734375, 4.63262939453125, 4.7872314453125, 4.94183349609375, 5.096435546875, 5.25103759765625, 5.4056396484375, 5.56024169921875, 5.71484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 8.0, 4.0, 3.0, 8.0, 10.0, 6.0, 36.0, 80.0, 206.0, 279.0, 207.0, 75.0, 31.0, 13.0, 4.0, 7.0, 9.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.17100906372070312, -0.16501617431640625, -0.15902328491210938, -0.1530303955078125, -0.14703750610351562, -0.14104461669921875, -0.13505172729492188, -0.129058837890625, -0.12306594848632812, -0.11707305908203125, -0.11108016967773438, -0.1050872802734375, -0.09909439086914062, -0.09310150146484375, -0.08710861206054688, -0.08111572265625, -0.07512283325195312, -0.06912994384765625, -0.06313705444335938, -0.0571441650390625, -0.051151275634765625, -0.04515838623046875, -0.039165496826171875, -0.033172607421875, -0.027179718017578125, -0.02118682861328125, -0.015193939208984375, -0.0092010498046875, -0.003208160400390625, 0.00278472900390625, 0.008777618408203125, 0.0147705078125, 0.020763397216796875, 0.02675628662109375, 0.032749176025390625, 0.0387420654296875, 0.044734954833984375, 0.05072784423828125, 0.056720733642578125, 0.062713623046875, 0.06870651245117188, 0.07469940185546875, 0.08069229125976562, 0.0866851806640625, 0.09267807006835938, 0.09867095947265625, 0.10466384887695312, 0.11065673828125, 0.11664962768554688, 0.12264251708984375, 0.12863540649414062, 0.1346282958984375, 0.14062118530273438, 0.14661407470703125, 0.15260696411132812, 0.158599853515625, 0.16459274291992188, 0.17058563232421875, 0.17657852172851562, 0.1825714111328125, 0.18856430053710938, 0.19455718994140625, 0.20055007934570312, 0.20654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 12.0, 10.0, 8.0, 11.0, 29.0, 22.0, 32.0, 61.0, 83.0, 126.0, 154.0, 229.0, 327.0, 494.0, 790.0, 1464.0, 2851.0, 6299.0, 16156.0, 52058.0, 227243.0, 2506835.0, 1168747.0, 150435.0, 37185.0, 12109.0, 4978.0, 2249.0, 1177.0, 686.0, 438.0, 272.0, 177.0, 120.0, 102.0, 85.0, 50.0, 42.0, 29.0, 24.0, 15.0, 18.0, 10.0, 5.0, 9.0, 8.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.201171875, -3.097503662109375, -2.99383544921875, -2.890167236328125, -2.7864990234375, -2.682830810546875, -2.57916259765625, -2.475494384765625, -2.371826171875, -2.268157958984375, -2.16448974609375, -2.060821533203125, -1.9571533203125, -1.853485107421875, -1.74981689453125, -1.646148681640625, -1.54248046875, -1.438812255859375, -1.33514404296875, -1.231475830078125, -1.1278076171875, -1.024139404296875, -0.92047119140625, -0.816802978515625, -0.713134765625, -0.609466552734375, -0.50579833984375, -0.402130126953125, -0.2984619140625, -0.194793701171875, -0.09112548828125, 0.012542724609375, 0.1162109375, 0.219879150390625, 0.32354736328125, 0.427215576171875, 0.5308837890625, 0.634552001953125, 0.73822021484375, 0.841888427734375, 0.945556640625, 1.049224853515625, 1.15289306640625, 1.256561279296875, 1.3602294921875, 1.463897705078125, 1.56756591796875, 1.671234130859375, 1.77490234375, 1.878570556640625, 1.98223876953125, 2.085906982421875, 2.1895751953125, 2.293243408203125, 2.39691162109375, 2.500579833984375, 2.604248046875, 2.707916259765625, 2.81158447265625, 2.915252685546875, 3.0189208984375, 3.122589111328125, 3.22625732421875, 3.329925537109375, 3.43359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 8.0, 11.0, 13.0, 13.0, 18.0, 31.0, 35.0, 34.0, 58.0, 60.0, 61.0, 76.0, 85.0, 136.0, 156.0, 215.0, 282.0, 325.0, 476.0, 473.0, 356.0, 211.0, 194.0, 143.0, 120.0, 82.0, 83.0, 61.0, 48.0, 46.0, 24.0, 24.0, 18.0, 19.0, 22.0, 14.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.48291015625, -0.4691123962402344, -0.45531463623046875, -0.4415168762207031, -0.4277191162109375, -0.4139213562011719, -0.40012359619140625, -0.3863258361816406, -0.372528076171875, -0.3587303161621094, -0.34493255615234375, -0.3311347961425781, -0.3173370361328125, -0.3035392761230469, -0.28974151611328125, -0.2759437561035156, -0.26214599609375, -0.24834823608398438, -0.23455047607421875, -0.22075271606445312, -0.2069549560546875, -0.19315719604492188, -0.17935943603515625, -0.16556167602539062, -0.151763916015625, -0.13796615600585938, -0.12416839599609375, -0.11037063598632812, -0.0965728759765625, -0.08277511596679688, -0.06897735595703125, -0.055179595947265625, -0.0413818359375, -0.027584075927734375, -0.01378631591796875, 1.1444091796875e-05, 0.0138092041015625, 0.027606964111328125, 0.04140472412109375, 0.055202484130859375, 0.069000244140625, 0.08279800415039062, 0.09659576416015625, 0.11039352416992188, 0.1241912841796875, 0.13798904418945312, 0.15178680419921875, 0.16558456420898438, 0.17938232421875, 0.19318008422851562, 0.20697784423828125, 0.22077560424804688, 0.2345733642578125, 0.24837112426757812, 0.26216888427734375, 0.2759666442871094, 0.289764404296875, 0.3035621643066406, 0.31735992431640625, 0.3311576843261719, 0.3449554443359375, 0.3587532043457031, 0.37255096435546875, 0.3863487243652344, 0.400146484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 8.0, 13.0, 33.0, 50.0, 99.0, 219.0, 271.0, 168.0, 73.0, 37.0, 16.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.067535400390625, -23.549304962158203, -23.031076431274414, -22.512845993041992, -21.99461555480957, -21.47638511657715, -20.95815658569336, -20.439926147460938, -19.921695709228516, -19.403465270996094, -18.885236740112305, -18.367006301879883, -17.84877586364746, -17.33054542541504, -16.81231689453125, -16.294086456298828, -15.775856971740723, -15.257627487182617, -14.739397048950195, -14.22116756439209, -13.702937126159668, -13.184707641601562, -12.66647720336914, -12.148247718811035, -11.63001823425293, -11.111788749694824, -10.593558311462402, -10.075328826904297, -9.557098388671875, -9.03886890411377, -8.520639419555664, -8.002408981323242, -7.48417854309082, -6.965948581695557, -6.447718620300293, -5.9294891357421875, -5.411258697509766, -4.89302921295166, -4.3747992515563965, -3.856569290161133, -3.338339328765869, -2.8201093673706055, -2.301879405975342, -1.7836496829986572, -1.2654197216033936, -0.7471897602081299, -0.2289600372314453, 0.28926992416381836, 0.807499885559082, 1.3257298469543457, 1.8439596891403198, 2.362189531326294, 2.8804194927215576, 3.3986494541168213, 3.916879177093506, 4.4351091384887695, 4.953339099884033, 5.471569061279297, 5.9897990226745605, 6.508028984069824, 7.02625846862793, 7.544488906860352, 8.062718391418457, 8.580947875976562, 9.099178314208984]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 11.0, 7.0, 8.0, 12.0, 16.0, 11.0, 13.0, 29.0, 25.0, 32.0, 45.0, 54.0, 55.0, 67.0, 55.0, 61.0, 62.0, 55.0, 56.0, 41.0, 49.0, 42.0, 28.0, 42.0, 30.0, 18.0, 14.0, 14.0, 9.0, 14.0, 9.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.718758583068848, -4.580657482147217, -4.442555904388428, -4.304454803466797, -4.166353702545166, -4.028252601623535, -3.890151023864746, -3.7520499229431152, -3.6139485836029053, -3.4758472442626953, -3.3377461433410645, -3.1996448040008545, -3.0615434646606445, -2.9234423637390137, -2.7853410243988037, -2.6472396850585938, -2.509138584136963, -2.371037244796753, -2.232936143875122, -2.094834804534912, -1.9567335844039917, -1.8186323642730713, -1.6805310249328613, -1.542429804801941, -1.4043285846710205, -1.2662273645401, -1.1281261444091797, -0.9900248050689697, -0.8519235849380493, -0.7138223648071289, -0.5757210850715637, -0.43761980533599854, -0.2995185852050781, -0.16141733527183533, -0.02331608533859253, 0.11478516459465027, 0.25288641452789307, 0.3909876346588135, 0.5290889143943787, 0.6671901941299438, 0.8052914142608643, 0.9433926343917847, 1.081493854522705, 1.219595193862915, 1.3576964139938354, 1.4957976341247559, 1.6338989734649658, 1.7720001935958862, 1.9101014137268066, 2.0482027530670166, 2.1863038539886475, 2.3244051933288574, 2.4625062942504883, 2.6006076335906982, 2.738708972930908, 2.876810073852539, 3.014911413192749, 3.153012752532959, 3.29111385345459, 3.4292151927948, 3.5673165321350098, 3.7054176330566406, 3.8435189723968506, 3.9816203117370605, 4.119721412658691]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 11.0, 14.0, 12.0, 19.0, 32.0, 41.0, 56.0, 63.0, 84.0, 93.0, 164.0, 246.0, 335.0, 594.0, 941.0, 1822.0, 3487.0, 8193.0, 25382.0, 177891.0, 720587.0, 79456.0, 16499.0, 6021.0, 2696.0, 1421.0, 845.0, 483.0, 308.0, 201.0, 136.0, 104.0, 77.0, 65.0, 36.0, 21.0, 28.0, 16.0, 16.0, 13.0, 5.0, 11.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.240234375, -3.1400146484375, -3.039794921875, -2.9395751953125, -2.83935546875, -2.7391357421875, -2.638916015625, -2.5386962890625, -2.4384765625, -2.3382568359375, -2.238037109375, -2.1378173828125, -2.03759765625, -1.9373779296875, -1.837158203125, -1.7369384765625, -1.63671875, -1.5364990234375, -1.436279296875, -1.3360595703125, -1.23583984375, -1.1356201171875, -1.035400390625, -0.9351806640625, -0.8349609375, -0.7347412109375, -0.634521484375, -0.5343017578125, -0.43408203125, -0.3338623046875, -0.233642578125, -0.1334228515625, -0.033203125, 0.0670166015625, 0.167236328125, 0.2674560546875, 0.36767578125, 0.4678955078125, 0.568115234375, 0.6683349609375, 0.7685546875, 0.8687744140625, 0.968994140625, 1.0692138671875, 1.16943359375, 1.2696533203125, 1.369873046875, 1.4700927734375, 1.5703125, 1.6705322265625, 1.770751953125, 1.8709716796875, 1.97119140625, 2.0714111328125, 2.171630859375, 2.2718505859375, 2.3720703125, 2.4722900390625, 2.572509765625, 2.6727294921875, 2.77294921875, 2.8731689453125, 2.973388671875, 3.0736083984375, 3.173828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 9.0, 9.0, 17.0, 20.0, 29.0, 52.0, 76.0, 119.0, 135.0, 147.0, 96.0, 90.0, 59.0, 54.0, 23.0, 12.0, 12.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.2037372589111328, -0.19739151000976562, -0.19104576110839844, -0.18470001220703125, -0.17835426330566406, -0.17200851440429688, -0.1656627655029297, -0.1593170166015625, -0.1529712677001953, -0.14662551879882812, -0.14027976989746094, -0.13393402099609375, -0.12758827209472656, -0.12124252319335938, -0.11489677429199219, -0.108551025390625, -0.10220527648925781, -0.09585952758789062, -0.08951377868652344, -0.08316802978515625, -0.07682228088378906, -0.07047653198242188, -0.06413078308105469, -0.0577850341796875, -0.05143928527832031, -0.045093536376953125, -0.03874778747558594, -0.03240203857421875, -0.026056289672851562, -0.019710540771484375, -0.013364791870117188, -0.00701904296875, -0.0006732940673828125, 0.005672454833984375, 0.012018203735351562, 0.01836395263671875, 0.024709701538085938, 0.031055450439453125, 0.03740119934082031, 0.0437469482421875, 0.05009269714355469, 0.056438446044921875, 0.06278419494628906, 0.06912994384765625, 0.07547569274902344, 0.08182144165039062, 0.08816719055175781, 0.094512939453125, 0.10085868835449219, 0.10720443725585938, 0.11355018615722656, 0.11989593505859375, 0.12624168395996094, 0.13258743286132812, 0.1389331817626953, 0.1452789306640625, 0.1516246795654297, 0.15797042846679688, 0.16431617736816406, 0.17066192626953125, 0.17700767517089844, 0.18335342407226562, 0.1896991729736328, 0.196044921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 9.0, 5.0, 4.0, 12.0, 21.0, 31.0, 40.0, 60.0, 117.0, 214.0, 393.0, 751.0, 1576.0, 3687.0, 10306.0, 44084.0, 548713.0, 387317.0, 36006.0, 8959.0, 3254.0, 1440.0, 706.0, 328.0, 197.0, 109.0, 66.0, 51.0, 31.0, 20.0, 13.0, 8.0, 5.0, 8.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.25628662109375, -4.1141357421875, -3.97198486328125, -3.829833984375, -3.68768310546875, -3.5455322265625, -3.40338134765625, -3.26123046875, -3.11907958984375, -2.9769287109375, -2.83477783203125, -2.692626953125, -2.55047607421875, -2.4083251953125, -2.26617431640625, -2.1240234375, -1.98187255859375, -1.8397216796875, -1.69757080078125, -1.555419921875, -1.41326904296875, -1.2711181640625, -1.12896728515625, -0.98681640625, -0.84466552734375, -0.7025146484375, -0.56036376953125, -0.418212890625, -0.27606201171875, -0.1339111328125, 0.00823974609375, 0.150390625, 0.29254150390625, 0.4346923828125, 0.57684326171875, 0.718994140625, 0.86114501953125, 1.0032958984375, 1.14544677734375, 1.28759765625, 1.42974853515625, 1.5718994140625, 1.71405029296875, 1.856201171875, 1.99835205078125, 2.1405029296875, 2.28265380859375, 2.4248046875, 2.56695556640625, 2.7091064453125, 2.85125732421875, 2.993408203125, 3.13555908203125, 3.2777099609375, 3.41986083984375, 3.56201171875, 3.70416259765625, 3.8463134765625, 3.98846435546875, 4.130615234375, 4.27276611328125, 4.4149169921875, 4.55706787109375, 4.69921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 12.0, 12.0, 8.0, 14.0, 14.0, 24.0, 16.0, 20.0, 22.0, 35.0, 38.0, 39.0, 34.0, 28.0, 37.0, 40.0, 51.0, 45.0, 49.0, 40.0, 36.0, 29.0, 43.0, 40.0, 31.0, 37.0, 29.0, 28.0, 15.0, 22.0, 15.0, 14.0, 11.0, 16.0, 5.0, 6.0, 9.0, 9.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8466796875, -0.8201828002929688, -0.7936859130859375, -0.7671890258789062, -0.740692138671875, -0.7141952514648438, -0.6876983642578125, -0.6612014770507812, -0.63470458984375, -0.6082077026367188, -0.5817108154296875, -0.5552139282226562, -0.528717041015625, -0.5022201538085938, -0.4757232666015625, -0.44922637939453125, -0.4227294921875, -0.39623260498046875, -0.3697357177734375, -0.34323883056640625, -0.316741943359375, -0.29024505615234375, -0.2637481689453125, -0.23725128173828125, -0.21075439453125, -0.18425750732421875, -0.1577606201171875, -0.13126373291015625, -0.104766845703125, -0.07826995849609375, -0.0517730712890625, -0.02527618408203125, 0.001220703125, 0.02771759033203125, 0.0542144775390625, 0.08071136474609375, 0.107208251953125, 0.13370513916015625, 0.1602020263671875, 0.18669891357421875, 0.21319580078125, 0.23969268798828125, 0.2661895751953125, 0.29268646240234375, 0.319183349609375, 0.34568023681640625, 0.3721771240234375, 0.39867401123046875, 0.4251708984375, 0.45166778564453125, 0.4781646728515625, 0.5046615600585938, 0.531158447265625, 0.5576553344726562, 0.5841522216796875, 0.6106491088867188, 0.63714599609375, 0.6636428833007812, 0.6901397705078125, 0.7166366577148438, 0.743133544921875, 0.7696304321289062, 0.7961273193359375, 0.8226242065429688, 0.84912109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 7.0, 17.0, 15.0, 21.0, 35.0, 34.0, 61.0, 79.0, 108.0, 215.0, 306.0, 615.0, 1232.0, 3106.0, 11390.0, 85169.0, 862275.0, 68363.0, 10091.0, 2811.0, 1159.0, 564.0, 300.0, 165.0, 128.0, 63.0, 58.0, 37.0, 35.0, 19.0, 19.0, 12.0, 11.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5703125, -7.32177734375, -7.0732421875, -6.82470703125, -6.576171875, -6.32763671875, -6.0791015625, -5.83056640625, -5.58203125, -5.33349609375, -5.0849609375, -4.83642578125, -4.587890625, -4.33935546875, -4.0908203125, -3.84228515625, -3.59375, -3.34521484375, -3.0966796875, -2.84814453125, -2.599609375, -2.35107421875, -2.1025390625, -1.85400390625, -1.60546875, -1.35693359375, -1.1083984375, -0.85986328125, -0.611328125, -0.36279296875, -0.1142578125, 0.13427734375, 0.3828125, 0.63134765625, 0.8798828125, 1.12841796875, 1.376953125, 1.62548828125, 1.8740234375, 2.12255859375, 2.37109375, 2.61962890625, 2.8681640625, 3.11669921875, 3.365234375, 3.61376953125, 3.8623046875, 4.11083984375, 4.359375, 4.60791015625, 4.8564453125, 5.10498046875, 5.353515625, 5.60205078125, 5.8505859375, 6.09912109375, 6.34765625, 6.59619140625, 6.8447265625, 7.09326171875, 7.341796875, 7.59033203125, 7.8388671875, 8.08740234375, 8.3359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 11.0, 15.0, 24.0, 38.0, 130.0, 491.0, 165.0, 43.0, 20.0, 17.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00244140625, -0.002337813377380371, -0.002234220504760742, -0.0021306276321411133, -0.0020270347595214844, -0.0019234418869018555, -0.0018198490142822266, -0.0017162561416625977, -0.0016126632690429688, -0.0015090703964233398, -0.001405477523803711, -0.001301884651184082, -0.0011982917785644531, -0.0010946989059448242, -0.0009911060333251953, -0.0008875131607055664, -0.0007839202880859375, -0.0006803274154663086, -0.0005767345428466797, -0.0004731416702270508, -0.0003695487976074219, -0.00026595592498779297, -0.00016236305236816406, -5.8770179748535156e-05, 4.482269287109375e-05, 0.00014841556549072266, 0.00025200843811035156, 0.00035560131072998047, 0.0004591941833496094, 0.0005627870559692383, 0.0006663799285888672, 0.0007699728012084961, 0.000873565673828125, 0.000977158546447754, 0.0010807514190673828, 0.0011843442916870117, 0.0012879371643066406, 0.0013915300369262695, 0.0014951229095458984, 0.0015987157821655273, 0.0017023086547851562, 0.0018059015274047852, 0.001909494400024414, 0.002013087272644043, 0.002116680145263672, 0.0022202730178833008, 0.0023238658905029297, 0.0024274587631225586, 0.0025310516357421875, 0.0026346445083618164, 0.0027382373809814453, 0.0028418302536010742, 0.002945423126220703, 0.003049015998840332, 0.003152608871459961, 0.00325620174407959, 0.0033597946166992188, 0.0034633874893188477, 0.0035669803619384766, 0.0036705732345581055, 0.0037741661071777344, 0.0038777589797973633, 0.003981351852416992, 0.004084944725036621, 0.00418853759765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 5.0, 7.0, 12.0, 22.0, 27.0, 42.0, 62.0, 141.0, 251.0, 552.0, 1434.0, 4539.0, 25935.0, 885623.0, 116364.0, 9514.0, 2383.0, 829.0, 345.0, 195.0, 94.0, 73.0, 33.0, 23.0, 13.0, 17.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.4639892578125, -13.076416015625, -12.6888427734375, -12.30126953125, -11.9136962890625, -11.526123046875, -11.1385498046875, -10.7509765625, -10.3634033203125, -9.975830078125, -9.5882568359375, -9.20068359375, -8.8131103515625, -8.425537109375, -8.0379638671875, -7.650390625, -7.2628173828125, -6.875244140625, -6.4876708984375, -6.10009765625, -5.7125244140625, -5.324951171875, -4.9373779296875, -4.5498046875, -4.1622314453125, -3.774658203125, -3.3870849609375, -2.99951171875, -2.6119384765625, -2.224365234375, -1.8367919921875, -1.44921875, -1.0616455078125, -0.674072265625, -0.2864990234375, 0.10107421875, 0.4886474609375, 0.876220703125, 1.2637939453125, 1.6513671875, 2.0389404296875, 2.426513671875, 2.8140869140625, 3.20166015625, 3.5892333984375, 3.976806640625, 4.3643798828125, 4.751953125, 5.1395263671875, 5.527099609375, 5.9146728515625, 6.30224609375, 6.6898193359375, 7.077392578125, 7.4649658203125, 7.8525390625, 8.2401123046875, 8.627685546875, 9.0152587890625, 9.40283203125, 9.7904052734375, 10.177978515625, 10.5655517578125, 10.953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 14.0, 24.0, 37.0, 49.0, 59.0, 100.0, 127.0, 159.0, 118.0, 89.0, 68.0, 46.0, 39.0, 23.0, 14.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.00927734375, -3.8857421875, -3.76220703125, -3.638671875, -3.51513671875, -3.3916015625, -3.26806640625, -3.14453125, -3.02099609375, -2.8974609375, -2.77392578125, -2.650390625, -2.52685546875, -2.4033203125, -2.27978515625, -2.15625, -2.03271484375, -1.9091796875, -1.78564453125, -1.662109375, -1.53857421875, -1.4150390625, -1.29150390625, -1.16796875, -1.04443359375, -0.9208984375, -0.79736328125, -0.673828125, -0.55029296875, -0.4267578125, -0.30322265625, -0.1796875, -0.05615234375, 0.0673828125, 0.19091796875, 0.314453125, 0.43798828125, 0.5615234375, 0.68505859375, 0.80859375, 0.93212890625, 1.0556640625, 1.17919921875, 1.302734375, 1.42626953125, 1.5498046875, 1.67333984375, 1.796875, 1.92041015625, 2.0439453125, 2.16748046875, 2.291015625, 2.41455078125, 2.5380859375, 2.66162109375, 2.78515625, 2.90869140625, 3.0322265625, 3.15576171875, 3.279296875, 3.40283203125, 3.5263671875, 3.64990234375, 3.7734375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 13.0, 18.0, 52.0, 87.0, 210.0, 348.0, 159.0, 57.0, 17.0, 10.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.70325469970703, -61.25688552856445, -59.810516357421875, -58.3641471862793, -56.91777801513672, -55.47140884399414, -54.02503967285156, -52.578670501708984, -51.132301330566406, -49.68593215942383, -48.23956298828125, -46.79319381713867, -45.346824645996094, -43.900455474853516, -42.45408630371094, -41.00771713256836, -39.56134796142578, -38.1149787902832, -36.668609619140625, -35.22224044799805, -33.77587127685547, -32.32950210571289, -30.883132934570312, -29.436763763427734, -27.990394592285156, -26.544025421142578, -25.09765625, -23.651287078857422, -22.204917907714844, -20.758548736572266, -19.312179565429688, -17.86581039428711, -16.41944122314453, -14.973072052001953, -13.526702880859375, -12.080333709716797, -10.633964538574219, -9.18759536743164, -7.7412261962890625, -6.294857025146484, -4.848487854003906, -3.402118682861328, -1.95574951171875, -0.5093803405761719, 0.9369888305664062, 2.3833580017089844, 3.8297271728515625, 5.276096343994141, 6.722465515136719, 8.168834686279297, 9.615203857421875, 11.061573028564453, 12.507942199707031, 13.95431137084961, 15.400680541992188, 16.847049713134766, 18.293418884277344, 19.739788055419922, 21.1861572265625, 22.632526397705078, 24.078895568847656, 25.525264739990234, 26.971633911132812, 28.41800308227539, 29.86437225341797]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 9.0, 17.0, 26.0, 35.0, 64.0, 68.0, 113.0, 129.0, 146.0, 107.0, 75.0, 62.0, 43.0, 18.0, 17.0, 19.0, 10.0, 7.0, 4.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.778369903564453, -18.157878875732422, -17.537389755249023, -16.916898727416992, -16.296409606933594, -15.675918579101562, -15.055428504943848, -14.434938430786133, -13.814447402954102, -13.193957328796387, -12.573467254638672, -11.95297622680664, -11.332486152648926, -10.711996078491211, -10.091506004333496, -9.471015930175781, -8.850525856018066, -8.230035781860352, -7.6095452308654785, -6.989055156707764, -6.368564605712891, -5.748074531555176, -5.127584457397461, -4.507093906402588, -3.886603832244873, -3.266113519668579, -2.645623207092285, -2.0251331329345703, -1.4046428203582764, -0.7841525077819824, -0.16366243362426758, 0.45682811737060547, 1.0773181915283203, 1.6978085041046143, 2.318298816680908, 2.938788890838623, 3.559279203414917, 4.179769515991211, 4.800259590148926, 5.420750141143799, 6.041240215301514, 6.6617302894592285, 7.282220840454102, 7.902710914611816, 8.523200988769531, 9.143692016601562, 9.764181137084961, 10.384672164916992, 11.005162239074707, 11.625652313232422, 12.246142387390137, 12.866632461547852, 13.487123489379883, 14.107613563537598, 14.728103637695312, 15.348594665527344, 15.969083786010742, 16.589574813842773, 17.210063934326172, 17.830554962158203, 18.4510440826416, 19.071535110473633, 19.69202423095703, 20.312515258789062, 20.933006286621094]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 22.0, 27.0, 93.0, 310.0, 2505.0, 4189916.0, 1217.0, 87.0, 34.0, 22.0, 15.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-262.0, -256.5947265625, -251.189453125, -245.7841796875, -240.37890625, -234.9736328125, -229.568359375, -224.1630859375, -218.7578125, -213.3525390625, -207.947265625, -202.5419921875, -197.13671875, -191.7314453125, -186.326171875, -180.9208984375, -175.515625, -170.1103515625, -164.705078125, -159.2998046875, -153.89453125, -148.4892578125, -143.083984375, -137.6787109375, -132.2734375, -126.8681640625, -121.462890625, -116.0576171875, -110.65234375, -105.2470703125, -99.841796875, -94.4365234375, -89.03125, -83.6259765625, -78.220703125, -72.8154296875, -67.41015625, -62.0048828125, -56.599609375, -51.1943359375, -45.7890625, -40.3837890625, -34.978515625, -29.5732421875, -24.16796875, -18.7626953125, -13.357421875, -7.9521484375, -2.546875, 2.8583984375, 8.263671875, 13.6689453125, 19.07421875, 24.4794921875, 29.884765625, 35.2900390625, 40.6953125, 46.1005859375, 51.505859375, 56.9111328125, 62.31640625, 67.7216796875, 73.126953125, 78.5322265625, 83.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 5.0, 8.0, 7.0, 7.0, 18.0, 29.0, 38.0, 49.0, 94.0, 115.0, 137.0, 129.0, 108.0, 75.0, 50.0, 34.0, 34.0, 13.0, 15.0, 5.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.290771484375, -0.2828712463378906, -0.27497100830078125, -0.2670707702636719, -0.2591705322265625, -0.2512702941894531, -0.24337005615234375, -0.23546981811523438, -0.227569580078125, -0.21966934204101562, -0.21176910400390625, -0.20386886596679688, -0.1959686279296875, -0.18806838989257812, -0.18016815185546875, -0.17226791381835938, -0.16436767578125, -0.15646743774414062, -0.14856719970703125, -0.14066696166992188, -0.1327667236328125, -0.12486648559570312, -0.11696624755859375, -0.10906600952148438, -0.101165771484375, -0.09326553344726562, -0.08536529541015625, -0.07746505737304688, -0.0695648193359375, -0.061664581298828125, -0.05376434326171875, -0.045864105224609375, -0.0379638671875, -0.030063629150390625, -0.02216339111328125, -0.014263153076171875, -0.0063629150390625, 0.001537322998046875, 0.00943756103515625, 0.017337799072265625, 0.025238037109375, 0.033138275146484375, 0.04103851318359375, 0.048938751220703125, 0.0568389892578125, 0.06473922729492188, 0.07263946533203125, 0.08053970336914062, 0.08843994140625, 0.09634017944335938, 0.10424041748046875, 0.11214065551757812, 0.1200408935546875, 0.12794113159179688, 0.13584136962890625, 0.14374160766601562, 0.151641845703125, 0.15954208374023438, 0.16744232177734375, 0.17534255981445312, 0.1832427978515625, 0.19114303588867188, 0.19904327392578125, 0.20694351196289062, 0.21484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 19.0, 71.0, 249.0, 30982.0, 4161193.0, 951.0, 383.0, 211.0, 108.0, 61.0, 25.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -17.91357421875, -15.7333984375, -13.55322265625, -11.373046875, -9.19287109375, -7.0126953125, -4.83251953125, -2.65234375, -0.47216796875, 1.7080078125, 3.88818359375, 6.068359375, 8.24853515625, 10.4287109375, 12.60888671875, 14.7890625, 16.96923828125, 19.1494140625, 21.32958984375, 23.509765625, 25.68994140625, 27.8701171875, 30.05029296875, 32.23046875, 34.41064453125, 36.5908203125, 38.77099609375, 40.951171875, 43.13134765625, 45.3115234375, 47.49169921875, 49.671875, 51.85205078125, 54.0322265625, 56.21240234375, 58.392578125, 60.57275390625, 62.7529296875, 64.93310546875, 67.11328125, 69.29345703125, 71.4736328125, 73.65380859375, 75.833984375, 78.01416015625, 80.1943359375, 82.37451171875, 84.5546875, 86.73486328125, 88.9150390625, 91.09521484375, 93.275390625, 95.45556640625, 97.6357421875, 99.81591796875, 101.99609375, 104.17626953125, 106.3564453125, 108.53662109375, 110.716796875, 112.89697265625, 115.0771484375, 117.25732421875, 119.4375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 14.0, 15.0, 22.0, 31.0, 34.0, 62.0, 71.0, 99.0, 181.0, 410.0, 1348.0, 599.0, 436.0, 280.0, 154.0, 96.0, 68.0, 34.0, 34.0, 21.0, 15.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4491310119628906, -0.42731475830078125, -0.4054985046386719, -0.3836822509765625, -0.3618659973144531, -0.34004974365234375, -0.3182334899902344, -0.296417236328125, -0.2746009826660156, -0.25278472900390625, -0.23096847534179688, -0.2091522216796875, -0.18733596801757812, -0.16551971435546875, -0.14370346069335938, -0.12188720703125, -0.10007095336914062, -0.07825469970703125, -0.056438446044921875, -0.0346221923828125, -0.012805938720703125, 0.00901031494140625, 0.030826568603515625, 0.052642822265625, 0.07445907592773438, 0.09627532958984375, 0.11809158325195312, 0.1399078369140625, 0.16172409057617188, 0.18354034423828125, 0.20535659790039062, 0.2271728515625, 0.24898910522460938, 0.27080535888671875, 0.2926216125488281, 0.3144378662109375, 0.3362541198730469, 0.35807037353515625, 0.3798866271972656, 0.401702880859375, 0.4235191345214844, 0.44533538818359375, 0.4671516418457031, 0.4889678955078125, 0.5107841491699219, 0.5326004028320312, 0.5544166564941406, 0.57623291015625, 0.5980491638183594, 0.6198654174804688, 0.6416816711425781, 0.6634979248046875, 0.6853141784667969, 0.7071304321289062, 0.7289466857910156, 0.750762939453125, 0.7725791931152344, 0.7943954467773438, 0.8162117004394531, 0.8380279541015625, 0.8598442077636719, 0.8816604614257812, 0.9034767150878906, 0.92529296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 936.0, 70.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.286718368530273, -21.870264053344727, -13.45380973815918, -5.037355422973633, 3.379098892211914, 11.795553207397461, 20.212007522583008, 28.628461837768555, 37.04491424560547, 45.461368560791016, 53.87782287597656, 62.29427719116211, 70.71073150634766, 79.12718200683594, 87.54364013671875, 95.96009826660156, 104.37654876708984, 112.79299926757812, 121.20945739746094, 129.62591552734375, 138.0423583984375, 146.4588165283203, 154.87527465820312, 163.29173278808594, 171.70819091796875, 180.12464904785156, 188.54110717773438, 196.95755004882812, 205.37400817871094, 213.79046630859375, 222.2069091796875, 230.6233673095703, 239.039794921875, 247.4562530517578, 255.87271118164062, 264.2891540527344, 272.70562744140625, 281.1220703125, 289.53851318359375, 297.9549865722656, 306.3714294433594, 314.7878723144531, 323.204345703125, 331.62078857421875, 340.0372314453125, 348.4537048339844, 356.8701477050781, 365.28662109375, 373.70306396484375, 382.1195068359375, 390.5359802246094, 398.9524230957031, 407.368896484375, 415.78533935546875, 424.2017822265625, 432.6182556152344, 441.0346984863281, 449.4511413574219, 457.86761474609375, 466.2840576171875, 474.70050048828125, 483.1169738769531, 491.5334167480469, 499.94989013671875, 508.3663330078125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 15.0, 27.0, 45.0, 92.0, 116.0, 166.0, 169.0, 156.0, 102.0, 53.0, 33.0, 16.0, 7.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.922917366027832, -6.2643866539001465, -5.605855941772461, -4.947325706481934, -4.28879451751709, -3.6302640438079834, -2.971733570098877, -2.3132028579711914, -1.6546721458435059, -0.9961414933204651, -0.3376108407974243, 0.3209197521209717, 0.9794504642486572, 1.6379811763763428, 2.296511650085449, 2.9550423622131348, 3.6135730743408203, 4.272103786468506, 4.930634498596191, 5.589164733886719, 6.2476959228515625, 6.90622615814209, 7.564756870269775, 8.223287582397461, 8.881818771362305, 9.540349006652832, 10.198880195617676, 10.857410430908203, 11.515941619873047, 12.174471855163574, 12.833002090454102, 13.491533279418945, 14.150064468383789, 14.808594703674316, 15.46712589263916, 16.125656127929688, 16.78418731689453, 17.442718505859375, 18.101247787475586, 18.75977897644043, 19.418310165405273, 20.076841354370117, 20.735370635986328, 21.393901824951172, 22.052433013916016, 22.71096420288086, 23.36949348449707, 24.028024673461914, 24.686553955078125, 25.34508514404297, 26.00361442565918, 26.662145614624023, 27.320676803588867, 27.97920799255371, 28.637737274169922, 29.296268463134766, 29.95479965209961, 30.613330841064453, 31.271860122680664, 31.930391311645508, 32.58892059326172, 33.24745178222656, 33.905982971191406, 34.56451416015625, 35.223045349121094]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 6.0, 9.0, 4.0, 3.0, 11.0, 19.0, 17.0, 31.0, 51.0, 79.0, 168.0, 413.0, 1238.0, 5624.0, 49298.0, 778509.0, 195063.0, 14516.0, 2382.0, 611.0, 231.0, 101.0, 56.0, 28.0, 26.0, 10.0, 12.0, 7.0, 7.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.40625, -10.0977783203125, -9.789306640625, -9.4808349609375, -9.17236328125, -8.8638916015625, -8.555419921875, -8.2469482421875, -7.9384765625, -7.6300048828125, -7.321533203125, -7.0130615234375, -6.70458984375, -6.3961181640625, -6.087646484375, -5.7791748046875, -5.470703125, -5.1622314453125, -4.853759765625, -4.5452880859375, -4.23681640625, -3.9283447265625, -3.619873046875, -3.3114013671875, -3.0029296875, -2.6944580078125, -2.385986328125, -2.0775146484375, -1.76904296875, -1.4605712890625, -1.152099609375, -0.8436279296875, -0.53515625, -0.2266845703125, 0.081787109375, 0.3902587890625, 0.69873046875, 1.0072021484375, 1.315673828125, 1.6241455078125, 1.9326171875, 2.2410888671875, 2.549560546875, 2.8580322265625, 3.16650390625, 3.4749755859375, 3.783447265625, 4.0919189453125, 4.400390625, 4.7088623046875, 5.017333984375, 5.3258056640625, 5.63427734375, 5.9427490234375, 6.251220703125, 6.5596923828125, 6.8681640625, 7.1766357421875, 7.485107421875, 7.7935791015625, 8.10205078125, 8.4105224609375, 8.718994140625, 9.0274658203125, 9.3359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 3.0, 8.0, 13.0, 30.0, 42.0, 72.0, 84.0, 108.0, 150.0, 137.0, 118.0, 92.0, 48.0, 37.0, 26.0, 16.0, 7.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.1609668731689453, -0.15018081665039062, -0.13939476013183594, -0.12860870361328125, -0.11782264709472656, -0.10703659057617188, -0.09625053405761719, -0.0854644775390625, -0.07467842102050781, -0.06389236450195312, -0.05310630798339844, -0.04232025146484375, -0.03153419494628906, -0.020748138427734375, -0.009962081909179688, 0.000823974609375, 0.011610031127929688, 0.022396087646484375, 0.03318214416503906, 0.04396820068359375, 0.05475425720214844, 0.06554031372070312, 0.07632637023925781, 0.0871124267578125, 0.09789848327636719, 0.10868453979492188, 0.11947059631347656, 0.13025665283203125, 0.14104270935058594, 0.15182876586914062, 0.1626148223876953, 0.17340087890625, 0.1841869354248047, 0.19497299194335938, 0.20575904846191406, 0.21654510498046875, 0.22733116149902344, 0.23811721801757812, 0.2489032745361328, 0.2596893310546875, 0.2704753875732422, 0.2812614440917969, 0.29204750061035156, 0.30283355712890625, 0.31361961364746094, 0.3244056701660156, 0.3351917266845703, 0.345977783203125, 0.3567638397216797, 0.3675498962402344, 0.37833595275878906, 0.38912200927734375, 0.39990806579589844, 0.4106941223144531, 0.4214801788330078, 0.4322662353515625, 0.4430522918701172, 0.4538383483886719, 0.46462440490722656, 0.47541046142578125, 0.48619651794433594, 0.4969825744628906, 0.5077686309814453, 0.5185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 4.0, 7.0, 9.0, 8.0, 14.0, 8.0, 7.0, 11.0, 16.0, 23.0, 23.0, 58.0, 219.0, 2194.0, 89429.0, 942628.0, 12746.0, 765.0, 148.0, 48.0, 31.0, 13.0, 26.0, 13.0, 12.0, 20.0, 7.0, 7.0, 12.0, 5.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.0703125, -13.6475830078125, -13.224853515625, -12.8021240234375, -12.37939453125, -11.9566650390625, -11.533935546875, -11.1112060546875, -10.6884765625, -10.2657470703125, -9.843017578125, -9.4202880859375, -8.99755859375, -8.5748291015625, -8.152099609375, -7.7293701171875, -7.306640625, -6.8839111328125, -6.461181640625, -6.0384521484375, -5.61572265625, -5.1929931640625, -4.770263671875, -4.3475341796875, -3.9248046875, -3.5020751953125, -3.079345703125, -2.6566162109375, -2.23388671875, -1.8111572265625, -1.388427734375, -0.9656982421875, -0.54296875, -0.1202392578125, 0.302490234375, 0.7252197265625, 1.14794921875, 1.5706787109375, 1.993408203125, 2.4161376953125, 2.8388671875, 3.2615966796875, 3.684326171875, 4.1070556640625, 4.52978515625, 4.9525146484375, 5.375244140625, 5.7979736328125, 6.220703125, 6.6434326171875, 7.066162109375, 7.4888916015625, 7.91162109375, 8.3343505859375, 8.757080078125, 9.1798095703125, 9.6025390625, 10.0252685546875, 10.447998046875, 10.8707275390625, 11.29345703125, 11.7161865234375, 12.138916015625, 12.5616455078125, 12.984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 2.0, 12.0, 4.0, 1.0, 13.0, 15.0, 5.0, 14.0, 19.0, 23.0, 29.0, 27.0, 28.0, 20.0, 45.0, 43.0, 34.0, 49.0, 50.0, 40.0, 50.0, 44.0, 39.0, 40.0, 42.0, 44.0, 41.0, 30.0, 33.0, 29.0, 23.0, 21.0, 11.0, 14.0, 15.0, 17.0, 14.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.88525390625, -0.8581085205078125, -0.830963134765625, -0.8038177490234375, -0.77667236328125, -0.7495269775390625, -0.722381591796875, -0.6952362060546875, -0.6680908203125, -0.6409454345703125, -0.613800048828125, -0.5866546630859375, -0.55950927734375, -0.5323638916015625, -0.505218505859375, -0.4780731201171875, -0.450927734375, -0.4237823486328125, -0.396636962890625, -0.3694915771484375, -0.34234619140625, -0.3152008056640625, -0.288055419921875, -0.2609100341796875, -0.2337646484375, -0.2066192626953125, -0.179473876953125, -0.1523284912109375, -0.12518310546875, -0.0980377197265625, -0.070892333984375, -0.0437469482421875, -0.0166015625, 0.0105438232421875, 0.037689208984375, 0.0648345947265625, 0.09197998046875, 0.1191253662109375, 0.146270751953125, 0.1734161376953125, 0.2005615234375, 0.2277069091796875, 0.254852294921875, 0.2819976806640625, 0.30914306640625, 0.3362884521484375, 0.363433837890625, 0.3905792236328125, 0.417724609375, 0.4448699951171875, 0.472015380859375, 0.4991607666015625, 0.52630615234375, 0.5534515380859375, 0.580596923828125, 0.6077423095703125, 0.6348876953125, 0.6620330810546875, 0.689178466796875, 0.7163238525390625, 0.74346923828125, 0.7706146240234375, 0.797760009765625, 0.8249053955078125, 0.85205078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 2.0, 11.0, 8.0, 12.0, 20.0, 35.0, 65.0, 191.0, 948.0, 25240.0, 1013634.0, 7501.0, 587.0, 126.0, 40.0, 26.0, 18.0, 15.0, 15.0, 7.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-28.703125, -27.913818359375, -27.12451171875, -26.335205078125, -25.5458984375, -24.756591796875, -23.96728515625, -23.177978515625, -22.388671875, -21.599365234375, -20.81005859375, -20.020751953125, -19.2314453125, -18.442138671875, -17.65283203125, -16.863525390625, -16.07421875, -15.284912109375, -14.49560546875, -13.706298828125, -12.9169921875, -12.127685546875, -11.33837890625, -10.549072265625, -9.759765625, -8.970458984375, -8.18115234375, -7.391845703125, -6.6025390625, -5.813232421875, -5.02392578125, -4.234619140625, -3.4453125, -2.656005859375, -1.86669921875, -1.077392578125, -0.2880859375, 0.501220703125, 1.29052734375, 2.079833984375, 2.869140625, 3.658447265625, 4.44775390625, 5.237060546875, 6.0263671875, 6.815673828125, 7.60498046875, 8.394287109375, 9.18359375, 9.972900390625, 10.76220703125, 11.551513671875, 12.3408203125, 13.130126953125, 13.91943359375, 14.708740234375, 15.498046875, 16.287353515625, 17.07666015625, 17.865966796875, 18.6552734375, 19.444580078125, 20.23388671875, 21.023193359375, 21.8125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 6.0, 10.0, 18.0, 13.0, 33.0, 35.0, 48.0, 89.0, 230.0, 190.0, 74.0, 41.0, 38.0, 37.0, 23.0, 18.0, 14.0, 15.0, 9.0, 6.0, 8.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002597808837890625, -0.0025212466716766357, -0.0024446845054626465, -0.0023681223392486572, -0.002291560173034668, -0.0022149980068206787, -0.0021384358406066895, -0.0020618736743927, -0.001985311508178711, -0.0019087493419647217, -0.0018321871757507324, -0.0017556250095367432, -0.001679062843322754, -0.0016025006771087646, -0.0015259385108947754, -0.0014493763446807861, -0.0013728141784667969, -0.0012962520122528076, -0.0012196898460388184, -0.001143127679824829, -0.0010665655136108398, -0.0009900033473968506, -0.0009134411811828613, -0.0008368790149688721, -0.0007603168487548828, -0.0006837546825408936, -0.0006071925163269043, -0.000530630350112915, -0.0004540681838989258, -0.0003775060176849365, -0.00030094385147094727, -0.000224381685256958, -0.00014781951904296875, -7.125735282897949e-05, 5.304813385009766e-06, 8.186697959899902e-05, 0.00015842914581298828, 0.00023499131202697754, 0.0003115534782409668, 0.00038811564445495605, 0.0004646778106689453, 0.0005412399768829346, 0.0006178021430969238, 0.0006943643093109131, 0.0007709264755249023, 0.0008474886417388916, 0.0009240508079528809, 0.0010006129741668701, 0.0010771751403808594, 0.0011537373065948486, 0.0012302994728088379, 0.0013068616390228271, 0.0013834238052368164, 0.0014599859714508057, 0.001536548137664795, 0.0016131103038787842, 0.0016896724700927734, 0.0017662346363067627, 0.001842796802520752, 0.0019193589687347412, 0.0019959211349487305, 0.0020724833011627197, 0.002149045467376709, 0.0022256076335906982, 0.0023021697998046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 8.0, 12.0, 25.0, 33.0, 59.0, 106.0, 162.0, 301.0, 550.0, 1239.0, 2956.0, 8852.0, 47542.0, 877854.0, 89401.0, 12437.0, 3738.0, 1560.0, 714.0, 391.0, 218.0, 130.0, 91.0, 44.0, 36.0, 30.0, 11.0, 11.0, 7.0, 8.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.046875, -17.567138671875, -17.08740234375, -16.607666015625, -16.1279296875, -15.648193359375, -15.16845703125, -14.688720703125, -14.208984375, -13.729248046875, -13.24951171875, -12.769775390625, -12.2900390625, -11.810302734375, -11.33056640625, -10.850830078125, -10.37109375, -9.891357421875, -9.41162109375, -8.931884765625, -8.4521484375, -7.972412109375, -7.49267578125, -7.012939453125, -6.533203125, -6.053466796875, -5.57373046875, -5.093994140625, -4.6142578125, -4.134521484375, -3.65478515625, -3.175048828125, -2.6953125, -2.215576171875, -1.73583984375, -1.256103515625, -0.7763671875, -0.296630859375, 0.18310546875, 0.662841796875, 1.142578125, 1.622314453125, 2.10205078125, 2.581787109375, 3.0615234375, 3.541259765625, 4.02099609375, 4.500732421875, 4.98046875, 5.460205078125, 5.93994140625, 6.419677734375, 6.8994140625, 7.379150390625, 7.85888671875, 8.338623046875, 8.818359375, 9.298095703125, 9.77783203125, 10.257568359375, 10.7373046875, 11.217041015625, 11.69677734375, 12.176513671875, 12.65625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 5.0, 6.0, 11.0, 29.0, 72.0, 156.0, 367.0, 170.0, 71.0, 29.0, 22.0, 10.0, 8.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.49505615234375, -6.2205810546875, -5.94610595703125, -5.671630859375, -5.39715576171875, -5.1226806640625, -4.84820556640625, -4.57373046875, -4.29925537109375, -4.0247802734375, -3.75030517578125, -3.475830078125, -3.20135498046875, -2.9268798828125, -2.65240478515625, -2.3779296875, -2.10345458984375, -1.8289794921875, -1.55450439453125, -1.280029296875, -1.00555419921875, -0.7310791015625, -0.45660400390625, -0.18212890625, 0.09234619140625, 0.3668212890625, 0.64129638671875, 0.915771484375, 1.19024658203125, 1.4647216796875, 1.73919677734375, 2.013671875, 2.28814697265625, 2.5626220703125, 2.83709716796875, 3.111572265625, 3.38604736328125, 3.6605224609375, 3.93499755859375, 4.20947265625, 4.48394775390625, 4.7584228515625, 5.03289794921875, 5.307373046875, 5.58184814453125, 5.8563232421875, 6.13079833984375, 6.4052734375, 6.67974853515625, 6.9542236328125, 7.22869873046875, 7.503173828125, 7.77764892578125, 8.0521240234375, 8.32659912109375, 8.60107421875, 8.87554931640625, 9.1500244140625, 9.42449951171875, 9.698974609375, 9.97344970703125, 10.2479248046875, 10.52239990234375, 10.796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 12.0, 41.0, 142.0, 353.0, 300.0, 100.0, 32.0, 16.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.00551986694336, -54.122154235839844, -52.23878860473633, -50.35542297363281, -48.47206115722656, -46.58869552612305, -44.70532989501953, -42.821964263916016, -40.9385986328125, -39.055233001708984, -37.17186737060547, -35.28850555419922, -33.4051399230957, -31.521774291992188, -29.638408660888672, -27.755043029785156, -25.871681213378906, -23.98831558227539, -22.104951858520508, -20.221586227416992, -18.33822250366211, -16.454856872558594, -14.571491241455078, -12.688126564025879, -10.80476188659668, -8.92139720916748, -7.038032054901123, -5.154666900634766, -3.2713022232055664, -1.3879375457763672, 0.49542808532714844, 2.3787927627563477, 4.2621612548828125, 6.145525932312012, 8.028890609741211, 9.912256240844727, 11.795620918273926, 13.678985595703125, 15.56235122680664, 17.445716857910156, 19.32908058166504, 21.212446212768555, 23.095809936523438, 24.979175567626953, 26.86254119873047, 28.74590492248535, 30.629270553588867, 32.51263427734375, 34.395999908447266, 36.27936553955078, 38.1627311706543, 40.04609680175781, 41.92945861816406, 43.81282424926758, 45.696189880371094, 47.57955551147461, 49.462921142578125, 51.34628677368164, 53.229652404785156, 55.113014221191406, 56.99637985229492, 58.87974548339844, 60.76311111450195, 62.64647674560547, 64.52983856201172]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 13.0, 16.0, 22.0, 32.0, 46.0, 80.0, 86.0, 83.0, 104.0, 95.0, 99.0, 70.0, 65.0, 60.0, 44.0, 33.0, 22.0, 6.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-24.54124641418457, -23.985618591308594, -23.429990768432617, -22.87436294555664, -22.318735122680664, -21.763107299804688, -21.20747947692871, -20.651851654052734, -20.096221923828125, -19.54059410095215, -18.984966278076172, -18.429338455200195, -17.87371063232422, -17.318082809448242, -16.762454986572266, -16.206825256347656, -15.651199340820312, -15.095571517944336, -14.53994369506836, -13.984315872192383, -13.428688049316406, -12.87306022644043, -12.317431449890137, -11.76180362701416, -11.206175804138184, -10.650547981262207, -10.09492015838623, -9.539292335510254, -8.983663558959961, -8.428035736083984, -7.872407913208008, -7.316780090332031, -6.7611541748046875, -6.205526351928711, -5.649898529052734, -5.0942702293396, -4.538642406463623, -3.9830145835876465, -3.427386522293091, -2.871758460998535, -2.3161306381225586, -1.7605026960372925, -1.2048747539520264, -0.6492468118667603, -0.09361886978149414, 0.4620089530944824, 1.017637014389038, 1.5732650756835938, 2.1288928985595703, 2.684520721435547, 3.2401487827301025, 3.795776844024658, 4.351404666900635, 4.907032489776611, 5.462660789489746, 6.018288612365723, 6.573916435241699, 7.129544258117676, 7.685172080993652, 8.240799903869629, 8.796428680419922, 9.352056503295898, 9.907684326171875, 10.463312149047852, 11.018939971923828]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 4.0, 2.0, 6.0, 6.0, 10.0, 6.0, 4.0, 10.0, 12.0, 6.0, 8.0, 8.0, 16.0, 12.0, 18.0, 34.0, 73.0, 271.0, 1922.0, 4190191.0, 1326.0, 129.0, 47.0, 35.0, 24.0, 12.0, 8.0, 8.0, 14.0, 10.0, 6.0, 6.0, 14.0, 6.0, 10.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-77.625, -74.9912109375, -72.357421875, -69.7236328125, -67.08984375, -64.4560546875, -61.822265625, -59.1884765625, -56.5546875, -53.9208984375, -51.287109375, -48.6533203125, -46.01953125, -43.3857421875, -40.751953125, -38.1181640625, -35.484375, -32.8505859375, -30.216796875, -27.5830078125, -24.94921875, -22.3154296875, -19.681640625, -17.0478515625, -14.4140625, -11.7802734375, -9.146484375, -6.5126953125, -3.87890625, -1.2451171875, 1.388671875, 4.0224609375, 6.65625, 9.2900390625, 11.923828125, 14.5576171875, 17.19140625, 19.8251953125, 22.458984375, 25.0927734375, 27.7265625, 30.3603515625, 32.994140625, 35.6279296875, 38.26171875, 40.8955078125, 43.529296875, 46.1630859375, 48.796875, 51.4306640625, 54.064453125, 56.6982421875, 59.33203125, 61.9658203125, 64.599609375, 67.2333984375, 69.8671875, 72.5009765625, 75.134765625, 77.7685546875, 80.40234375, 83.0361328125, 85.669921875, 88.3037109375, 90.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 14.0, 27.0, 48.0, 63.0, 76.0, 101.0, 125.0, 113.0, 114.0, 101.0, 79.0, 61.0, 25.0, 20.0, 12.0, 2.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5100975036621094, -0.49773406982421875, -0.4853706359863281, -0.4730072021484375, -0.4606437683105469, -0.44828033447265625, -0.4359169006347656, -0.423553466796875, -0.4111900329589844, -0.39882659912109375, -0.3864631652832031, -0.3740997314453125, -0.3617362976074219, -0.34937286376953125, -0.3370094299316406, -0.32464599609375, -0.3122825622558594, -0.29991912841796875, -0.2875556945800781, -0.2751922607421875, -0.2628288269042969, -0.25046539306640625, -0.23810195922851562, -0.225738525390625, -0.21337509155273438, -0.20101165771484375, -0.18864822387695312, -0.1762847900390625, -0.16392135620117188, -0.15155792236328125, -0.13919448852539062, -0.1268310546875, -0.11446762084960938, -0.10210418701171875, -0.08974075317382812, -0.0773773193359375, -0.06501388549804688, -0.05265045166015625, -0.040287017822265625, -0.027923583984375, -0.015560150146484375, -0.00319671630859375, 0.009166717529296875, 0.0215301513671875, 0.033893585205078125, 0.04625701904296875, 0.058620452880859375, 0.07098388671875, 0.08334732055664062, 0.09571075439453125, 0.10807418823242188, 0.1204376220703125, 0.13280105590820312, 0.14516448974609375, 0.15752792358398438, 0.169891357421875, 0.18225479125976562, 0.19461822509765625, 0.20698165893554688, 0.2193450927734375, 0.23170852661132812, 0.24407196044921875, 0.2564353942871094, 0.268798828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 26.0, 76.0, 297.0, 2420.0, 4191133.0, 273.0, 48.0, 10.0, 2.0], "bins": [-290.75, -285.843505859375, -280.93701171875, -276.030517578125, -271.1240234375, -266.217529296875, -261.31103515625, -256.404541015625, -251.498046875, -246.591552734375, -241.68505859375, -236.778564453125, -231.8720703125, -226.965576171875, -222.05908203125, -217.152587890625, -212.24609375, -207.339599609375, -202.43310546875, -197.526611328125, -192.6201171875, -187.713623046875, -182.80712890625, -177.900634765625, -172.994140625, -168.087646484375, -163.18115234375, -158.274658203125, -153.3681640625, -148.461669921875, -143.55517578125, -138.648681640625, -133.7421875, -128.835693359375, -123.92919921875, -119.022705078125, -114.1162109375, -109.209716796875, -104.30322265625, -99.396728515625, -94.490234375, -89.583740234375, -84.67724609375, -79.770751953125, -74.8642578125, -69.957763671875, -65.05126953125, -60.144775390625, -55.23828125, -50.331787109375, -45.42529296875, -40.518798828125, -35.6123046875, -30.705810546875, -25.79931640625, -20.892822265625, -15.986328125, -11.079833984375, -6.17333984375, -1.266845703125, 3.6396484375, 8.546142578125, 13.45263671875, 18.359130859375, 23.265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 9.0, 15.0, 16.0, 46.0, 57.0, 125.0, 226.0, 697.0, 1949.0, 461.0, 198.0, 110.0, 82.0, 41.0, 18.0, 7.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.080078125, -2.035369873046875, -1.99066162109375, -1.945953369140625, -1.9012451171875, -1.856536865234375, -1.81182861328125, -1.767120361328125, -1.722412109375, -1.677703857421875, -1.63299560546875, -1.588287353515625, -1.5435791015625, -1.498870849609375, -1.45416259765625, -1.409454345703125, -1.36474609375, -1.320037841796875, -1.27532958984375, -1.230621337890625, -1.1859130859375, -1.141204833984375, -1.09649658203125, -1.051788330078125, -1.007080078125, -0.962371826171875, -0.91766357421875, -0.872955322265625, -0.8282470703125, -0.783538818359375, -0.73883056640625, -0.694122314453125, -0.6494140625, -0.604705810546875, -0.55999755859375, -0.515289306640625, -0.4705810546875, -0.425872802734375, -0.38116455078125, -0.336456298828125, -0.291748046875, -0.247039794921875, -0.20233154296875, -0.157623291015625, -0.1129150390625, -0.068206787109375, -0.02349853515625, 0.021209716796875, 0.06591796875, 0.110626220703125, 0.15533447265625, 0.200042724609375, 0.2447509765625, 0.289459228515625, 0.33416748046875, 0.378875732421875, 0.423583984375, 0.468292236328125, 0.51300048828125, 0.557708740234375, 0.6024169921875, 0.647125244140625, 0.69183349609375, 0.736541748046875, 0.78125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 1010.0], "bins": [-714.6007080078125, -703.3050537109375, -692.0093383789062, -680.7136840820312, -669.41796875, -658.122314453125, -646.8265991210938, -635.5309448242188, -624.2352294921875, -612.9395751953125, -601.6438598632812, -590.3482055664062, -579.052490234375, -567.7568359375, -556.4611206054688, -545.1654663085938, -533.8698120117188, -522.5741577148438, -511.2784423828125, -499.9827575683594, -488.68707275390625, -477.39141845703125, -466.0957336425781, -454.800048828125, -443.5043640136719, -432.20867919921875, -420.9129943847656, -409.6173095703125, -398.3216552734375, -387.0259704589844, -375.73028564453125, -364.4346008300781, -353.138916015625, -341.8432312011719, -330.54754638671875, -319.2518615722656, -307.9561767578125, -296.6605224609375, -285.3648376464844, -274.06915283203125, -262.7734680175781, -251.477783203125, -240.18209838867188, -228.8864288330078, -217.5907440185547, -206.29505920410156, -194.9993896484375, -183.70370483398438, -172.40802001953125, -161.11233520507812, -149.816650390625, -138.52098083496094, -127.22529602050781, -115.92961120605469, -104.6339340209961, -93.3382568359375, -82.04256439208984, -70.74688720703125, -59.451202392578125, -48.155521392822266, -36.859840393066406, -25.564159393310547, -14.268478393554688, -2.9728012084960938, 8.322883605957031]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 11.0, 22.0, 33.0, 60.0, 94.0, 133.0, 186.0, 158.0, 150.0, 73.0, 51.0, 26.0, 12.0, 6.0, 1.0, 0.0, 3.0], "bins": [-39.6678581237793, -38.92586898803711, -38.183876037597656, -37.44188690185547, -36.69989776611328, -35.95790481567383, -35.21591567993164, -34.47392272949219, -33.73193359375, -32.98994445800781, -32.24795150756836, -31.505962371826172, -30.76397132873535, -30.02198028564453, -29.279991149902344, -28.538000106811523, -27.796009063720703, -27.054018020629883, -26.312028884887695, -25.570037841796875, -24.828046798706055, -24.086055755615234, -23.344066619873047, -22.602075576782227, -21.86008644104004, -21.11809539794922, -20.37610626220703, -19.63411521911621, -18.89212417602539, -18.15013313293457, -17.408143997192383, -16.666152954101562, -15.92416000366211, -15.182169914245605, -14.440178871154785, -13.698188781738281, -12.956197738647461, -12.214207649230957, -11.472217559814453, -10.730226516723633, -9.988236427307129, -9.246246337890625, -8.504255294799805, -7.762265205383301, -7.0202741622924805, -6.278284072875977, -5.5362935066223145, -4.794302940368652, -4.05231237411499, -3.310321807861328, -2.568331241607666, -1.826340913772583, -1.084350347518921, -0.3423597812652588, 0.3996305465698242, 1.1416211128234863, 1.8836116790771484, 2.6256022453308105, 3.3675928115844727, 4.109582901000977, 4.851573944091797, 5.593564033508301, 6.335554599761963, 7.077545166015625, 7.819535732269287]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 6.0, 5.0, 7.0, 9.0, 10.0, 9.0, 21.0, 10.0, 20.0, 27.0, 26.0, 24.0, 30.0, 27.0, 45.0, 41.0, 36.0, 53.0, 2087.0, 1008352.0, 37180.0, 98.0, 50.0, 43.0, 40.0, 41.0, 34.0, 34.0, 32.0, 19.0, 22.0, 21.0, 18.0, 11.0, 9.0, 13.0, 11.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0], "bins": [-34.40625, -33.442138671875, -32.47802734375, -31.513916015625, -30.5498046875, -29.585693359375, -28.62158203125, -27.657470703125, -26.693359375, -25.729248046875, -24.76513671875, -23.801025390625, -22.8369140625, -21.872802734375, -20.90869140625, -19.944580078125, -18.98046875, -18.016357421875, -17.05224609375, -16.088134765625, -15.1240234375, -14.159912109375, -13.19580078125, -12.231689453125, -11.267578125, -10.303466796875, -9.33935546875, -8.375244140625, -7.4111328125, -6.447021484375, -5.48291015625, -4.518798828125, -3.5546875, -2.590576171875, -1.62646484375, -0.662353515625, 0.3017578125, 1.265869140625, 2.22998046875, 3.194091796875, 4.158203125, 5.122314453125, 6.08642578125, 7.050537109375, 8.0146484375, 8.978759765625, 9.94287109375, 10.906982421875, 11.87109375, 12.835205078125, 13.79931640625, 14.763427734375, 15.7275390625, 16.691650390625, 17.65576171875, 18.619873046875, 19.583984375, 20.548095703125, 21.51220703125, 22.476318359375, 23.4404296875, 24.404541015625, 25.36865234375, 26.332763671875, 27.296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 38.0, 145.0, 350.0, 322.0, 127.0, 29.0, 4.0, 1.0], "bins": [-5.05078125, -4.9649658203125, -4.879150390625, -4.7933349609375, -4.70751953125, -4.6217041015625, -4.535888671875, -4.4500732421875, -4.3642578125, -4.2784423828125, -4.192626953125, -4.1068115234375, -4.02099609375, -3.9351806640625, -3.849365234375, -3.7635498046875, -3.677734375, -3.5919189453125, -3.506103515625, -3.4202880859375, -3.33447265625, -3.2486572265625, -3.162841796875, -3.0770263671875, -2.9912109375, -2.9053955078125, -2.819580078125, -2.7337646484375, -2.64794921875, -2.5621337890625, -2.476318359375, -2.3905029296875, -2.3046875, -2.2188720703125, -2.133056640625, -2.0472412109375, -1.96142578125, -1.8756103515625, -1.789794921875, -1.7039794921875, -1.6181640625, -1.5323486328125, -1.446533203125, -1.3607177734375, -1.27490234375, -1.1890869140625, -1.103271484375, -1.0174560546875, -0.931640625, -0.8458251953125, -0.760009765625, -0.6741943359375, -0.58837890625, -0.5025634765625, -0.416748046875, -0.3309326171875, -0.2451171875, -0.1593017578125, -0.073486328125, 0.0123291015625, 0.09814453125, 0.1839599609375, 0.269775390625, 0.3555908203125, 0.44140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 6.0, 5.0, 9.0, 25.0, 34.0, 69.0, 143.0, 431.0, 1728.0, 10634.0, 172209.0, 796350.0, 59781.0, 5531.0, 1065.0, 283.0, 119.0, 49.0, 26.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.265869140625, -11.78173828125, -11.297607421875, -10.8134765625, -10.329345703125, -9.84521484375, -9.361083984375, -8.876953125, -8.392822265625, -7.90869140625, -7.424560546875, -6.9404296875, -6.456298828125, -5.97216796875, -5.488037109375, -5.00390625, -4.519775390625, -4.03564453125, -3.551513671875, -3.0673828125, -2.583251953125, -2.09912109375, -1.614990234375, -1.130859375, -0.646728515625, -0.16259765625, 0.321533203125, 0.8056640625, 1.289794921875, 1.77392578125, 2.258056640625, 2.7421875, 3.226318359375, 3.71044921875, 4.194580078125, 4.6787109375, 5.162841796875, 5.64697265625, 6.131103515625, 6.615234375, 7.099365234375, 7.58349609375, 8.067626953125, 8.5517578125, 9.035888671875, 9.52001953125, 10.004150390625, 10.48828125, 10.972412109375, 11.45654296875, 11.940673828125, 12.4248046875, 12.908935546875, 13.39306640625, 13.877197265625, 14.361328125, 14.845458984375, 15.32958984375, 15.813720703125, 16.2978515625, 16.781982421875, 17.26611328125, 17.750244140625, 18.234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 15.0, 8.0, 16.0, 22.0, 30.0, 28.0, 35.0, 45.0, 50.0, 69.0, 53.0, 77.0, 58.0, 62.0, 66.0, 44.0, 53.0, 52.0, 31.0, 42.0, 28.0, 18.0, 13.0, 14.0, 15.0, 9.0, 6.0, 3.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.916015625, -3.779876708984375, -3.64373779296875, -3.507598876953125, -3.3714599609375, -3.235321044921875, -3.09918212890625, -2.963043212890625, -2.826904296875, -2.690765380859375, -2.55462646484375, -2.418487548828125, -2.2823486328125, -2.146209716796875, -2.01007080078125, -1.873931884765625, -1.73779296875, -1.601654052734375, -1.46551513671875, -1.329376220703125, -1.1932373046875, -1.057098388671875, -0.92095947265625, -0.784820556640625, -0.648681640625, -0.512542724609375, -0.37640380859375, -0.240264892578125, -0.1041259765625, 0.032012939453125, 0.16815185546875, 0.304290771484375, 0.4404296875, 0.576568603515625, 0.71270751953125, 0.848846435546875, 0.9849853515625, 1.121124267578125, 1.25726318359375, 1.393402099609375, 1.529541015625, 1.665679931640625, 1.80181884765625, 1.937957763671875, 2.0740966796875, 2.210235595703125, 2.34637451171875, 2.482513427734375, 2.61865234375, 2.754791259765625, 2.89093017578125, 3.027069091796875, 3.1632080078125, 3.299346923828125, 3.43548583984375, 3.571624755859375, 3.707763671875, 3.843902587890625, 3.98004150390625, 4.116180419921875, 4.2523193359375, 4.388458251953125, 4.52459716796875, 4.660736083984375, 4.796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 13.0, 18.0, 22.0, 26.0, 62.0, 121.0, 245.0, 908.0, 4245.0, 41973.0, 860259.0, 130464.0, 8037.0, 1407.0, 364.0, 133.0, 66.0, 53.0, 28.0, 15.0, 13.0, 17.0, 9.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4375, -14.93408203125, -14.4306640625, -13.92724609375, -13.423828125, -12.92041015625, -12.4169921875, -11.91357421875, -11.41015625, -10.90673828125, -10.4033203125, -9.89990234375, -9.396484375, -8.89306640625, -8.3896484375, -7.88623046875, -7.3828125, -6.87939453125, -6.3759765625, -5.87255859375, -5.369140625, -4.86572265625, -4.3623046875, -3.85888671875, -3.35546875, -2.85205078125, -2.3486328125, -1.84521484375, -1.341796875, -0.83837890625, -0.3349609375, 0.16845703125, 0.671875, 1.17529296875, 1.6787109375, 2.18212890625, 2.685546875, 3.18896484375, 3.6923828125, 4.19580078125, 4.69921875, 5.20263671875, 5.7060546875, 6.20947265625, 6.712890625, 7.21630859375, 7.7197265625, 8.22314453125, 8.7265625, 9.22998046875, 9.7333984375, 10.23681640625, 10.740234375, 11.24365234375, 11.7470703125, 12.25048828125, 12.75390625, 13.25732421875, 13.7607421875, 14.26416015625, 14.767578125, 15.27099609375, 15.7744140625, 16.27783203125, 16.78125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 7.0, 3.0, 5.0, 8.0, 20.0, 27.0, 22.0, 41.0, 62.0, 98.0, 131.0, 133.0, 119.0, 87.0, 61.0, 54.0, 31.0, 25.0, 4.0, 10.0, 9.0, 10.0, 2.0, 4.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0012493133544921875, -0.0012184828519821167, -0.001187652349472046, -0.001156821846961975, -0.0011259913444519043, -0.0010951608419418335, -0.0010643303394317627, -0.001033499836921692, -0.001002669334411621, -0.0009718388319015503, -0.0009410083293914795, -0.0009101778268814087, -0.0008793473243713379, -0.0008485168218612671, -0.0008176863193511963, -0.0007868558168411255, -0.0007560253143310547, -0.0007251948118209839, -0.0006943643093109131, -0.0006635338068008423, -0.0006327033042907715, -0.0006018728017807007, -0.0005710422992706299, -0.0005402117967605591, -0.0005093812942504883, -0.0004785507917404175, -0.0004477202892303467, -0.0004168897867202759, -0.0003860592842102051, -0.0003552287817001343, -0.0003243982791900635, -0.0002935677766799927, -0.0002627372741699219, -0.00023190677165985107, -0.00020107626914978027, -0.00017024576663970947, -0.00013941526412963867, -0.00010858476161956787, -7.775425910949707e-05, -4.692375659942627e-05, -1.609325408935547e-05, 1.4737248420715332e-05, 4.556775093078613e-05, 7.639825344085693e-05, 0.00010722875595092773, 0.00013805925846099854, 0.00016888976097106934, 0.00019972026348114014, 0.00023055076599121094, 0.00026138126850128174, 0.00029221177101135254, 0.00032304227352142334, 0.00035387277603149414, 0.00038470327854156494, 0.00041553378105163574, 0.00044636428356170654, 0.00047719478607177734, 0.0005080252885818481, 0.0005388557910919189, 0.0005696862936019897, 0.0006005167961120605, 0.0006313472986221313, 0.0006621778011322021, 0.000693008303642273, 0.0007238388061523438]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 4.0, 11.0, 15.0, 32.0, 34.0, 62.0, 107.0, 281.0, 935.0, 6228.0, 155267.0, 849635.0, 32494.0, 2521.0, 524.0, 186.0, 91.0, 32.0, 26.0, 12.0, 11.0, 8.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-19.203125, -18.738037109375, -18.27294921875, -17.807861328125, -17.3427734375, -16.877685546875, -16.41259765625, -15.947509765625, -15.482421875, -15.017333984375, -14.55224609375, -14.087158203125, -13.6220703125, -13.156982421875, -12.69189453125, -12.226806640625, -11.76171875, -11.296630859375, -10.83154296875, -10.366455078125, -9.9013671875, -9.436279296875, -8.97119140625, -8.506103515625, -8.041015625, -7.575927734375, -7.11083984375, -6.645751953125, -6.1806640625, -5.715576171875, -5.25048828125, -4.785400390625, -4.3203125, -3.855224609375, -3.39013671875, -2.925048828125, -2.4599609375, -1.994873046875, -1.52978515625, -1.064697265625, -0.599609375, -0.134521484375, 0.33056640625, 0.795654296875, 1.2607421875, 1.725830078125, 2.19091796875, 2.656005859375, 3.12109375, 3.586181640625, 4.05126953125, 4.516357421875, 4.9814453125, 5.446533203125, 5.91162109375, 6.376708984375, 6.841796875, 7.306884765625, 7.77197265625, 8.237060546875, 8.7021484375, 9.167236328125, 9.63232421875, 10.097412109375, 10.5625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 12.0, 12.0, 22.0, 33.0, 49.0, 78.0, 122.0, 162.0, 160.0, 141.0, 76.0, 41.0, 25.0, 19.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.484375, -7.3245849609375, -7.164794921875, -7.0050048828125, -6.84521484375, -6.6854248046875, -6.525634765625, -6.3658447265625, -6.2060546875, -6.0462646484375, -5.886474609375, -5.7266845703125, -5.56689453125, -5.4071044921875, -5.247314453125, -5.0875244140625, -4.927734375, -4.7679443359375, -4.608154296875, -4.4483642578125, -4.28857421875, -4.1287841796875, -3.968994140625, -3.8092041015625, -3.6494140625, -3.4896240234375, -3.329833984375, -3.1700439453125, -3.01025390625, -2.8504638671875, -2.690673828125, -2.5308837890625, -2.37109375, -2.2113037109375, -2.051513671875, -1.8917236328125, -1.73193359375, -1.5721435546875, -1.412353515625, -1.2525634765625, -1.0927734375, -0.9329833984375, -0.773193359375, -0.6134033203125, -0.45361328125, -0.2938232421875, -0.134033203125, 0.0257568359375, 0.185546875, 0.3453369140625, 0.505126953125, 0.6649169921875, 0.82470703125, 0.9844970703125, 1.144287109375, 1.3040771484375, 1.4638671875, 1.6236572265625, 1.783447265625, 1.9432373046875, 2.10302734375, 2.2628173828125, 2.422607421875, 2.5823974609375, 2.7421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 80.0, 809.0, 106.0, 14.0, 5.0, 1.0, 1.0], "bins": [-489.5556640625, -481.1854248046875, -472.815185546875, -464.4449462890625, -456.0746765136719, -447.7044372558594, -439.3341979980469, -430.9639587402344, -422.5937194824219, -414.2234802246094, -405.8532409667969, -397.48297119140625, -389.11273193359375, -380.74249267578125, -372.37225341796875, -364.00201416015625, -355.63177490234375, -347.26153564453125, -338.89129638671875, -330.52105712890625, -322.1507873535156, -313.7805480957031, -305.4103088378906, -297.0400695800781, -288.6697998046875, -280.299560546875, -271.9293212890625, -263.55908203125, -255.18882751464844, -246.81857299804688, -238.44833374023438, -230.07809448242188, -221.7078857421875, -213.337646484375, -204.96739196777344, -196.59715270996094, -188.22691345214844, -179.85665893554688, -171.48641967773438, -163.11618041992188, -154.7459259033203, -146.3756866455078, -138.00543212890625, -129.63519287109375, -121.26495361328125, -112.89470672607422, -104.52445983886719, -96.15422058105469, -87.78398132324219, -79.41373443603516, -71.04349517822266, -62.673248291015625, -54.30300521850586, -45.932762145996094, -37.56251525878906, -29.192272186279297, -20.822025299072266, -12.451781272888184, -4.081537246704102, 4.288707733154297, 12.658950805664062, 21.029193878173828, 29.39944076538086, 37.769683837890625, 46.13992691040039]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 7.0, 12.0, 4.0, 11.0, 15.0, 32.0, 17.0, 23.0, 34.0, 27.0, 38.0, 30.0, 53.0, 44.0, 45.0, 57.0, 51.0, 57.0, 58.0, 39.0, 52.0, 52.0, 32.0, 36.0, 31.0, 21.0, 23.0, 22.0, 13.0, 17.0, 11.0, 6.0, 4.0, 5.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.45362091064453, -19.716480255126953, -18.979339599609375, -18.242198944091797, -17.50505828857422, -16.767915725708008, -16.03077507019043, -15.293634414672852, -14.556493759155273, -13.819353103637695, -13.082212448120117, -12.345070838928223, -11.607930183410645, -10.870789527893066, -10.133647918701172, -9.396507263183594, -8.659366607666016, -7.9222259521484375, -7.185084819793701, -6.447943687438965, -5.710803031921387, -4.973662376403809, -4.236521244049072, -3.499380111694336, -2.762239456176758, -2.0250985622406006, -1.2879576683044434, -0.5508167743682861, 0.1863241195678711, 0.9234650135040283, 1.6606059074401855, 2.397747039794922, 3.134885787963867, 3.8720266819000244, 4.609167575836182, 5.346308708190918, 6.083449363708496, 6.820590019226074, 7.5577311515808105, 8.294872283935547, 9.032012939453125, 9.769153594970703, 10.506294250488281, 11.243435859680176, 11.980576515197754, 12.717717170715332, 13.454858779907227, 14.191999435424805, 14.929140090942383, 15.666280746459961, 16.40342140197754, 17.140562057495117, 17.877704620361328, 18.614845275878906, 19.351985931396484, 20.089126586914062, 20.82626724243164, 21.56340789794922, 22.300548553466797, 23.037689208984375, 23.774829864501953, 24.511972427368164, 25.249113082885742, 25.98625373840332, 26.7233943939209]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 10.0, 14.0, 21.0, 49.0, 54.0, 71.0, 118.0, 197.0, 636.0, 150955.0, 4041479.0, 522.0, 144.0, 24.0, 1.0, 0.0, 1.0], "bins": [-184.625, -181.39013671875, -178.1552734375, -174.92041015625, -171.685546875, -168.45068359375, -165.2158203125, -161.98095703125, -158.74609375, -155.51123046875, -152.2763671875, -149.04150390625, -145.806640625, -142.57177734375, -139.3369140625, -136.10205078125, -132.8671875, -129.63232421875, -126.3974609375, -123.16259765625, -119.927734375, -116.69287109375, -113.4580078125, -110.22314453125, -106.98828125, -103.75341796875, -100.5185546875, -97.28369140625, -94.048828125, -90.81396484375, -87.5791015625, -84.34423828125, -81.109375, -77.87451171875, -74.6396484375, -71.40478515625, -68.169921875, -64.93505859375, -61.7001953125, -58.46533203125, -55.23046875, -51.99560546875, -48.7607421875, -45.52587890625, -42.291015625, -39.05615234375, -35.8212890625, -32.58642578125, -29.3515625, -26.11669921875, -22.8818359375, -19.64697265625, -16.412109375, -13.17724609375, -9.9423828125, -6.70751953125, -3.47265625, -0.23779296875, 2.9970703125, 6.23193359375, 9.466796875, 12.70166015625, 15.9365234375, 19.17138671875, 22.40625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 60.0, 169.0, 269.0, 260.0, 149.0, 73.0, 17.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.991172790527344, -4.9003143310546875, -4.809455871582031, -4.718597412109375, -4.627738952636719, -4.5368804931640625, -4.446022033691406, -4.35516357421875, -4.264305114746094, -4.1734466552734375, -4.082588195800781, -3.991729736328125, -3.9008712768554688, -3.8100128173828125, -3.7191543579101562, -3.6282958984375, -3.5374374389648438, -3.4465789794921875, -3.3557205200195312, -3.264862060546875, -3.1740036010742188, -3.0831451416015625, -2.9922866821289062, -2.90142822265625, -2.8105697631835938, -2.7197113037109375, -2.6288528442382812, -2.537994384765625, -2.4471359252929688, -2.3562774658203125, -2.2654190063476562, -2.174560546875, -2.0837020874023438, -1.9928436279296875, -1.9019851684570312, -1.811126708984375, -1.7202682495117188, -1.6294097900390625, -1.5385513305664062, -1.44769287109375, -1.3568344116210938, -1.2659759521484375, -1.1751174926757812, -1.084259033203125, -0.9934005737304688, -0.9025421142578125, -0.8116836547851562, -0.7208251953125, -0.6299667358398438, -0.5391082763671875, -0.44824981689453125, -0.357391357421875, -0.26653289794921875, -0.1756744384765625, -0.08481597900390625, 0.00604248046875, 0.09690093994140625, 0.1877593994140625, 0.27861785888671875, 0.369476318359375, 0.46033477783203125, 0.5511932373046875, 0.6420516967773438, 0.73291015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 23.0, 67.0, 144.0, 343.0, 1807.0, 4190411.0, 1075.0, 270.0, 95.0, 48.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.625, -232.2763671875, -226.927734375, -221.5791015625, -216.23046875, -210.8818359375, -205.533203125, -200.1845703125, -194.8359375, -189.4873046875, -184.138671875, -178.7900390625, -173.44140625, -168.0927734375, -162.744140625, -157.3955078125, -152.046875, -146.6982421875, -141.349609375, -136.0009765625, -130.65234375, -125.3037109375, -119.955078125, -114.6064453125, -109.2578125, -103.9091796875, -98.560546875, -93.2119140625, -87.86328125, -82.5146484375, -77.166015625, -71.8173828125, -66.46875, -61.1201171875, -55.771484375, -50.4228515625, -45.07421875, -39.7255859375, -34.376953125, -29.0283203125, -23.6796875, -18.3310546875, -12.982421875, -7.6337890625, -2.28515625, 3.0634765625, 8.412109375, 13.7607421875, 19.109375, 24.4580078125, 29.806640625, 35.1552734375, 40.50390625, 45.8525390625, 51.201171875, 56.5498046875, 61.8984375, 67.2470703125, 72.595703125, 77.9443359375, 83.29296875, 88.6416015625, 93.990234375, 99.3388671875, 104.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 25.0, 212.0, 3219.0, 515.0, 77.0, 18.0, 11.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.9613037109375, -13.617919921875, -13.2745361328125, -12.93115234375, -12.5877685546875, -12.244384765625, -11.9010009765625, -11.5576171875, -11.2142333984375, -10.870849609375, -10.5274658203125, -10.18408203125, -9.8406982421875, -9.497314453125, -9.1539306640625, -8.810546875, -8.4671630859375, -8.123779296875, -7.7803955078125, -7.43701171875, -7.0936279296875, -6.750244140625, -6.4068603515625, -6.0634765625, -5.7200927734375, -5.376708984375, -5.0333251953125, -4.68994140625, -4.3465576171875, -4.003173828125, -3.6597900390625, -3.31640625, -2.9730224609375, -2.629638671875, -2.2862548828125, -1.94287109375, -1.5994873046875, -1.256103515625, -0.9127197265625, -0.5693359375, -0.2259521484375, 0.117431640625, 0.4608154296875, 0.80419921875, 1.1475830078125, 1.490966796875, 1.8343505859375, 2.177734375, 2.5211181640625, 2.864501953125, 3.2078857421875, 3.55126953125, 3.8946533203125, 4.238037109375, 4.5814208984375, 4.9248046875, 5.2681884765625, 5.611572265625, 5.9549560546875, 6.29833984375, 6.6417236328125, 6.985107421875, 7.3284912109375, 7.671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 54.0, 840.0, 104.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.0742492675781, -286.64093017578125, -280.2076110839844, -273.7742919921875, -267.34100341796875, -260.9076843261719, -254.474365234375, -248.04104614257812, -241.6077423095703, -235.17442321777344, -228.74111938476562, -222.30780029296875, -215.87448120117188, -209.44117736816406, -203.0078582763672, -196.57455444335938, -190.1412353515625, -183.70791625976562, -177.2746124267578, -170.84129333496094, -164.40797424316406, -157.97467041015625, -151.54135131835938, -145.1080322265625, -138.67471313476562, -132.24139404296875, -125.8080825805664, -119.37477111816406, -112.94145965576172, -106.50814819335938, -100.0748291015625, -93.64151763916016, -87.20821380615234, -80.77490234375, -74.34158325195312, -67.90827178955078, -61.47496032714844, -55.04164505004883, -48.60832977294922, -42.175018310546875, -35.741703033447266, -29.30838966369629, -22.875076293945312, -16.441761016845703, -10.008447647094727, -3.57513427734375, 2.8581809997558594, 9.291492462158203, 15.724807739257812, 22.15812110900879, 28.591434478759766, 35.024749755859375, 41.45806121826172, 47.89137649536133, 54.32469177246094, 60.75800323486328, 67.19131469726562, 73.62462615966797, 80.05794525146484, 86.49125671386719, 92.92456817626953, 99.35787963867188, 105.79119873046875, 112.2245101928711, 118.65782928466797]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 16.0, 31.0, 45.0, 74.0, 94.0, 136.0, 138.0, 132.0, 111.0, 72.0, 49.0, 52.0, 30.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.27851104736328, -45.7283821105957, -44.17825698852539, -42.62812805175781, -41.0780029296875, -39.52787399291992, -37.97774887084961, -36.42761993408203, -34.87749481201172, -33.32736587524414, -31.777240753173828, -30.227113723754883, -28.676986694335938, -27.126859664916992, -25.576732635498047, -24.02660369873047, -22.476476669311523, -20.926349639892578, -19.376222610473633, -17.826095581054688, -16.275968551635742, -14.725841522216797, -13.175713539123535, -11.62558650970459, -10.075459480285645, -8.5253324508667, -6.975205421447754, -5.42507791519165, -3.874950885772705, -2.3248238563537598, -0.7746963500976562, 0.7754306793212891, 2.3255577087402344, 3.8756847381591797, 5.425811767578125, 6.9759392738342285, 8.526065826416016, 10.076192855834961, 11.626320838928223, 13.176447868347168, 14.726574897766113, 16.276702880859375, 17.82682991027832, 19.376956939697266, 20.92708396911621, 22.477210998535156, 24.0273380279541, 25.577465057373047, 27.127592086791992, 28.677719116210938, 30.227846145629883, 31.777973175048828, 33.328102111816406, 34.87822723388672, 36.4283561706543, 37.97848129272461, 39.52861022949219, 41.078739166259766, 42.62886428833008, 44.178993225097656, 45.72911834716797, 47.27924728393555, 48.82937240600586, 50.37950134277344, 51.92962646484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 7.0, 15.0, 18.0, 21.0, 25.0, 48.0, 48.0, 81.0, 140.0, 348.0, 1136.0, 7087.0, 320621.0, 703729.0, 12805.0, 1531.0, 417.0, 170.0, 68.0, 65.0, 33.0, 31.0, 18.0, 21.0, 13.0, 10.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.59375, -32.54736328125, -31.5009765625, -30.45458984375, -29.408203125, -28.36181640625, -27.3154296875, -26.26904296875, -25.22265625, -24.17626953125, -23.1298828125, -22.08349609375, -21.037109375, -19.99072265625, -18.9443359375, -17.89794921875, -16.8515625, -15.80517578125, -14.7587890625, -13.71240234375, -12.666015625, -11.61962890625, -10.5732421875, -9.52685546875, -8.48046875, -7.43408203125, -6.3876953125, -5.34130859375, -4.294921875, -3.24853515625, -2.2021484375, -1.15576171875, -0.109375, 0.93701171875, 1.9833984375, 3.02978515625, 4.076171875, 5.12255859375, 6.1689453125, 7.21533203125, 8.26171875, 9.30810546875, 10.3544921875, 11.40087890625, 12.447265625, 13.49365234375, 14.5400390625, 15.58642578125, 16.6328125, 17.67919921875, 18.7255859375, 19.77197265625, 20.818359375, 21.86474609375, 22.9111328125, 23.95751953125, 25.00390625, 26.05029296875, 27.0966796875, 28.14306640625, 29.189453125, 30.23583984375, 31.2822265625, 32.32861328125, 33.375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 18.0, 30.0, 79.0, 129.0, 229.0, 226.0, 144.0, 84.0, 38.0, 17.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.655548095703125, -5.52984619140625, -5.404144287109375, -5.2784423828125, -5.152740478515625, -5.02703857421875, -4.901336669921875, -4.775634765625, -4.649932861328125, -4.52423095703125, -4.398529052734375, -4.2728271484375, -4.147125244140625, -4.02142333984375, -3.895721435546875, -3.77001953125, -3.644317626953125, -3.51861572265625, -3.392913818359375, -3.2672119140625, -3.141510009765625, -3.01580810546875, -2.890106201171875, -2.764404296875, -2.638702392578125, -2.51300048828125, -2.387298583984375, -2.2615966796875, -2.135894775390625, -2.01019287109375, -1.884490966796875, -1.7587890625, -1.633087158203125, -1.50738525390625, -1.381683349609375, -1.2559814453125, -1.130279541015625, -1.00457763671875, -0.878875732421875, -0.753173828125, -0.627471923828125, -0.50177001953125, -0.376068115234375, -0.2503662109375, -0.124664306640625, 0.00103759765625, 0.126739501953125, 0.25244140625, 0.378143310546875, 0.50384521484375, 0.629547119140625, 0.7552490234375, 0.880950927734375, 1.00665283203125, 1.132354736328125, 1.258056640625, 1.383758544921875, 1.50946044921875, 1.635162353515625, 1.7608642578125, 1.886566162109375, 2.01226806640625, 2.137969970703125, 2.263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 1.0, 10.0, 9.0, 12.0, 17.0, 17.0, 18.0, 34.0, 43.0, 91.0, 201.0, 1159.0, 14564.0, 613351.0, 408000.0, 9721.0, 875.0, 165.0, 72.0, 42.0, 41.0, 22.0, 11.0, 12.0, 17.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.734375, -22.0224609375, -21.310546875, -20.5986328125, -19.88671875, -19.1748046875, -18.462890625, -17.7509765625, -17.0390625, -16.3271484375, -15.615234375, -14.9033203125, -14.19140625, -13.4794921875, -12.767578125, -12.0556640625, -11.34375, -10.6318359375, -9.919921875, -9.2080078125, -8.49609375, -7.7841796875, -7.072265625, -6.3603515625, -5.6484375, -4.9365234375, -4.224609375, -3.5126953125, -2.80078125, -2.0888671875, -1.376953125, -0.6650390625, 0.046875, 0.7587890625, 1.470703125, 2.1826171875, 2.89453125, 3.6064453125, 4.318359375, 5.0302734375, 5.7421875, 6.4541015625, 7.166015625, 7.8779296875, 8.58984375, 9.3017578125, 10.013671875, 10.7255859375, 11.4375, 12.1494140625, 12.861328125, 13.5732421875, 14.28515625, 14.9970703125, 15.708984375, 16.4208984375, 17.1328125, 17.8447265625, 18.556640625, 19.2685546875, 19.98046875, 20.6923828125, 21.404296875, 22.1162109375, 22.828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 1.0, 9.0, 18.0, 9.0, 14.0, 18.0, 23.0, 28.0, 34.0, 42.0, 37.0, 49.0, 52.0, 60.0, 58.0, 63.0, 60.0, 50.0, 61.0, 57.0, 41.0, 47.0, 28.0, 30.0, 21.0, 16.0, 16.0, 9.0, 12.0, 6.0, 7.0, 3.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.21612548828125, -6.0299072265625, -5.84368896484375, -5.657470703125, -5.47125244140625, -5.2850341796875, -5.09881591796875, -4.91259765625, -4.72637939453125, -4.5401611328125, -4.35394287109375, -4.167724609375, -3.98150634765625, -3.7952880859375, -3.60906982421875, -3.4228515625, -3.23663330078125, -3.0504150390625, -2.86419677734375, -2.677978515625, -2.49176025390625, -2.3055419921875, -2.11932373046875, -1.93310546875, -1.74688720703125, -1.5606689453125, -1.37445068359375, -1.188232421875, -1.00201416015625, -0.8157958984375, -0.62957763671875, -0.443359375, -0.25714111328125, -0.0709228515625, 0.11529541015625, 0.301513671875, 0.48773193359375, 0.6739501953125, 0.86016845703125, 1.04638671875, 1.23260498046875, 1.4188232421875, 1.60504150390625, 1.791259765625, 1.97747802734375, 2.1636962890625, 2.34991455078125, 2.5361328125, 2.72235107421875, 2.9085693359375, 3.09478759765625, 3.281005859375, 3.46722412109375, 3.6534423828125, 3.83966064453125, 4.02587890625, 4.21209716796875, 4.3983154296875, 4.58453369140625, 4.770751953125, 4.95697021484375, 5.1431884765625, 5.32940673828125, 5.515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 14.0, 29.0, 53.0, 68.0, 145.0, 227.0, 449.0, 978.0, 2370.0, 7254.0, 43061.0, 471216.0, 468519.0, 42548.0, 7368.0, 2260.0, 922.0, 459.0, 229.0, 149.0, 70.0, 41.0, 22.0, 15.0, 21.0, 6.0, 6.0, 6.0, 3.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.5859375, -9.25537109375, -8.9248046875, -8.59423828125, -8.263671875, -7.93310546875, -7.6025390625, -7.27197265625, -6.94140625, -6.61083984375, -6.2802734375, -5.94970703125, -5.619140625, -5.28857421875, -4.9580078125, -4.62744140625, -4.296875, -3.96630859375, -3.6357421875, -3.30517578125, -2.974609375, -2.64404296875, -2.3134765625, -1.98291015625, -1.65234375, -1.32177734375, -0.9912109375, -0.66064453125, -0.330078125, 0.00048828125, 0.3310546875, 0.66162109375, 0.9921875, 1.32275390625, 1.6533203125, 1.98388671875, 2.314453125, 2.64501953125, 2.9755859375, 3.30615234375, 3.63671875, 3.96728515625, 4.2978515625, 4.62841796875, 4.958984375, 5.28955078125, 5.6201171875, 5.95068359375, 6.28125, 6.61181640625, 6.9423828125, 7.27294921875, 7.603515625, 7.93408203125, 8.2646484375, 8.59521484375, 8.92578125, 9.25634765625, 9.5869140625, 9.91748046875, 10.248046875, 10.57861328125, 10.9091796875, 11.23974609375, 11.5703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 10.0, 13.0, 20.0, 22.0, 29.0, 27.0, 49.0, 64.0, 70.0, 69.0, 93.0, 89.0, 85.0, 72.0, 50.0, 47.0, 43.0, 32.0, 30.0, 15.0, 10.0, 7.0, 10.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000614166259765625, -0.0005932003259658813, -0.0005722343921661377, -0.000551268458366394, -0.0005303025245666504, -0.0005093365907669067, -0.0004883706569671631, -0.00046740472316741943, -0.0004464387893676758, -0.00042547285556793213, -0.0004045069217681885, -0.0003835409879684448, -0.00036257505416870117, -0.0003416091203689575, -0.00032064318656921387, -0.0002996772527694702, -0.00027871131896972656, -0.0002577453851699829, -0.00023677945137023926, -0.0002158135175704956, -0.00019484758377075195, -0.0001738816499710083, -0.00015291571617126465, -0.000131949782371521, -0.00011098384857177734, -9.001791477203369e-05, -6.905198097229004e-05, -4.808604717254639e-05, -2.7120113372802734e-05, -6.154179573059082e-06, 1.481175422668457e-05, 3.577768802642822e-05, 5.6743621826171875e-05, 7.770955562591553e-05, 9.867548942565918e-05, 0.00011964142322540283, 0.00014060735702514648, 0.00016157329082489014, 0.0001825392246246338, 0.00020350515842437744, 0.0002244710922241211, 0.00024543702602386475, 0.0002664029598236084, 0.00028736889362335205, 0.0003083348274230957, 0.00032930076122283936, 0.000350266695022583, 0.00037123262882232666, 0.0003921985626220703, 0.00041316449642181396, 0.0004341304302215576, 0.00045509636402130127, 0.0004760622978210449, 0.0004970282316207886, 0.0005179941654205322, 0.0005389600992202759, 0.0005599260330200195, 0.0005808919668197632, 0.0006018579006195068, 0.0006228238344192505, 0.0006437897682189941, 0.0006647557020187378, 0.0006857216358184814, 0.0007066875696182251, 0.0007276535034179688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 13.0, 25.0, 36.0, 57.0, 124.0, 313.0, 1820.0, 44004.0, 960436.0, 39313.0, 1773.0, 371.0, 128.0, 50.0, 34.0, 17.0, 12.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.5283203125, -10.869140625, -10.2099609375, -9.55078125, -8.8916015625, -8.232421875, -7.5732421875, -6.9140625, -6.2548828125, -5.595703125, -4.9365234375, -4.27734375, -3.6181640625, -2.958984375, -2.2998046875, -1.640625, -0.9814453125, -0.322265625, 0.3369140625, 0.99609375, 1.6552734375, 2.314453125, 2.9736328125, 3.6328125, 4.2919921875, 4.951171875, 5.6103515625, 6.26953125, 6.9287109375, 7.587890625, 8.2470703125, 8.90625, 9.5654296875, 10.224609375, 10.8837890625, 11.54296875, 12.2021484375, 12.861328125, 13.5205078125, 14.1796875, 14.8388671875, 15.498046875, 16.1572265625, 16.81640625, 17.4755859375, 18.134765625, 18.7939453125, 19.453125, 20.1123046875, 20.771484375, 21.4306640625, 22.08984375, 22.7490234375, 23.408203125, 24.0673828125, 24.7265625, 25.3857421875, 26.044921875, 26.7041015625, 27.36328125, 28.0224609375, 28.681640625, 29.3408203125, 30.0]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 13.0, 22.0, 32.0, 46.0, 71.0, 89.0, 90.0, 128.0, 124.0, 109.0, 84.0, 61.0, 48.0, 21.0, 16.0, 11.0, 12.0, 7.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.04864501953125, -3.8121337890625, -3.57562255859375, -3.339111328125, -3.10260009765625, -2.8660888671875, -2.62957763671875, -2.39306640625, -2.15655517578125, -1.9200439453125, -1.68353271484375, -1.447021484375, -1.21051025390625, -0.9739990234375, -0.73748779296875, -0.5009765625, -0.26446533203125, -0.0279541015625, 0.20855712890625, 0.445068359375, 0.68157958984375, 0.9180908203125, 1.15460205078125, 1.39111328125, 1.62762451171875, 1.8641357421875, 2.10064697265625, 2.337158203125, 2.57366943359375, 2.8101806640625, 3.04669189453125, 3.283203125, 3.51971435546875, 3.7562255859375, 3.99273681640625, 4.229248046875, 4.46575927734375, 4.7022705078125, 4.93878173828125, 5.17529296875, 5.41180419921875, 5.6483154296875, 5.88482666015625, 6.121337890625, 6.35784912109375, 6.5943603515625, 6.83087158203125, 7.0673828125, 7.30389404296875, 7.5404052734375, 7.77691650390625, 8.013427734375, 8.24993896484375, 8.4864501953125, 8.72296142578125, 8.95947265625, 9.19598388671875, 9.4324951171875, 9.66900634765625, 9.905517578125, 10.14202880859375, 10.3785400390625, 10.61505126953125, 10.8515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 39.0, 359.0, 495.0, 88.0, 21.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.4951934814453, -138.8935546875, -132.29190063476562, -125.69026184082031, -119.088623046875, -112.48697662353516, -105.88533020019531, -99.28369140625, -92.68204498291016, -86.08039855957031, -79.478759765625, -72.87711334228516, -66.27546691894531, -59.673828125, -53.072181701660156, -46.47053909301758, -39.868896484375, -33.26725387573242, -26.66560935974121, -20.06396484375, -13.462322235107422, -6.860679626464844, -0.259033203125, 6.342609405517578, 12.944252014160156, 19.545894622802734, 26.147539138793945, 32.749183654785156, 39.350826263427734, 45.95246887207031, 52.554115295410156, 59.155757904052734, 65.75738525390625, 72.3590316772461, 78.9606704711914, 85.56231689453125, 92.16395568847656, 98.7656021118164, 105.36724853515625, 111.96888732910156, 118.5705337524414, 125.17218017578125, 131.77381896972656, 138.37545776367188, 144.97711181640625, 151.57875061035156, 158.18038940429688, 164.78204345703125, 171.38368225097656, 177.98532104492188, 184.58697509765625, 191.18861389160156, 197.79025268554688, 204.39190673828125, 210.99354553222656, 217.59518432617188, 224.19683837890625, 230.79847717285156, 237.40013122558594, 244.00177001953125, 250.60340881347656, 257.2050476074219, 263.80670166015625, 270.4083557128906, 277.0099792480469]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 9.0, 5.0, 14.0, 17.0, 16.0, 31.0, 29.0, 50.0, 42.0, 43.0, 60.0, 49.0, 55.0, 63.0, 59.0, 60.0, 53.0, 64.0, 42.0, 33.0, 32.0, 41.0, 26.0, 24.0, 16.0, 17.0, 12.0, 8.0, 4.0, 11.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.56108856201172, -43.249656677246094, -41.93822479248047, -40.62679672241211, -39.315364837646484, -38.00393295288086, -36.692501068115234, -35.381072998046875, -34.06964111328125, -32.758209228515625, -31.446779251098633, -30.135347366333008, -28.823917388916016, -27.51248550415039, -26.201053619384766, -24.889623641967773, -23.57819175720215, -22.266759872436523, -20.95532989501953, -19.643898010253906, -18.332468032836914, -17.02103614807129, -15.70960521697998, -14.398174285888672, -13.086743354797363, -11.775312423706055, -10.463881492614746, -9.152450561523438, -7.841019153594971, -6.529588222503662, -5.218156814575195, -3.9067258834838867, -2.595294952392578, -1.28386390209198, 0.027567148208618164, 1.3389983177185059, 2.6504292488098145, 3.961860179901123, 5.27329158782959, 6.584722518920898, 7.896153450012207, 9.207584381103516, 10.519015312194824, 11.830446243286133, 13.141878128051758, 14.45330810546875, 15.764739990234375, 17.076171875, 18.387601852416992, 19.699033737182617, 21.01046371459961, 22.321895599365234, 23.633325576782227, 24.94475746154785, 26.256187438964844, 27.56761932373047, 28.879051208496094, 30.19048309326172, 31.50191307067871, 32.8133430480957, 34.12477493286133, 35.43620681762695, 36.74763870239258, 38.05906677246094, 39.37049865722656]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 17.0, 12.0, 25.0, 13.0, 25.0, 39.0, 48.0, 73.0, 114.0, 215.0, 502.0, 1742.0, 16845.0, 4029704.0, 140188.0, 3959.0, 515.0, 123.0, 61.0, 22.0, 8.0, 1.0, 5.0, 3.0, 3.0], "bins": [-68.4375, -67.1400146484375, -65.842529296875, -64.5450439453125, -63.24755859375, -61.9500732421875, -60.652587890625, -59.3551025390625, -58.0576171875, -56.7601318359375, -55.462646484375, -54.1651611328125, -52.86767578125, -51.5701904296875, -50.272705078125, -48.9752197265625, -47.677734375, -46.3802490234375, -45.082763671875, -43.7852783203125, -42.48779296875, -41.1903076171875, -39.892822265625, -38.5953369140625, -37.2978515625, -36.0003662109375, -34.702880859375, -33.4053955078125, -32.10791015625, -30.8104248046875, -29.512939453125, -28.2154541015625, -26.91796875, -25.6204833984375, -24.322998046875, -23.0255126953125, -21.72802734375, -20.4305419921875, -19.133056640625, -17.8355712890625, -16.5380859375, -15.2406005859375, -13.943115234375, -12.6456298828125, -11.34814453125, -10.0506591796875, -8.753173828125, -7.4556884765625, -6.158203125, -4.8607177734375, -3.563232421875, -2.2657470703125, -0.96826171875, 0.3292236328125, 1.626708984375, 2.9241943359375, 4.2216796875, 5.5191650390625, 6.816650390625, 8.1141357421875, 9.41162109375, 10.7091064453125, 12.006591796875, 13.3040771484375, 14.6015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 19.0, 41.0, 72.0, 137.0, 176.0, 193.0, 132.0, 118.0, 53.0, 33.0, 16.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.859375, -5.74713134765625, -5.6348876953125, -5.52264404296875, -5.410400390625, -5.29815673828125, -5.1859130859375, -5.07366943359375, -4.96142578125, -4.84918212890625, -4.7369384765625, -4.62469482421875, -4.512451171875, -4.40020751953125, -4.2879638671875, -4.17572021484375, -4.0634765625, -3.95123291015625, -3.8389892578125, -3.72674560546875, -3.614501953125, -3.50225830078125, -3.3900146484375, -3.27777099609375, -3.16552734375, -3.05328369140625, -2.9410400390625, -2.82879638671875, -2.716552734375, -2.60430908203125, -2.4920654296875, -2.37982177734375, -2.267578125, -2.15533447265625, -2.0430908203125, -1.93084716796875, -1.818603515625, -1.70635986328125, -1.5941162109375, -1.48187255859375, -1.36962890625, -1.25738525390625, -1.1451416015625, -1.03289794921875, -0.920654296875, -0.80841064453125, -0.6961669921875, -0.58392333984375, -0.4716796875, -0.35943603515625, -0.2471923828125, -0.13494873046875, -0.022705078125, 0.08953857421875, 0.2017822265625, 0.31402587890625, 0.42626953125, 0.53851318359375, 0.6507568359375, 0.76300048828125, 0.875244140625, 0.98748779296875, 1.0997314453125, 1.21197509765625, 1.32421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 12.0, 7.0, 40.0, 77.0, 147.0, 573.0, 67876.0, 4124879.0, 484.0, 107.0, 45.0, 27.0, 12.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-256.5, -251.576171875, -246.65234375, -241.728515625, -236.8046875, -231.880859375, -226.95703125, -222.033203125, -217.109375, -212.185546875, -207.26171875, -202.337890625, -197.4140625, -192.490234375, -187.56640625, -182.642578125, -177.71875, -172.794921875, -167.87109375, -162.947265625, -158.0234375, -153.099609375, -148.17578125, -143.251953125, -138.328125, -133.404296875, -128.48046875, -123.556640625, -118.6328125, -113.708984375, -108.78515625, -103.861328125, -98.9375, -94.013671875, -89.08984375, -84.166015625, -79.2421875, -74.318359375, -69.39453125, -64.470703125, -59.546875, -54.623046875, -49.69921875, -44.775390625, -39.8515625, -34.927734375, -30.00390625, -25.080078125, -20.15625, -15.232421875, -10.30859375, -5.384765625, -0.4609375, 4.462890625, 9.38671875, 14.310546875, 19.234375, 24.158203125, 29.08203125, 34.005859375, 38.9296875, 43.853515625, 48.77734375, 53.701171875, 58.625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 53.0, 393.0, 3279.0, 273.0, 57.0, 12.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.546875, -22.140411376953125, -21.73394775390625, -21.327484130859375, -20.9210205078125, -20.514556884765625, -20.10809326171875, -19.701629638671875, -19.295166015625, -18.888702392578125, -18.48223876953125, -18.075775146484375, -17.6693115234375, -17.262847900390625, -16.85638427734375, -16.449920654296875, -16.04345703125, -15.636993408203125, -15.23052978515625, -14.824066162109375, -14.4176025390625, -14.011138916015625, -13.60467529296875, -13.198211669921875, -12.791748046875, -12.385284423828125, -11.97882080078125, -11.572357177734375, -11.1658935546875, -10.759429931640625, -10.35296630859375, -9.946502685546875, -9.5400390625, -9.133575439453125, -8.72711181640625, -8.320648193359375, -7.9141845703125, -7.507720947265625, -7.10125732421875, -6.694793701171875, -6.288330078125, -5.881866455078125, -5.47540283203125, -5.068939208984375, -4.6624755859375, -4.256011962890625, -3.84954833984375, -3.443084716796875, -3.03662109375, -2.630157470703125, -2.22369384765625, -1.817230224609375, -1.4107666015625, -1.004302978515625, -0.59783935546875, -0.191375732421875, 0.215087890625, 0.621551513671875, 1.02801513671875, 1.434478759765625, 1.8409423828125, 2.247406005859375, 2.65386962890625, 3.060333251953125, 3.466796875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 17.0, 88.0, 457.0, 368.0, 54.0, 18.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.15972900390625, -132.16207885742188, -129.1644287109375, -126.16677856445312, -123.16912841796875, -120.1714859008789, -117.17383575439453, -114.17618560791016, -111.17853546142578, -108.1808853149414, -105.18323516845703, -102.18558502197266, -99.18794250488281, -96.19029235839844, -93.19264221191406, -90.19499206542969, -87.19734191894531, -84.19969177246094, -81.20204162597656, -78.20439147949219, -75.20674133300781, -72.20909881591797, -69.2114486694336, -66.21379852294922, -63.216148376464844, -60.21849822998047, -57.220848083496094, -54.223201751708984, -51.22555160522461, -48.227901458740234, -45.230255126953125, -42.23260498046875, -39.234954833984375, -36.2373046875, -33.239654541015625, -30.242008209228516, -27.24435806274414, -24.246707916259766, -21.249059677124023, -18.25141143798828, -15.253761291503906, -12.256112098693848, -9.258462905883789, -6.2608137130737305, -3.263164520263672, -0.2655153274536133, 2.7321338653564453, 5.7297821044921875, 8.727432250976562, 11.725081443786621, 14.72273063659668, 17.720378875732422, 20.718029022216797, 23.715679168701172, 26.713327407836914, 29.710975646972656, 32.70862579345703, 35.706275939941406, 38.70392608642578, 41.70157241821289, 44.699222564697266, 47.69687271118164, 50.69451904296875, 53.692169189453125, 56.6898193359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 12.0, 14.0, 26.0, 40.0, 49.0, 80.0, 90.0, 91.0, 133.0, 98.0, 96.0, 84.0, 58.0, 46.0, 28.0, 23.0, 14.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.33869171142578, -44.961387634277344, -43.584083557128906, -42.20677947998047, -40.82947540283203, -39.452171325683594, -38.074867248535156, -36.69756317138672, -35.32025909423828, -33.942955017089844, -32.565650939941406, -31.18834686279297, -29.81104278564453, -28.433738708496094, -27.056432723999023, -25.679128646850586, -24.301822662353516, -22.924518585205078, -21.54721450805664, -20.169910430908203, -18.792606353759766, -17.415302276611328, -16.037996292114258, -14.66069221496582, -13.283388137817383, -11.906084060668945, -10.528779983520508, -9.151474952697754, -7.774170875549316, -6.396866798400879, -5.019561767578125, -3.6422576904296875, -2.26495361328125, -0.8876492977142334, 0.4896550178527832, 1.866959571838379, 3.2442636489868164, 4.621567726135254, 5.998872756958008, 7.376176834106445, 8.753480911254883, 10.13078498840332, 11.508089065551758, 12.885394096374512, 14.26269817352295, 15.640002250671387, 17.01730728149414, 18.394611358642578, 19.771915435791016, 21.149219512939453, 22.52652359008789, 23.903827667236328, 25.281131744384766, 26.658435821533203, 28.035741806030273, 29.41304588317871, 30.79034996032715, 32.16765594482422, 33.544960021972656, 34.922264099121094, 36.29956817626953, 37.67687225341797, 39.054176330566406, 40.431480407714844, 41.80878448486328]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 3.0, 4.0, 10.0, 8.0, 13.0, 13.0, 30.0, 25.0, 37.0, 51.0, 67.0, 88.0, 122.0, 167.0, 257.0, 535.0, 1063.0, 3000.0, 11058.0, 54365.0, 393284.0, 493631.0, 70983.0, 13361.0, 3527.0, 1268.0, 540.0, 320.0, 187.0, 132.0, 85.0, 66.0, 53.0, 47.0, 29.0, 23.0, 18.0, 15.0, 12.0, 8.0, 15.0, 6.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-15.578125, -15.0924072265625, -14.606689453125, -14.1209716796875, -13.63525390625, -13.1495361328125, -12.663818359375, -12.1781005859375, -11.6923828125, -11.2066650390625, -10.720947265625, -10.2352294921875, -9.74951171875, -9.2637939453125, -8.778076171875, -8.2923583984375, -7.806640625, -7.3209228515625, -6.835205078125, -6.3494873046875, -5.86376953125, -5.3780517578125, -4.892333984375, -4.4066162109375, -3.9208984375, -3.4351806640625, -2.949462890625, -2.4637451171875, -1.97802734375, -1.4923095703125, -1.006591796875, -0.5208740234375, -0.03515625, 0.4505615234375, 0.936279296875, 1.4219970703125, 1.90771484375, 2.3934326171875, 2.879150390625, 3.3648681640625, 3.8505859375, 4.3363037109375, 4.822021484375, 5.3077392578125, 5.79345703125, 6.2791748046875, 6.764892578125, 7.2506103515625, 7.736328125, 8.2220458984375, 8.707763671875, 9.1934814453125, 9.67919921875, 10.1649169921875, 10.650634765625, 11.1363525390625, 11.6220703125, 12.1077880859375, 12.593505859375, 13.0792236328125, 13.56494140625, 14.0506591796875, 14.536376953125, 15.0220947265625, 15.5078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 7.0, 16.0, 28.0, 48.0, 57.0, 79.0, 133.0, 142.0, 135.0, 117.0, 94.0, 64.0, 30.0, 25.0, 12.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.545257568359375, -5.41864013671875, -5.292022705078125, -5.1654052734375, -5.038787841796875, -4.91217041015625, -4.785552978515625, -4.658935546875, -4.532318115234375, -4.40570068359375, -4.279083251953125, -4.1524658203125, -4.025848388671875, -3.89923095703125, -3.772613525390625, -3.64599609375, -3.519378662109375, -3.39276123046875, -3.266143798828125, -3.1395263671875, -3.012908935546875, -2.88629150390625, -2.759674072265625, -2.633056640625, -2.506439208984375, -2.37982177734375, -2.253204345703125, -2.1265869140625, -1.999969482421875, -1.87335205078125, -1.746734619140625, -1.6201171875, -1.493499755859375, -1.36688232421875, -1.240264892578125, -1.1136474609375, -0.987030029296875, -0.86041259765625, -0.733795166015625, -0.607177734375, -0.480560302734375, -0.35394287109375, -0.227325439453125, -0.1007080078125, 0.025909423828125, 0.15252685546875, 0.279144287109375, 0.40576171875, 0.532379150390625, 0.65899658203125, 0.785614013671875, 0.9122314453125, 1.038848876953125, 1.16546630859375, 1.292083740234375, 1.418701171875, 1.545318603515625, 1.67193603515625, 1.798553466796875, 1.9251708984375, 2.051788330078125, 2.17840576171875, 2.305023193359375, 2.431640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 9.0, 17.0, 18.0, 23.0, 24.0, 54.0, 106.0, 252.0, 710.0, 2645.0, 13510.0, 117710.0, 715041.0, 175374.0, 18082.0, 3393.0, 920.0, 312.0, 136.0, 69.0, 42.0, 19.0, 20.0, 13.0, 9.0, 9.0, 8.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3125, -13.82861328125, -13.3447265625, -12.86083984375, -12.376953125, -11.89306640625, -11.4091796875, -10.92529296875, -10.44140625, -9.95751953125, -9.4736328125, -8.98974609375, -8.505859375, -8.02197265625, -7.5380859375, -7.05419921875, -6.5703125, -6.08642578125, -5.6025390625, -5.11865234375, -4.634765625, -4.15087890625, -3.6669921875, -3.18310546875, -2.69921875, -2.21533203125, -1.7314453125, -1.24755859375, -0.763671875, -0.27978515625, 0.2041015625, 0.68798828125, 1.171875, 1.65576171875, 2.1396484375, 2.62353515625, 3.107421875, 3.59130859375, 4.0751953125, 4.55908203125, 5.04296875, 5.52685546875, 6.0107421875, 6.49462890625, 6.978515625, 7.46240234375, 7.9462890625, 8.43017578125, 8.9140625, 9.39794921875, 9.8818359375, 10.36572265625, 10.849609375, 11.33349609375, 11.8173828125, 12.30126953125, 12.78515625, 13.26904296875, 13.7529296875, 14.23681640625, 14.720703125, 15.20458984375, 15.6884765625, 16.17236328125, 16.65625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 10.0, 15.0, 14.0, 16.0, 17.0, 18.0, 23.0, 42.0, 54.0, 73.0, 44.0, 60.0, 49.0, 76.0, 59.0, 66.0, 57.0, 65.0, 54.0, 37.0, 40.0, 23.0, 18.0, 14.0, 10.0, 10.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.4915771484375, -8.201904296875, -7.9122314453125, -7.62255859375, -7.3328857421875, -7.043212890625, -6.7535400390625, -6.4638671875, -6.1741943359375, -5.884521484375, -5.5948486328125, -5.30517578125, -5.0155029296875, -4.725830078125, -4.4361572265625, -4.146484375, -3.8568115234375, -3.567138671875, -3.2774658203125, -2.98779296875, -2.6981201171875, -2.408447265625, -2.1187744140625, -1.8291015625, -1.5394287109375, -1.249755859375, -0.9600830078125, -0.67041015625, -0.3807373046875, -0.091064453125, 0.1986083984375, 0.48828125, 0.7779541015625, 1.067626953125, 1.3572998046875, 1.64697265625, 1.9366455078125, 2.226318359375, 2.5159912109375, 2.8056640625, 3.0953369140625, 3.385009765625, 3.6746826171875, 3.96435546875, 4.2540283203125, 4.543701171875, 4.8333740234375, 5.123046875, 5.4127197265625, 5.702392578125, 5.9920654296875, 6.28173828125, 6.5714111328125, 6.861083984375, 7.1507568359375, 7.4404296875, 7.7301025390625, 8.019775390625, 8.3094482421875, 8.59912109375, 8.8887939453125, 9.178466796875, 9.4681396484375, 9.7578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 0.0, 3.0, 12.0, 14.0, 27.0, 28.0, 27.0, 48.0, 72.0, 93.0, 142.0, 277.0, 557.0, 1352.0, 3501.0, 10250.0, 40839.0, 219478.0, 552424.0, 171966.0, 33263.0, 8779.0, 2960.0, 1194.0, 521.0, 261.0, 144.0, 101.0, 56.0, 38.0, 23.0, 16.0, 21.0, 17.0, 8.0, 8.0, 6.0, 3.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.86968994140625, -4.7042236328125, -4.53875732421875, -4.373291015625, -4.20782470703125, -4.0423583984375, -3.87689208984375, -3.71142578125, -3.54595947265625, -3.3804931640625, -3.21502685546875, -3.049560546875, -2.88409423828125, -2.7186279296875, -2.55316162109375, -2.3876953125, -2.22222900390625, -2.0567626953125, -1.89129638671875, -1.725830078125, -1.56036376953125, -1.3948974609375, -1.22943115234375, -1.06396484375, -0.89849853515625, -0.7330322265625, -0.56756591796875, -0.402099609375, -0.23663330078125, -0.0711669921875, 0.09429931640625, 0.259765625, 0.42523193359375, 0.5906982421875, 0.75616455078125, 0.921630859375, 1.08709716796875, 1.2525634765625, 1.41802978515625, 1.58349609375, 1.74896240234375, 1.9144287109375, 2.07989501953125, 2.245361328125, 2.41082763671875, 2.5762939453125, 2.74176025390625, 2.9072265625, 3.07269287109375, 3.2381591796875, 3.40362548828125, 3.569091796875, 3.73455810546875, 3.9000244140625, 4.06549072265625, 4.23095703125, 4.39642333984375, 4.5618896484375, 4.72735595703125, 4.892822265625, 5.05828857421875, 5.2237548828125, 5.38922119140625, 5.5546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 1.0, 3.0, 3.0, 12.0, 12.0, 11.0, 16.0, 17.0, 21.0, 19.0, 21.0, 29.0, 37.0, 40.0, 55.0, 64.0, 69.0, 75.0, 68.0, 66.0, 56.0, 44.0, 37.0, 40.0, 30.0, 30.0, 14.0, 18.0, 20.0, 8.0, 9.0, 11.0, 5.0, 7.0, 6.0, 1.0, 5.0, 3.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031185150146484375, -0.00029972195625305176, -0.00028759241104125977, -0.0002754628658294678, -0.0002633333206176758, -0.0002512037754058838, -0.0002390742301940918, -0.0002269446849822998, -0.0002148151397705078, -0.00020268559455871582, -0.00019055604934692383, -0.00017842650413513184, -0.00016629695892333984, -0.00015416741371154785, -0.00014203786849975586, -0.00012990832328796387, -0.00011777877807617188, -0.00010564923286437988, -9.351968765258789e-05, -8.13901424407959e-05, -6.92605972290039e-05, -5.7131052017211914e-05, -4.500150680541992e-05, -3.287196159362793e-05, -2.0742416381835938e-05, -8.612871170043945e-06, 3.516674041748047e-06, 1.564621925354004e-05, 2.777576446533203e-05, 3.9905309677124023e-05, 5.2034854888916016e-05, 6.416440010070801e-05, 7.62939453125e-05, 8.842349052429199e-05, 0.00010055303573608398, 0.00011268258094787598, 0.00012481212615966797, 0.00013694167137145996, 0.00014907121658325195, 0.00016120076179504395, 0.00017333030700683594, 0.00018545985221862793, 0.00019758939743041992, 0.00020971894264221191, 0.0002218484878540039, 0.0002339780330657959, 0.0002461075782775879, 0.0002582371234893799, 0.0002703666687011719, 0.00028249621391296387, 0.00029462575912475586, 0.00030675530433654785, 0.00031888484954833984, 0.00033101439476013184, 0.00034314393997192383, 0.0003552734851837158, 0.0003674030303955078, 0.0003795325756072998, 0.0003916621208190918, 0.0004037916660308838, 0.0004159212112426758, 0.0004280507564544678, 0.00044018030166625977, 0.00045230984687805176, 0.00046443939208984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 5.0, 10.0, 13.0, 15.0, 34.0, 54.0, 89.0, 205.0, 398.0, 1183.0, 3998.0, 19094.0, 128961.0, 622038.0, 232759.0, 30992.0, 5957.0, 1625.0, 576.0, 241.0, 108.0, 57.0, 38.0, 25.0, 17.0, 11.0, 4.0, 8.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.11328125, -5.91375732421875, -5.7142333984375, -5.51470947265625, -5.315185546875, -5.11566162109375, -4.9161376953125, -4.71661376953125, -4.51708984375, -4.31756591796875, -4.1180419921875, -3.91851806640625, -3.718994140625, -3.51947021484375, -3.3199462890625, -3.12042236328125, -2.9208984375, -2.72137451171875, -2.5218505859375, -2.32232666015625, -2.122802734375, -1.92327880859375, -1.7237548828125, -1.52423095703125, -1.32470703125, -1.12518310546875, -0.9256591796875, -0.72613525390625, -0.526611328125, -0.32708740234375, -0.1275634765625, 0.07196044921875, 0.271484375, 0.47100830078125, 0.6705322265625, 0.87005615234375, 1.069580078125, 1.26910400390625, 1.4686279296875, 1.66815185546875, 1.86767578125, 2.06719970703125, 2.2667236328125, 2.46624755859375, 2.665771484375, 2.86529541015625, 3.0648193359375, 3.26434326171875, 3.4638671875, 3.66339111328125, 3.8629150390625, 4.06243896484375, 4.261962890625, 4.46148681640625, 4.6610107421875, 4.86053466796875, 5.06005859375, 5.25958251953125, 5.4591064453125, 5.65863037109375, 5.858154296875, 6.05767822265625, 6.2572021484375, 6.45672607421875, 6.65625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 6.0, 14.0, 17.0, 14.0, 20.0, 35.0, 31.0, 45.0, 43.0, 63.0, 57.0, 75.0, 70.0, 76.0, 60.0, 71.0, 42.0, 52.0, 27.0, 28.0, 22.0, 18.0, 20.0, 20.0, 8.0, 8.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.155548095703125, -3.04547119140625, -2.935394287109375, -2.8253173828125, -2.715240478515625, -2.60516357421875, -2.495086669921875, -2.385009765625, -2.274932861328125, -2.16485595703125, -2.054779052734375, -1.9447021484375, -1.834625244140625, -1.72454833984375, -1.614471435546875, -1.50439453125, -1.394317626953125, -1.28424072265625, -1.174163818359375, -1.0640869140625, -0.954010009765625, -0.84393310546875, -0.733856201171875, -0.623779296875, -0.513702392578125, -0.40362548828125, -0.293548583984375, -0.1834716796875, -0.073394775390625, 0.03668212890625, 0.146759033203125, 0.2568359375, 0.366912841796875, 0.47698974609375, 0.587066650390625, 0.6971435546875, 0.807220458984375, 0.91729736328125, 1.027374267578125, 1.137451171875, 1.247528076171875, 1.35760498046875, 1.467681884765625, 1.5777587890625, 1.687835693359375, 1.79791259765625, 1.907989501953125, 2.01806640625, 2.128143310546875, 2.23822021484375, 2.348297119140625, 2.4583740234375, 2.568450927734375, 2.67852783203125, 2.788604736328125, 2.898681640625, 3.008758544921875, 3.11883544921875, 3.228912353515625, 3.3389892578125, 3.449066162109375, 3.55914306640625, 3.669219970703125, 3.779296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 21.0, 33.0, 66.0, 164.0, 249.0, 197.0, 139.0, 69.0, 27.0, 16.0, 5.0, 7.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.71897506713867, -49.09700012207031, -46.47502899169922, -43.85305404663086, -41.231082916259766, -38.609107971191406, -35.98713684082031, -33.36516189575195, -30.743188858032227, -28.1212158203125, -25.499242782592773, -22.877269744873047, -20.255294799804688, -17.633323669433594, -15.011348724365234, -12.389375686645508, -9.767402648925781, -7.145429611206055, -4.52345609664917, -1.9014825820922852, 0.7204904556274414, 3.342463493347168, 5.964437484741211, 8.586410522460938, 11.208383560180664, 13.83035659790039, 16.452329635620117, 19.074302673339844, 21.696277618408203, 24.318248748779297, 26.940223693847656, 29.562196731567383, 32.184165954589844, 34.8061408996582, 37.4281120300293, 40.050086975097656, 42.67205810546875, 45.29403305053711, 47.91600799560547, 50.53797912597656, 53.159950256347656, 55.781925201416016, 58.40389633178711, 61.02587127685547, 63.64784240722656, 66.26981353759766, 68.89179229736328, 71.51376342773438, 74.1357421875, 76.7577133178711, 79.37969207763672, 82.00166320800781, 84.6236343383789, 87.24560546875, 89.86758422851562, 92.48955535888672, 95.11152648925781, 97.7334976196289, 100.35547637939453, 102.97744750976562, 105.59941864013672, 108.22138977050781, 110.84336853027344, 113.46533966064453, 116.08731079101562]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 15.0, 17.0, 25.0, 28.0, 22.0, 22.0, 46.0, 41.0, 41.0, 58.0, 65.0, 50.0, 64.0, 55.0, 60.0, 64.0, 48.0, 50.0, 27.0, 38.0, 31.0, 22.0, 21.0, 11.0, 10.0, 13.0, 8.0, 8.0, 5.0, 5.0, 5.0, 0.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.418251037597656, -49.9041748046875, -48.390098571777344, -46.87602233886719, -45.36194610595703, -43.847869873046875, -42.33379364013672, -40.81971740722656, -39.305641174316406, -37.79156494140625, -36.277488708496094, -34.76341247558594, -33.24933624267578, -31.735260009765625, -30.2211856842041, -28.707109451293945, -27.193035125732422, -25.678958892822266, -24.16488265991211, -22.650806427001953, -21.136730194091797, -19.62265396118164, -18.108579635620117, -16.59450340270996, -15.080427169799805, -13.566350936889648, -12.052274703979492, -10.538199424743652, -9.024123191833496, -7.51004695892334, -5.9959716796875, -4.481895446777344, -2.9678192138671875, -1.4537432193756104, 0.0603327751159668, 1.5744085311889648, 3.088484764099121, 4.602560997009277, 6.116636276245117, 7.630712509155273, 9.14478874206543, 10.658864974975586, 12.172941207885742, 13.687016487121582, 15.201092720031738, 16.715167999267578, 18.229244232177734, 19.74332046508789, 21.257396697998047, 22.771472930908203, 24.28554916381836, 25.799625396728516, 27.313701629638672, 28.827777862548828, 30.34185218811035, 31.855928421020508, 33.37000274658203, 34.88407897949219, 36.398155212402344, 37.9122314453125, 39.426307678222656, 40.94038391113281, 42.45446014404297, 43.968536376953125, 45.48261260986328]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 5.0, 13.0, 15.0, 11.0, 14.0, 17.0, 22.0, 19.0, 23.0, 37.0, 63.0, 91.0, 120.0, 188.0, 347.0, 605.0, 1369.0, 3805.0, 14647.0, 138547.0, 3912498.0, 103855.0, 12670.0, 3173.0, 1167.0, 475.0, 220.0, 103.0, 58.0, 26.0, 25.0, 13.0, 9.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.546875, -26.912841796875, -26.27880859375, -25.644775390625, -25.0107421875, -24.376708984375, -23.74267578125, -23.108642578125, -22.474609375, -21.840576171875, -21.20654296875, -20.572509765625, -19.9384765625, -19.304443359375, -18.67041015625, -18.036376953125, -17.40234375, -16.768310546875, -16.13427734375, -15.500244140625, -14.8662109375, -14.232177734375, -13.59814453125, -12.964111328125, -12.330078125, -11.696044921875, -11.06201171875, -10.427978515625, -9.7939453125, -9.159912109375, -8.52587890625, -7.891845703125, -7.2578125, -6.623779296875, -5.98974609375, -5.355712890625, -4.7216796875, -4.087646484375, -3.45361328125, -2.819580078125, -2.185546875, -1.551513671875, -0.91748046875, -0.283447265625, 0.3505859375, 0.984619140625, 1.61865234375, 2.252685546875, 2.88671875, 3.520751953125, 4.15478515625, 4.788818359375, 5.4228515625, 6.056884765625, 6.69091796875, 7.324951171875, 7.958984375, 8.593017578125, 9.22705078125, 9.861083984375, 10.4951171875, 11.129150390625, 11.76318359375, 12.397216796875, 13.03125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 21.0, 33.0, 44.0, 73.0, 102.0, 126.0, 129.0, 121.0, 119.0, 71.0, 61.0, 39.0, 20.0, 15.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.7890625, -5.6698760986328125, -5.550689697265625, -5.4315032958984375, -5.31231689453125, -5.1931304931640625, -5.073944091796875, -4.9547576904296875, -4.8355712890625, -4.7163848876953125, -4.597198486328125, -4.4780120849609375, -4.35882568359375, -4.2396392822265625, -4.120452880859375, -4.0012664794921875, -3.882080078125, -3.7628936767578125, -3.643707275390625, -3.5245208740234375, -3.40533447265625, -3.2861480712890625, -3.166961669921875, -3.0477752685546875, -2.9285888671875, -2.8094024658203125, -2.690216064453125, -2.5710296630859375, -2.45184326171875, -2.3326568603515625, -2.213470458984375, -2.0942840576171875, -1.97509765625, -1.8559112548828125, -1.736724853515625, -1.6175384521484375, -1.49835205078125, -1.3791656494140625, -1.259979248046875, -1.1407928466796875, -1.0216064453125, -0.9024200439453125, -0.783233642578125, -0.6640472412109375, -0.54486083984375, -0.4256744384765625, -0.306488037109375, -0.1873016357421875, -0.068115234375, 0.0510711669921875, 0.170257568359375, 0.2894439697265625, 0.40863037109375, 0.5278167724609375, 0.647003173828125, 0.7661895751953125, 0.8853759765625, 1.0045623779296875, 1.123748779296875, 1.2429351806640625, 1.36212158203125, 1.4813079833984375, 1.600494384765625, 1.7196807861328125, 1.8388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 6.0, 16.0, 14.0, 21.0, 34.0, 48.0, 75.0, 126.0, 852.0, 4154248.0, 38047.0, 398.0, 129.0, 77.0, 70.0, 57.0, 33.0, 15.0, 15.0, 9.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.40625, -41.19091796875, -37.9755859375, -34.76025390625, -31.544921875, -28.32958984375, -25.1142578125, -21.89892578125, -18.68359375, -15.46826171875, -12.2529296875, -9.03759765625, -5.822265625, -2.60693359375, 0.6083984375, 3.82373046875, 7.0390625, 10.25439453125, 13.4697265625, 16.68505859375, 19.900390625, 23.11572265625, 26.3310546875, 29.54638671875, 32.76171875, 35.97705078125, 39.1923828125, 42.40771484375, 45.623046875, 48.83837890625, 52.0537109375, 55.26904296875, 58.484375, 61.69970703125, 64.9150390625, 68.13037109375, 71.345703125, 74.56103515625, 77.7763671875, 80.99169921875, 84.20703125, 87.42236328125, 90.6376953125, 93.85302734375, 97.068359375, 100.28369140625, 103.4990234375, 106.71435546875, 109.9296875, 113.14501953125, 116.3603515625, 119.57568359375, 122.791015625, 126.00634765625, 129.2216796875, 132.43701171875, 135.65234375, 138.86767578125, 142.0830078125, 145.29833984375, 148.513671875, 151.72900390625, 154.9443359375, 158.15966796875, 161.375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 22.0, 103.0, 1239.0, 2577.0, 113.0, 18.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.42108154296875, -4.9320068359375, -4.44293212890625, -3.953857421875, -3.46478271484375, -2.9757080078125, -2.48663330078125, -1.99755859375, -1.50848388671875, -1.0194091796875, -0.53033447265625, -0.041259765625, 0.44781494140625, 0.9368896484375, 1.42596435546875, 1.9150390625, 2.40411376953125, 2.8931884765625, 3.38226318359375, 3.871337890625, 4.36041259765625, 4.8494873046875, 5.33856201171875, 5.82763671875, 6.31671142578125, 6.8057861328125, 7.29486083984375, 7.783935546875, 8.27301025390625, 8.7620849609375, 9.25115966796875, 9.740234375, 10.22930908203125, 10.7183837890625, 11.20745849609375, 11.696533203125, 12.18560791015625, 12.6746826171875, 13.16375732421875, 13.65283203125, 14.14190673828125, 14.6309814453125, 15.12005615234375, 15.609130859375, 16.09820556640625, 16.5872802734375, 17.07635498046875, 17.5654296875, 18.05450439453125, 18.5435791015625, 19.03265380859375, 19.521728515625, 20.01080322265625, 20.4998779296875, 20.98895263671875, 21.47802734375, 21.96710205078125, 22.4561767578125, 22.94525146484375, 23.434326171875, 23.92340087890625, 24.4124755859375, 24.90155029296875, 25.390625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 46.0, 647.0, 298.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.15765380859375, -138.36203002929688, -133.56642150878906, -128.77081298828125, -123.97518920898438, -119.17957305908203, -114.38395690917969, -109.58834075927734, -104.792724609375, -99.99710845947266, -95.20149230957031, -90.40587615966797, -85.61026000976562, -80.81464385986328, -76.01902770996094, -71.2234115600586, -66.42779541015625, -61.632179260253906, -56.83656311035156, -52.04094696044922, -47.245330810546875, -42.44971466064453, -37.65409851074219, -32.858482360839844, -28.0628662109375, -23.267250061035156, -18.471633911132812, -13.676017761230469, -8.880401611328125, -4.084785461425781, 0.7108306884765625, 5.506446838378906, 10.302047729492188, 15.097663879394531, 19.893280029296875, 24.68889617919922, 29.484512329101562, 34.280128479003906, 39.07574462890625, 43.871360778808594, 48.66697692871094, 53.46259307861328, 58.258209228515625, 63.05382537841797, 67.84944152832031, 72.64505767822266, 77.440673828125, 82.23628997802734, 87.03190612792969, 91.82752227783203, 96.62313842773438, 101.41875457763672, 106.21437072753906, 111.0099868774414, 115.80560302734375, 120.6012191772461, 125.39683532714844, 130.19244384765625, 134.98806762695312, 139.78369140625, 144.5792999267578, 149.37490844726562, 154.1705322265625, 158.96615600585938, 163.7617645263672]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 20.0, 35.0, 77.0, 80.0, 145.0, 144.0, 137.0, 121.0, 97.0, 74.0, 42.0, 16.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.4003791809082, -46.118167877197266, -44.83595657348633, -43.55374526977539, -42.27153396606445, -40.989322662353516, -39.70711135864258, -38.424903869628906, -37.14269256591797, -35.86048126220703, -34.578269958496094, -33.296058654785156, -32.01384735107422, -30.73163604736328, -29.449426651000977, -28.16721534729004, -26.88500213623047, -25.60279083251953, -24.320579528808594, -23.038368225097656, -21.75615692138672, -20.47394561767578, -19.191736221313477, -17.90952491760254, -16.6273136138916, -15.345102310180664, -14.062891006469727, -12.780680656433105, -11.498469352722168, -10.21625804901123, -8.93404769897461, -7.651836395263672, -6.369625091552734, -5.087413787841797, -3.8052029609680176, -2.522991895675659, -1.2407808303833008, 0.04143047332763672, 1.323641300201416, 2.6058521270751953, 3.888063430786133, 5.17027473449707, 6.45248556137085, 7.734696388244629, 9.016907691955566, 10.299118995666504, 11.581329345703125, 12.863540649414062, 14.145751953125, 15.427963256835938, 16.710174560546875, 17.992385864257812, 19.27459716796875, 20.556808471679688, 21.839017868041992, 23.12122917175293, 24.403440475463867, 25.685651779174805, 26.967863082885742, 28.25007438659668, 29.532283782958984, 30.814495086669922, 32.09670639038086, 33.3789176940918, 34.661128997802734]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 14.0, 12.0, 20.0, 23.0, 28.0, 49.0, 81.0, 127.0, 238.0, 491.0, 1326.0, 4822.0, 27101.0, 233247.0, 655575.0, 106671.0, 14152.0, 2946.0, 887.0, 350.0, 149.0, 80.0, 47.0, 36.0, 18.0, 28.0, 10.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.591064453125, -14.05712890625, -13.523193359375, -12.9892578125, -12.455322265625, -11.92138671875, -11.387451171875, -10.853515625, -10.319580078125, -9.78564453125, -9.251708984375, -8.7177734375, -8.183837890625, -7.64990234375, -7.115966796875, -6.58203125, -6.048095703125, -5.51416015625, -4.980224609375, -4.4462890625, -3.912353515625, -3.37841796875, -2.844482421875, -2.310546875, -1.776611328125, -1.24267578125, -0.708740234375, -0.1748046875, 0.359130859375, 0.89306640625, 1.427001953125, 1.9609375, 2.494873046875, 3.02880859375, 3.562744140625, 4.0966796875, 4.630615234375, 5.16455078125, 5.698486328125, 6.232421875, 6.766357421875, 7.30029296875, 7.834228515625, 8.3681640625, 8.902099609375, 9.43603515625, 9.969970703125, 10.50390625, 11.037841796875, 11.57177734375, 12.105712890625, 12.6396484375, 13.173583984375, 13.70751953125, 14.241455078125, 14.775390625, 15.309326171875, 15.84326171875, 16.377197265625, 16.9111328125, 17.445068359375, 17.97900390625, 18.512939453125, 19.046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 19.0, 25.0, 32.0, 56.0, 67.0, 84.0, 108.0, 114.0, 106.0, 115.0, 78.0, 71.0, 44.0, 38.0, 12.0, 12.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.286376953125, -4.18603515625, -4.085693359375, -3.9853515625, -3.885009765625, -3.78466796875, -3.684326171875, -3.583984375, -3.483642578125, -3.38330078125, -3.282958984375, -3.1826171875, -3.082275390625, -2.98193359375, -2.881591796875, -2.78125, -2.680908203125, -2.58056640625, -2.480224609375, -2.3798828125, -2.279541015625, -2.17919921875, -2.078857421875, -1.978515625, -1.878173828125, -1.77783203125, -1.677490234375, -1.5771484375, -1.476806640625, -1.37646484375, -1.276123046875, -1.17578125, -1.075439453125, -0.97509765625, -0.874755859375, -0.7744140625, -0.674072265625, -0.57373046875, -0.473388671875, -0.373046875, -0.272705078125, -0.17236328125, -0.072021484375, 0.0283203125, 0.128662109375, 0.22900390625, 0.329345703125, 0.4296875, 0.530029296875, 0.63037109375, 0.730712890625, 0.8310546875, 0.931396484375, 1.03173828125, 1.132080078125, 1.232421875, 1.332763671875, 1.43310546875, 1.533447265625, 1.6337890625, 1.734130859375, 1.83447265625, 1.934814453125, 2.03515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 6.0, 5.0, 18.0, 20.0, 31.0, 33.0, 59.0, 126.0, 215.0, 470.0, 923.0, 2487.0, 7329.0, 27552.0, 141906.0, 549772.0, 254086.0, 46251.0, 11215.0, 3499.0, 1299.0, 543.0, 290.0, 162.0, 89.0, 53.0, 24.0, 22.0, 17.0, 11.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.7734375, -11.433837890625, -11.09423828125, -10.754638671875, -10.4150390625, -10.075439453125, -9.73583984375, -9.396240234375, -9.056640625, -8.717041015625, -8.37744140625, -8.037841796875, -7.6982421875, -7.358642578125, -7.01904296875, -6.679443359375, -6.33984375, -6.000244140625, -5.66064453125, -5.321044921875, -4.9814453125, -4.641845703125, -4.30224609375, -3.962646484375, -3.623046875, -3.283447265625, -2.94384765625, -2.604248046875, -2.2646484375, -1.925048828125, -1.58544921875, -1.245849609375, -0.90625, -0.566650390625, -0.22705078125, 0.112548828125, 0.4521484375, 0.791748046875, 1.13134765625, 1.470947265625, 1.810546875, 2.150146484375, 2.48974609375, 2.829345703125, 3.1689453125, 3.508544921875, 3.84814453125, 4.187744140625, 4.52734375, 4.866943359375, 5.20654296875, 5.546142578125, 5.8857421875, 6.225341796875, 6.56494140625, 6.904541015625, 7.244140625, 7.583740234375, 7.92333984375, 8.262939453125, 8.6025390625, 8.942138671875, 9.28173828125, 9.621337890625, 9.9609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 17.0, 15.0, 20.0, 25.0, 25.0, 40.0, 48.0, 46.0, 56.0, 70.0, 56.0, 62.0, 77.0, 48.0, 61.0, 52.0, 36.0, 48.0, 36.0, 25.0, 18.0, 17.0, 19.0, 7.0, 6.0, 8.0, 5.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.328125, -9.06463623046875, -8.8011474609375, -8.53765869140625, -8.274169921875, -8.01068115234375, -7.7471923828125, -7.48370361328125, -7.22021484375, -6.95672607421875, -6.6932373046875, -6.42974853515625, -6.166259765625, -5.90277099609375, -5.6392822265625, -5.37579345703125, -5.1123046875, -4.84881591796875, -4.5853271484375, -4.32183837890625, -4.058349609375, -3.79486083984375, -3.5313720703125, -3.26788330078125, -3.00439453125, -2.74090576171875, -2.4774169921875, -2.21392822265625, -1.950439453125, -1.68695068359375, -1.4234619140625, -1.15997314453125, -0.896484375, -0.63299560546875, -0.3695068359375, -0.10601806640625, 0.157470703125, 0.42095947265625, 0.6844482421875, 0.94793701171875, 1.21142578125, 1.47491455078125, 1.7384033203125, 2.00189208984375, 2.265380859375, 2.52886962890625, 2.7923583984375, 3.05584716796875, 3.3193359375, 3.58282470703125, 3.8463134765625, 4.10980224609375, 4.373291015625, 4.63677978515625, 4.9002685546875, 5.16375732421875, 5.42724609375, 5.69073486328125, 5.9542236328125, 6.21771240234375, 6.481201171875, 6.74468994140625, 7.0081787109375, 7.27166748046875, 7.53515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 7.0, 12.0, 15.0, 26.0, 29.0, 40.0, 78.0, 123.0, 182.0, 303.0, 583.0, 1072.0, 2434.0, 5613.0, 17135.0, 70743.0, 374485.0, 452384.0, 90368.0, 20882.0, 6586.0, 2748.0, 1144.0, 623.0, 348.0, 195.0, 128.0, 92.0, 52.0, 47.0, 27.0, 11.0, 12.0, 13.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6796875, -4.51873779296875, -4.3577880859375, -4.19683837890625, -4.035888671875, -3.87493896484375, -3.7139892578125, -3.55303955078125, -3.39208984375, -3.23114013671875, -3.0701904296875, -2.90924072265625, -2.748291015625, -2.58734130859375, -2.4263916015625, -2.26544189453125, -2.1044921875, -1.94354248046875, -1.7825927734375, -1.62164306640625, -1.460693359375, -1.29974365234375, -1.1387939453125, -0.97784423828125, -0.81689453125, -0.65594482421875, -0.4949951171875, -0.33404541015625, -0.173095703125, -0.01214599609375, 0.1488037109375, 0.30975341796875, 0.470703125, 0.63165283203125, 0.7926025390625, 0.95355224609375, 1.114501953125, 1.27545166015625, 1.4364013671875, 1.59735107421875, 1.75830078125, 1.91925048828125, 2.0802001953125, 2.24114990234375, 2.402099609375, 2.56304931640625, 2.7239990234375, 2.88494873046875, 3.0458984375, 3.20684814453125, 3.3677978515625, 3.52874755859375, 3.689697265625, 3.85064697265625, 4.0115966796875, 4.17254638671875, 4.33349609375, 4.49444580078125, 4.6553955078125, 4.81634521484375, 4.977294921875, 5.13824462890625, 5.2991943359375, 5.46014404296875, 5.62109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 13.0, 11.0, 22.0, 15.0, 32.0, 36.0, 53.0, 58.0, 87.0, 98.0, 95.0, 103.0, 81.0, 67.0, 39.0, 55.0, 36.0, 31.0, 15.0, 16.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004343986511230469, -0.0004159584641456604, -0.0003975182771682739, -0.00037907809019088745, -0.000360637903213501, -0.0003421977162361145, -0.00032375752925872803, -0.00030531734228134155, -0.0002868771553039551, -0.0002684369683265686, -0.00024999678134918213, -0.00023155659437179565, -0.00021311640739440918, -0.0001946762204170227, -0.00017623603343963623, -0.00015779584646224976, -0.00013935565948486328, -0.0001209154725074768, -0.00010247528553009033, -8.403509855270386e-05, -6.559491157531738e-05, -4.715472459793091e-05, -2.8714537620544434e-05, -1.0274350643157959e-05, 8.165836334228516e-06, 2.660602331161499e-05, 4.5046210289001465e-05, 6.348639726638794e-05, 8.192658424377441e-05, 0.00010036677122116089, 0.00011880695819854736, 0.00013724714517593384, 0.0001556873321533203, 0.0001741275191307068, 0.00019256770610809326, 0.00021100789308547974, 0.0002294480800628662, 0.0002478882670402527, 0.00026632845401763916, 0.00028476864099502563, 0.0003032088279724121, 0.0003216490149497986, 0.00034008920192718506, 0.00035852938890457153, 0.000376969575881958, 0.0003954097628593445, 0.00041384994983673096, 0.00043229013681411743, 0.0004507303237915039, 0.0004691705107688904, 0.00048761069774627686, 0.0005060508847236633, 0.0005244910717010498, 0.0005429312586784363, 0.0005613714456558228, 0.0005798116326332092, 0.0005982518196105957, 0.0006166920065879822, 0.0006351321935653687, 0.0006535723805427551, 0.0006720125675201416, 0.0006904527544975281, 0.0007088929414749146, 0.000727333128452301, 0.0007457733154296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 3.0, 10.0, 4.0, 16.0, 39.0, 37.0, 83.0, 160.0, 374.0, 966.0, 3058.0, 11675.0, 64872.0, 507067.0, 397793.0, 49235.0, 9160.0, 2433.0, 847.0, 332.0, 153.0, 90.0, 49.0, 28.0, 17.0, 18.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.7064208984375, -6.514404296875, -6.3223876953125, -6.13037109375, -5.9383544921875, -5.746337890625, -5.5543212890625, -5.3623046875, -5.1702880859375, -4.978271484375, -4.7862548828125, -4.59423828125, -4.4022216796875, -4.210205078125, -4.0181884765625, -3.826171875, -3.6341552734375, -3.442138671875, -3.2501220703125, -3.05810546875, -2.8660888671875, -2.674072265625, -2.4820556640625, -2.2900390625, -2.0980224609375, -1.906005859375, -1.7139892578125, -1.52197265625, -1.3299560546875, -1.137939453125, -0.9459228515625, -0.75390625, -0.5618896484375, -0.369873046875, -0.1778564453125, 0.01416015625, 0.2061767578125, 0.398193359375, 0.5902099609375, 0.7822265625, 0.9742431640625, 1.166259765625, 1.3582763671875, 1.55029296875, 1.7423095703125, 1.934326171875, 2.1263427734375, 2.318359375, 2.5103759765625, 2.702392578125, 2.8944091796875, 3.08642578125, 3.2784423828125, 3.470458984375, 3.6624755859375, 3.8544921875, 4.0465087890625, 4.238525390625, 4.4305419921875, 4.62255859375, 4.8145751953125, 5.006591796875, 5.1986083984375, 5.390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 5.0, 10.0, 13.0, 14.0, 16.0, 20.0, 29.0, 47.0, 51.0, 68.0, 91.0, 115.0, 122.0, 93.0, 80.0, 59.0, 46.0, 28.0, 15.0, 15.0, 17.0, 10.0, 9.0, 4.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.4161376953125, -5.265869140625, -5.1156005859375, -4.96533203125, -4.8150634765625, -4.664794921875, -4.5145263671875, -4.3642578125, -4.2139892578125, -4.063720703125, -3.9134521484375, -3.76318359375, -3.6129150390625, -3.462646484375, -3.3123779296875, -3.162109375, -3.0118408203125, -2.861572265625, -2.7113037109375, -2.56103515625, -2.4107666015625, -2.260498046875, -2.1102294921875, -1.9599609375, -1.8096923828125, -1.659423828125, -1.5091552734375, -1.35888671875, -1.2086181640625, -1.058349609375, -0.9080810546875, -0.7578125, -0.6075439453125, -0.457275390625, -0.3070068359375, -0.15673828125, -0.0064697265625, 0.143798828125, 0.2940673828125, 0.4443359375, 0.5946044921875, 0.744873046875, 0.8951416015625, 1.04541015625, 1.1956787109375, 1.345947265625, 1.4962158203125, 1.646484375, 1.7967529296875, 1.947021484375, 2.0972900390625, 2.24755859375, 2.3978271484375, 2.548095703125, 2.6983642578125, 2.8486328125, 2.9989013671875, 3.149169921875, 3.2994384765625, 3.44970703125, 3.5999755859375, 3.750244140625, 3.9005126953125, 4.05078125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 15.0, 20.0, 29.0, 48.0, 66.0, 115.0, 154.0, 135.0, 125.0, 79.0, 60.0, 37.0, 40.0, 20.0, 12.0, 9.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.1981430053711, -73.36457824707031, -71.531005859375, -69.69744110107422, -67.86387634277344, -66.03031158447266, -64.19673919677734, -62.36317443847656, -60.52960968017578, -58.696041107177734, -56.86247634887695, -55.028907775878906, -53.195343017578125, -51.36177444458008, -49.52820587158203, -47.69464111328125, -45.8610725402832, -44.027503967285156, -42.193939208984375, -40.36037063598633, -38.52680587768555, -36.6932373046875, -34.85967254638672, -33.02610397338867, -31.192537307739258, -29.358970642089844, -27.52540397644043, -25.691837310791016, -23.85826873779297, -22.024703979492188, -20.19113540649414, -18.357568740844727, -16.524002075195312, -14.690435409545898, -12.856868743896484, -11.023301124572754, -9.18973445892334, -7.356167793273926, -5.522600173950195, -3.6890335083007812, -1.8554668426513672, -0.021899938583374023, 1.8116669654846191, 3.6452341079711914, 5.4788007736206055, 7.3123674392700195, 9.14593505859375, 10.979501724243164, 12.813068389892578, 14.646635055541992, 16.480201721191406, 18.313770294189453, 20.147335052490234, 21.98090362548828, 23.814470291137695, 25.64803695678711, 27.481603622436523, 29.315170288085938, 31.14873695373535, 32.982303619384766, 34.81587219238281, 36.649436950683594, 38.48300552368164, 40.31657409667969, 42.15013885498047]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 14.0, 11.0, 8.0, 19.0, 19.0, 29.0, 35.0, 41.0, 36.0, 49.0, 50.0, 45.0, 66.0, 61.0, 59.0, 61.0, 61.0, 59.0, 46.0, 35.0, 38.0, 23.0, 22.0, 17.0, 14.0, 15.0, 16.0, 5.0, 17.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.19953155517578, -48.53373718261719, -46.86794662475586, -45.202152252197266, -43.53636169433594, -41.870567321777344, -40.20477294921875, -38.53898239135742, -36.87318801879883, -35.207393646240234, -33.541603088378906, -31.875808715820312, -30.21001625061035, -28.54422378540039, -26.87843132019043, -25.21263885498047, -23.546846389770508, -21.881053924560547, -20.215261459350586, -18.549468994140625, -16.88367462158203, -15.21788215637207, -13.55208969116211, -11.886296272277832, -10.220503807067871, -8.55471134185791, -6.888917922973633, -5.223125457763672, -3.5573325157165527, -1.8915395736694336, -0.22574710845947266, 1.4400463104248047, 3.1058387756347656, 4.771631717681885, 6.437424659729004, 8.103217124938965, 9.769010543823242, 11.434803009033203, 13.100595474243164, 14.766388893127441, 16.43218231201172, 18.09797477722168, 19.76376724243164, 21.429561614990234, 23.095354080200195, 24.761146545410156, 26.426939010620117, 28.092731475830078, 29.75852394104004, 31.42431640625, 33.090110778808594, 34.75590133666992, 36.421695709228516, 38.087486267089844, 39.75328063964844, 41.41907501220703, 43.08486557006836, 44.75065994262695, 46.41645050048828, 48.082244873046875, 49.7480354309082, 51.4138298034668, 53.079620361328125, 54.74541473388672, 56.41120910644531]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 11.0, 4.0, 11.0, 16.0, 19.0, 18.0, 30.0, 28.0, 42.0, 56.0, 73.0, 116.0, 178.0, 356.0, 611.0, 1380.0, 3268.0, 10682.0, 52746.0, 1326667.0, 2718062.0, 63063.0, 11657.0, 3183.0, 1154.0, 447.0, 208.0, 83.0, 50.0, 22.0, 17.0, 5.0, 3.0, 0.0, 3.0, 2.0], "bins": [-26.546875, -25.9942626953125, -25.441650390625, -24.8890380859375, -24.33642578125, -23.7838134765625, -23.231201171875, -22.6785888671875, -22.1259765625, -21.5733642578125, -21.020751953125, -20.4681396484375, -19.91552734375, -19.3629150390625, -18.810302734375, -18.2576904296875, -17.705078125, -17.1524658203125, -16.599853515625, -16.0472412109375, -15.49462890625, -14.9420166015625, -14.389404296875, -13.8367919921875, -13.2841796875, -12.7315673828125, -12.178955078125, -11.6263427734375, -11.07373046875, -10.5211181640625, -9.968505859375, -9.4158935546875, -8.86328125, -8.3106689453125, -7.758056640625, -7.2054443359375, -6.65283203125, -6.1002197265625, -5.547607421875, -4.9949951171875, -4.4423828125, -3.8897705078125, -3.337158203125, -2.7845458984375, -2.23193359375, -1.6793212890625, -1.126708984375, -0.5740966796875, -0.021484375, 0.5311279296875, 1.083740234375, 1.6363525390625, 2.18896484375, 2.7415771484375, 3.294189453125, 3.8468017578125, 4.3994140625, 4.9520263671875, 5.504638671875, 6.0572509765625, 6.60986328125, 7.1624755859375, 7.715087890625, 8.2677001953125, 8.8203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 24.0, 24.0, 30.0, 44.0, 62.0, 85.0, 103.0, 104.0, 104.0, 90.0, 87.0, 86.0, 46.0, 36.0, 26.0, 16.0, 7.0, 10.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.52734375, -4.4328765869140625, -4.338409423828125, -4.2439422607421875, -4.14947509765625, -4.0550079345703125, -3.960540771484375, -3.8660736083984375, -3.7716064453125, -3.6771392822265625, -3.582672119140625, -3.4882049560546875, -3.39373779296875, -3.2992706298828125, -3.204803466796875, -3.1103363037109375, -3.015869140625, -2.9214019775390625, -2.826934814453125, -2.7324676513671875, -2.63800048828125, -2.5435333251953125, -2.449066162109375, -2.3545989990234375, -2.2601318359375, -2.1656646728515625, -2.071197509765625, -1.9767303466796875, -1.88226318359375, -1.7877960205078125, -1.693328857421875, -1.5988616943359375, -1.50439453125, -1.4099273681640625, -1.315460205078125, -1.2209930419921875, -1.12652587890625, -1.0320587158203125, -0.937591552734375, -0.8431243896484375, -0.7486572265625, -0.6541900634765625, -0.559722900390625, -0.4652557373046875, -0.37078857421875, -0.2763214111328125, -0.181854248046875, -0.0873870849609375, 0.007080078125, 0.1015472412109375, 0.196014404296875, 0.2904815673828125, 0.38494873046875, 0.4794158935546875, 0.573883056640625, 0.6683502197265625, 0.7628173828125, 0.8572845458984375, 0.951751708984375, 1.0462188720703125, 1.14068603515625, 1.2351531982421875, 1.329620361328125, 1.4240875244140625, 1.5185546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 16.0, 15.0, 24.0, 37.0, 48.0, 55.0, 59.0, 102.0, 134.0, 250.0, 556.0, 1413.0, 4236.0, 27469.0, 3791518.0, 352387.0, 11714.0, 2452.0, 813.0, 334.0, 202.0, 108.0, 77.0, 65.0, 35.0, 44.0, 23.0, 23.0, 11.0, 8.0, 7.0, 6.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.28125, -31.35400390625, -30.4267578125, -29.49951171875, -28.572265625, -27.64501953125, -26.7177734375, -25.79052734375, -24.86328125, -23.93603515625, -23.0087890625, -22.08154296875, -21.154296875, -20.22705078125, -19.2998046875, -18.37255859375, -17.4453125, -16.51806640625, -15.5908203125, -14.66357421875, -13.736328125, -12.80908203125, -11.8818359375, -10.95458984375, -10.02734375, -9.10009765625, -8.1728515625, -7.24560546875, -6.318359375, -5.39111328125, -4.4638671875, -3.53662109375, -2.609375, -1.68212890625, -0.7548828125, 0.17236328125, 1.099609375, 2.02685546875, 2.9541015625, 3.88134765625, 4.80859375, 5.73583984375, 6.6630859375, 7.59033203125, 8.517578125, 9.44482421875, 10.3720703125, 11.29931640625, 12.2265625, 13.15380859375, 14.0810546875, 15.00830078125, 15.935546875, 16.86279296875, 17.7900390625, 18.71728515625, 19.64453125, 20.57177734375, 21.4990234375, 22.42626953125, 23.353515625, 24.28076171875, 25.2080078125, 26.13525390625, 27.0625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 14.0, 25.0, 64.0, 328.0, 2733.0, 707.0, 125.0, 32.0, 21.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.78125, -15.3125, -14.84375, -14.375, -13.90625, -13.4375, -12.96875, -12.5, -12.03125, -11.5625, -11.09375, -10.625, -10.15625, -9.6875, -9.21875, -8.75, -8.28125, -7.8125, -7.34375, -6.875, -6.40625, -5.9375, -5.46875, -5.0, -4.53125, -4.0625, -3.59375, -3.125, -2.65625, -2.1875, -1.71875, -1.25, -0.78125, -0.3125, 0.15625, 0.625, 1.09375, 1.5625, 2.03125, 2.5, 2.96875, 3.4375, 3.90625, 4.375, 4.84375, 5.3125, 5.78125, 6.25, 6.71875, 7.1875, 7.65625, 8.125, 8.59375, 9.0625, 9.53125, 10.0, 10.46875, 10.9375, 11.40625, 11.875, 12.34375, 12.8125, 13.28125, 13.75]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 20.0, 69.0, 181.0, 331.0, 249.0, 83.0, 38.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.58468627929688, -97.18246459960938, -94.7802505493164, -92.3780288696289, -89.9758071899414, -87.57359313964844, -85.17137145996094, -82.76914978027344, -80.36692810058594, -77.96470642089844, -75.56249237060547, -73.16027069091797, -70.75804901123047, -68.3558349609375, -65.95361328125, -63.5513916015625, -61.14917755126953, -58.7469596862793, -56.3447380065918, -53.94252014160156, -51.54029846191406, -49.13808059692383, -46.735862731933594, -44.333641052246094, -41.93142318725586, -39.529205322265625, -37.126983642578125, -34.72476577758789, -32.322547912597656, -29.920326232910156, -27.518108367919922, -25.115888595581055, -22.713672637939453, -20.311452865600586, -17.90923309326172, -15.507015228271484, -13.104795455932617, -10.70257568359375, -8.3003568649292, -5.898138046264648, -3.4959182739257812, -1.0936989784240723, 1.3085203170776367, 3.7107396125793457, 6.112958908081055, 8.515178680419922, 10.917397499084473, 13.319616317749023, 15.72183609008789, 18.124055862426758, 20.526275634765625, 22.92849349975586, 25.330713272094727, 27.732933044433594, 30.135150909423828, 32.53736877441406, 34.93959045410156, 37.3418083190918, 39.7440299987793, 42.14624786376953, 44.54846954345703, 46.950687408447266, 49.3529052734375, 51.755126953125, 54.157344818115234]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 13.0, 9.0, 19.0, 30.0, 29.0, 53.0, 74.0, 66.0, 86.0, 75.0, 85.0, 67.0, 79.0, 64.0, 59.0, 38.0, 46.0, 32.0, 25.0, 13.0, 10.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.089468002319336, -25.134172439575195, -24.178878784179688, -23.223583221435547, -22.268287658691406, -21.312992095947266, -20.357698440551758, -19.402402877807617, -18.44710922241211, -17.49181365966797, -16.53652000427246, -15.58122444152832, -14.62592887878418, -13.670634269714355, -12.715339660644531, -11.76004409790039, -10.80474853515625, -9.849453926086426, -8.894158363342285, -7.938863754272461, -6.9835686683654785, -6.028273582458496, -5.072978973388672, -4.1176838874816895, -3.162388801574707, -2.2070937156677246, -1.2517988681793213, -0.29650402069091797, 0.6587910652160645, 1.6140861511230469, 2.569380760192871, 3.5246758460998535, 4.479972839355469, 5.435267925262451, 6.390563011169434, 7.345857620239258, 8.301153182983398, 9.256447792053223, 10.211742401123047, 11.167037963867188, 12.122332572937012, 13.077627182006836, 14.032922744750977, 14.9882173538208, 15.943511962890625, 16.898807525634766, 17.854103088378906, 18.809396743774414, 19.764692306518555, 20.719987869262695, 21.675281524658203, 22.630577087402344, 23.585872650146484, 24.541168212890625, 25.496461868286133, 26.451757431030273, 27.40705108642578, 28.362346649169922, 29.31764030456543, 30.27293586730957, 31.22823143005371, 32.18352508544922, 33.13882064819336, 34.0941162109375, 35.04941177368164]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 13.0, 26.0, 29.0, 39.0, 78.0, 106.0, 168.0, 259.0, 504.0, 1047.0, 2344.0, 6670.0, 24377.0, 118188.0, 507518.0, 307120.0, 58768.0, 13739.0, 4149.0, 1606.0, 758.0, 367.0, 238.0, 147.0, 91.0, 55.0, 39.0, 29.0, 20.0, 13.0, 10.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-14.4609375, -14.032958984375, -13.60498046875, -13.177001953125, -12.7490234375, -12.321044921875, -11.89306640625, -11.465087890625, -11.037109375, -10.609130859375, -10.18115234375, -9.753173828125, -9.3251953125, -8.897216796875, -8.46923828125, -8.041259765625, -7.61328125, -7.185302734375, -6.75732421875, -6.329345703125, -5.9013671875, -5.473388671875, -5.04541015625, -4.617431640625, -4.189453125, -3.761474609375, -3.33349609375, -2.905517578125, -2.4775390625, -2.049560546875, -1.62158203125, -1.193603515625, -0.765625, -0.337646484375, 0.09033203125, 0.518310546875, 0.9462890625, 1.374267578125, 1.80224609375, 2.230224609375, 2.658203125, 3.086181640625, 3.51416015625, 3.942138671875, 4.3701171875, 4.798095703125, 5.22607421875, 5.654052734375, 6.08203125, 6.510009765625, 6.93798828125, 7.365966796875, 7.7939453125, 8.221923828125, 8.64990234375, 9.077880859375, 9.505859375, 9.933837890625, 10.36181640625, 10.789794921875, 11.2177734375, 11.645751953125, 12.07373046875, 12.501708984375, 12.9296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 3.0, 3.0, 9.0, 10.0, 15.0, 27.0, 26.0, 46.0, 60.0, 72.0, 72.0, 78.0, 86.0, 95.0, 90.0, 73.0, 60.0, 53.0, 38.0, 29.0, 15.0, 14.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.59765625, -3.518890380859375, -3.44012451171875, -3.361358642578125, -3.2825927734375, -3.203826904296875, -3.12506103515625, -3.046295166015625, -2.967529296875, -2.888763427734375, -2.80999755859375, -2.731231689453125, -2.6524658203125, -2.573699951171875, -2.49493408203125, -2.416168212890625, -2.33740234375, -2.258636474609375, -2.17987060546875, -2.101104736328125, -2.0223388671875, -1.943572998046875, -1.86480712890625, -1.786041259765625, -1.707275390625, -1.628509521484375, -1.54974365234375, -1.470977783203125, -1.3922119140625, -1.313446044921875, -1.23468017578125, -1.155914306640625, -1.0771484375, -0.998382568359375, -0.91961669921875, -0.840850830078125, -0.7620849609375, -0.683319091796875, -0.60455322265625, -0.525787353515625, -0.447021484375, -0.368255615234375, -0.28948974609375, -0.210723876953125, -0.1319580078125, -0.053192138671875, 0.02557373046875, 0.104339599609375, 0.18310546875, 0.261871337890625, 0.34063720703125, 0.419403076171875, 0.4981689453125, 0.576934814453125, 0.65570068359375, 0.734466552734375, 0.813232421875, 0.891998291015625, 0.97076416015625, 1.049530029296875, 1.1282958984375, 1.207061767578125, 1.28582763671875, 1.364593505859375, 1.443359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 18.0, 22.0, 42.0, 49.0, 79.0, 134.0, 187.0, 271.0, 498.0, 861.0, 1532.0, 2753.0, 4985.0, 9779.0, 19088.0, 38756.0, 79312.0, 158933.0, 263147.0, 226759.0, 122000.0, 58998.0, 29038.0, 14477.0, 7618.0, 3929.0, 2178.0, 1233.0, 698.0, 426.0, 258.0, 168.0, 84.0, 85.0, 53.0, 28.0, 16.0, 13.0, 15.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.61761474609375, -3.4774169921875, -3.33721923828125, -3.197021484375, -3.05682373046875, -2.9166259765625, -2.77642822265625, -2.63623046875, -2.49603271484375, -2.3558349609375, -2.21563720703125, -2.075439453125, -1.93524169921875, -1.7950439453125, -1.65484619140625, -1.5146484375, -1.37445068359375, -1.2342529296875, -1.09405517578125, -0.953857421875, -0.81365966796875, -0.6734619140625, -0.53326416015625, -0.39306640625, -0.25286865234375, -0.1126708984375, 0.02752685546875, 0.167724609375, 0.30792236328125, 0.4481201171875, 0.58831787109375, 0.728515625, 0.86871337890625, 1.0089111328125, 1.14910888671875, 1.289306640625, 1.42950439453125, 1.5697021484375, 1.70989990234375, 1.85009765625, 1.99029541015625, 2.1304931640625, 2.27069091796875, 2.410888671875, 2.55108642578125, 2.6912841796875, 2.83148193359375, 2.9716796875, 3.11187744140625, 3.2520751953125, 3.39227294921875, 3.532470703125, 3.67266845703125, 3.8128662109375, 3.95306396484375, 4.09326171875, 4.23345947265625, 4.3736572265625, 4.51385498046875, 4.654052734375, 4.79425048828125, 4.9344482421875, 5.07464599609375, 5.21484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 7.0, 12.0, 10.0, 14.0, 19.0, 20.0, 20.0, 23.0, 35.0, 39.0, 44.0, 33.0, 31.0, 47.0, 47.0, 41.0, 50.0, 53.0, 48.0, 33.0, 30.0, 52.0, 39.0, 55.0, 40.0, 28.0, 27.0, 23.0, 14.0, 19.0, 10.0, 7.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -7.02606201171875, -6.8333740234375, -6.64068603515625, -6.447998046875, -6.25531005859375, -6.0626220703125, -5.86993408203125, -5.67724609375, -5.48455810546875, -5.2918701171875, -5.09918212890625, -4.906494140625, -4.71380615234375, -4.5211181640625, -4.32843017578125, -4.1357421875, -3.94305419921875, -3.7503662109375, -3.55767822265625, -3.364990234375, -3.17230224609375, -2.9796142578125, -2.78692626953125, -2.59423828125, -2.40155029296875, -2.2088623046875, -2.01617431640625, -1.823486328125, -1.63079833984375, -1.4381103515625, -1.24542236328125, -1.052734375, -0.86004638671875, -0.6673583984375, -0.47467041015625, -0.281982421875, -0.08929443359375, 0.1033935546875, 0.29608154296875, 0.48876953125, 0.68145751953125, 0.8741455078125, 1.06683349609375, 1.259521484375, 1.45220947265625, 1.6448974609375, 1.83758544921875, 2.0302734375, 2.22296142578125, 2.4156494140625, 2.60833740234375, 2.801025390625, 2.99371337890625, 3.1864013671875, 3.37908935546875, 3.57177734375, 3.76446533203125, 3.9571533203125, 4.14984130859375, 4.342529296875, 4.53521728515625, 4.7279052734375, 4.92059326171875, 5.11328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 21.0, 19.0, 42.0, 61.0, 94.0, 184.0, 358.0, 677.0, 1447.0, 3330.0, 9434.0, 43040.0, 429562.0, 494363.0, 48893.0, 10330.0, 3639.0, 1550.0, 673.0, 347.0, 191.0, 96.0, 62.0, 35.0, 30.0, 19.0, 12.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -5.9300537109375, -5.672607421875, -5.4151611328125, -5.15771484375, -4.9002685546875, -4.642822265625, -4.3853759765625, -4.1279296875, -3.8704833984375, -3.613037109375, -3.3555908203125, -3.09814453125, -2.8406982421875, -2.583251953125, -2.3258056640625, -2.068359375, -1.8109130859375, -1.553466796875, -1.2960205078125, -1.03857421875, -0.7811279296875, -0.523681640625, -0.2662353515625, -0.0087890625, 0.2486572265625, 0.506103515625, 0.7635498046875, 1.02099609375, 1.2784423828125, 1.535888671875, 1.7933349609375, 2.05078125, 2.3082275390625, 2.565673828125, 2.8231201171875, 3.08056640625, 3.3380126953125, 3.595458984375, 3.8529052734375, 4.1103515625, 4.3677978515625, 4.625244140625, 4.8826904296875, 5.14013671875, 5.3975830078125, 5.655029296875, 5.9124755859375, 6.169921875, 6.4273681640625, 6.684814453125, 6.9422607421875, 7.19970703125, 7.4571533203125, 7.714599609375, 7.9720458984375, 8.2294921875, 8.4869384765625, 8.744384765625, 9.0018310546875, 9.25927734375, 9.5167236328125, 9.774169921875, 10.0316162109375, 10.2890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 10.0, 10.0, 9.0, 17.0, 15.0, 24.0, 47.0, 40.0, 72.0, 93.0, 138.0, 144.0, 104.0, 74.0, 50.0, 41.0, 29.0, 17.0, 17.0, 9.0, 11.0, 9.0, 5.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008540153503417969, -0.0008337311446666718, -0.0008134469389915466, -0.0007931627333164215, -0.0007728785276412964, -0.0007525943219661713, -0.0007323101162910461, -0.000712025910615921, -0.0006917417049407959, -0.0006714574992656708, -0.0006511732935905457, -0.0006308890879154205, -0.0006106048822402954, -0.0005903206765651703, -0.0005700364708900452, -0.00054975226521492, -0.0005294680595397949, -0.0005091838538646698, -0.0004888996481895447, -0.00046861544251441956, -0.00044833123683929443, -0.0004280470311641693, -0.0004077628254890442, -0.00038747861981391907, -0.00036719441413879395, -0.0003469102084636688, -0.0003266260027885437, -0.0003063417971134186, -0.00028605759143829346, -0.00026577338576316833, -0.0002454891800880432, -0.0002252049744129181, -0.00020492076873779297, -0.00018463656306266785, -0.00016435235738754272, -0.0001440681517124176, -0.00012378394603729248, -0.00010349974036216736, -8.321553468704224e-05, -6.293132901191711e-05, -4.264712333679199e-05, -2.236291766166687e-05, -2.078711986541748e-06, 1.8205493688583374e-05, 3.8489699363708496e-05, 5.877390503883362e-05, 7.905811071395874e-05, 9.934231638908386e-05, 0.00011962652206420898, 0.0001399107277393341, 0.00016019493341445923, 0.00018047913908958435, 0.00020076334476470947, 0.0002210475504398346, 0.00024133175611495972, 0.00026161596179008484, 0.00028190016746520996, 0.0003021843731403351, 0.0003224685788154602, 0.00034275278449058533, 0.00036303699016571045, 0.00038332119584083557, 0.0004036054015159607, 0.0004238896071910858, 0.00044417381286621094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 9.0, 9.0, 13.0, 16.0, 27.0, 32.0, 37.0, 55.0, 76.0, 127.0, 256.0, 514.0, 1131.0, 2800.0, 8332.0, 43658.0, 565579.0, 383428.0, 31145.0, 6806.0, 2426.0, 969.0, 457.0, 252.0, 130.0, 81.0, 67.0, 36.0, 18.0, 18.0, 14.0, 16.0, 9.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-11.75, -11.46282958984375, -11.1756591796875, -10.88848876953125, -10.601318359375, -10.31414794921875, -10.0269775390625, -9.73980712890625, -9.45263671875, -9.16546630859375, -8.8782958984375, -8.59112548828125, -8.303955078125, -8.01678466796875, -7.7296142578125, -7.44244384765625, -7.1552734375, -6.86810302734375, -6.5809326171875, -6.29376220703125, -6.006591796875, -5.71942138671875, -5.4322509765625, -5.14508056640625, -4.85791015625, -4.57073974609375, -4.2835693359375, -3.99639892578125, -3.709228515625, -3.42205810546875, -3.1348876953125, -2.84771728515625, -2.560546875, -2.27337646484375, -1.9862060546875, -1.69903564453125, -1.411865234375, -1.12469482421875, -0.8375244140625, -0.55035400390625, -0.26318359375, 0.02398681640625, 0.3111572265625, 0.59832763671875, 0.885498046875, 1.17266845703125, 1.4598388671875, 1.74700927734375, 2.0341796875, 2.32135009765625, 2.6085205078125, 2.89569091796875, 3.182861328125, 3.47003173828125, 3.7572021484375, 4.04437255859375, 4.33154296875, 4.61871337890625, 4.9058837890625, 5.19305419921875, 5.480224609375, 5.76739501953125, 6.0545654296875, 6.34173583984375, 6.62890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 13.0, 14.0, 27.0, 75.0, 171.0, 240.0, 249.0, 105.0, 46.0, 24.0, 7.0, 8.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.29150390625, -8.8642578125, -8.43701171875, -8.009765625, -7.58251953125, -7.1552734375, -6.72802734375, -6.30078125, -5.87353515625, -5.4462890625, -5.01904296875, -4.591796875, -4.16455078125, -3.7373046875, -3.31005859375, -2.8828125, -2.45556640625, -2.0283203125, -1.60107421875, -1.173828125, -0.74658203125, -0.3193359375, 0.10791015625, 0.53515625, 0.96240234375, 1.3896484375, 1.81689453125, 2.244140625, 2.67138671875, 3.0986328125, 3.52587890625, 3.953125, 4.38037109375, 4.8076171875, 5.23486328125, 5.662109375, 6.08935546875, 6.5166015625, 6.94384765625, 7.37109375, 7.79833984375, 8.2255859375, 8.65283203125, 9.080078125, 9.50732421875, 9.9345703125, 10.36181640625, 10.7890625, 11.21630859375, 11.6435546875, 12.07080078125, 12.498046875, 12.92529296875, 13.3525390625, 13.77978515625, 14.20703125, 14.63427734375, 15.0615234375, 15.48876953125, 15.916015625, 16.34326171875, 16.7705078125, 17.19775390625, 17.625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 17.0, 21.0, 36.0, 37.0, 46.0, 91.0, 93.0, 131.0, 99.0, 120.0, 71.0, 65.0, 50.0, 33.0, 22.0, 20.0, 11.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.203887939453125, -39.67637252807617, -38.14885330200195, -36.621337890625, -35.09381866455078, -33.56630325317383, -32.03878402709961, -30.511268615722656, -28.983749389648438, -27.45623207092285, -25.928714752197266, -24.40119743347168, -22.873680114746094, -21.346162796020508, -19.818645477294922, -18.29113006591797, -16.763612747192383, -15.236095428466797, -13.708578109741211, -12.181060791015625, -10.653543472290039, -9.126026153564453, -7.598509788513184, -6.070992469787598, -4.543475151062012, -3.015957832336426, -1.488440752029419, 0.03907632827758789, 1.5665936470031738, 3.0941109657287598, 4.6216278076171875, 6.149145126342773, 7.676662445068359, 9.204179763793945, 10.731697082519531, 12.259214401245117, 13.786731719970703, 15.314249038696289, 16.841766357421875, 18.369281768798828, 19.896800994873047, 21.424318313598633, 22.95183563232422, 24.479352951049805, 26.00687026977539, 27.534387588500977, 29.061904907226562, 30.589420318603516, 32.11693572998047, 33.64445114135742, 35.17197036743164, 36.699485778808594, 38.22700500488281, 39.754520416259766, 41.282039642333984, 42.80955505371094, 44.337074279785156, 45.86458969116211, 47.39210891723633, 48.91962432861328, 50.4471435546875, 51.97465896606445, 53.50217819213867, 55.029693603515625, 56.557212829589844]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 7.0, 9.0, 3.0, 11.0, 12.0, 13.0, 10.0, 16.0, 18.0, 20.0, 26.0, 24.0, 27.0, 32.0, 30.0, 21.0, 38.0, 33.0, 34.0, 37.0, 42.0, 35.0, 44.0, 32.0, 36.0, 34.0, 30.0, 34.0, 38.0, 26.0, 33.0, 22.0, 22.0, 20.0, 22.0, 19.0, 14.0, 14.0, 14.0, 8.0, 6.0, 10.0, 12.0, 1.0, 1.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-33.2794075012207, -32.29589080810547, -31.3123779296875, -30.328861236572266, -29.345346450805664, -28.361831665039062, -27.378314971923828, -26.394800186157227, -25.411285400390625, -24.427770614624023, -23.444255828857422, -22.460739135742188, -21.477224349975586, -20.493709564208984, -19.51019287109375, -18.52667808532715, -17.543163299560547, -16.559648513793945, -15.576132774353027, -14.59261703491211, -13.609102249145508, -12.625587463378906, -11.642071723937988, -10.65855598449707, -9.675041198730469, -8.691526412963867, -7.708010673522949, -6.7244954109191895, -5.74098014831543, -4.75746488571167, -3.77394962310791, -2.7904343605041504, -1.8069190979003906, -0.8234038352966309, 0.1601114273071289, 1.1436266899108887, 2.1271419525146484, 3.110657215118408, 4.094172477722168, 5.077687740325928, 6.0612030029296875, 7.044718265533447, 8.028233528137207, 9.011749267578125, 9.995264053344727, 10.978778839111328, 11.962294578552246, 12.945810317993164, 13.929325103759766, 14.912839889526367, 15.896355628967285, 16.879871368408203, 17.863386154174805, 18.846900939941406, 19.83041763305664, 20.813932418823242, 21.797447204589844, 22.780961990356445, 23.764476776123047, 24.74799346923828, 25.731508255004883, 26.715023040771484, 27.69853973388672, 28.68205451965332, 29.665569305419922]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 6.0, 9.0, 15.0, 14.0, 28.0, 22.0, 32.0, 48.0, 54.0, 75.0, 138.0, 177.0, 304.0, 482.0, 798.0, 1730.0, 4452.0, 13311.0, 55897.0, 2459808.0, 1581691.0, 54282.0, 13242.0, 4363.0, 1656.0, 807.0, 353.0, 188.0, 136.0, 64.0, 36.0, 21.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.109375, -15.71630859375, -15.3232421875, -14.93017578125, -14.537109375, -14.14404296875, -13.7509765625, -13.35791015625, -12.96484375, -12.57177734375, -12.1787109375, -11.78564453125, -11.392578125, -10.99951171875, -10.6064453125, -10.21337890625, -9.8203125, -9.42724609375, -9.0341796875, -8.64111328125, -8.248046875, -7.85498046875, -7.4619140625, -7.06884765625, -6.67578125, -6.28271484375, -5.8896484375, -5.49658203125, -5.103515625, -4.71044921875, -4.3173828125, -3.92431640625, -3.53125, -3.13818359375, -2.7451171875, -2.35205078125, -1.958984375, -1.56591796875, -1.1728515625, -0.77978515625, -0.38671875, 0.00634765625, 0.3994140625, 0.79248046875, 1.185546875, 1.57861328125, 1.9716796875, 2.36474609375, 2.7578125, 3.15087890625, 3.5439453125, 3.93701171875, 4.330078125, 4.72314453125, 5.1162109375, 5.50927734375, 5.90234375, 6.29541015625, 6.6884765625, 7.08154296875, 7.474609375, 7.86767578125, 8.2607421875, 8.65380859375, 9.046875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 10.0, 10.0, 16.0, 21.0, 33.0, 30.0, 46.0, 49.0, 54.0, 68.0, 83.0, 70.0, 76.0, 75.0, 47.0, 58.0, 63.0, 46.0, 38.0, 33.0, 15.0, 11.0, 14.0, 9.0, 7.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.06640625, -2.993255615234375, -2.92010498046875, -2.846954345703125, -2.7738037109375, -2.700653076171875, -2.62750244140625, -2.554351806640625, -2.481201171875, -2.408050537109375, -2.33489990234375, -2.261749267578125, -2.1885986328125, -2.115447998046875, -2.04229736328125, -1.969146728515625, -1.89599609375, -1.822845458984375, -1.74969482421875, -1.676544189453125, -1.6033935546875, -1.530242919921875, -1.45709228515625, -1.383941650390625, -1.310791015625, -1.237640380859375, -1.16448974609375, -1.091339111328125, -1.0181884765625, -0.945037841796875, -0.87188720703125, -0.798736572265625, -0.7255859375, -0.652435302734375, -0.57928466796875, -0.506134033203125, -0.4329833984375, -0.359832763671875, -0.28668212890625, -0.213531494140625, -0.140380859375, -0.067230224609375, 0.00592041015625, 0.079071044921875, 0.1522216796875, 0.225372314453125, 0.29852294921875, 0.371673583984375, 0.44482421875, 0.517974853515625, 0.59112548828125, 0.664276123046875, 0.7374267578125, 0.810577392578125, 0.88372802734375, 0.956878662109375, 1.030029296875, 1.103179931640625, 1.17633056640625, 1.249481201171875, 1.3226318359375, 1.395782470703125, 1.46893310546875, 1.542083740234375, 1.615234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 9.0, 10.0, 16.0, 11.0, 16.0, 31.0, 28.0, 36.0, 31.0, 60.0, 74.0, 78.0, 113.0, 192.0, 404.0, 878.0, 3381.0, 29370.0, 3484344.0, 653971.0, 17020.0, 2405.0, 768.0, 308.0, 187.0, 104.0, 83.0, 71.0, 39.0, 47.0, 46.0, 27.0, 32.0, 16.0, 21.0, 16.0, 12.0, 8.0, 4.0, 5.0, 4.0, 7.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.53125, -20.89599609375, -20.2607421875, -19.62548828125, -18.990234375, -18.35498046875, -17.7197265625, -17.08447265625, -16.44921875, -15.81396484375, -15.1787109375, -14.54345703125, -13.908203125, -13.27294921875, -12.6376953125, -12.00244140625, -11.3671875, -10.73193359375, -10.0966796875, -9.46142578125, -8.826171875, -8.19091796875, -7.5556640625, -6.92041015625, -6.28515625, -5.64990234375, -5.0146484375, -4.37939453125, -3.744140625, -3.10888671875, -2.4736328125, -1.83837890625, -1.203125, -0.56787109375, 0.0673828125, 0.70263671875, 1.337890625, 1.97314453125, 2.6083984375, 3.24365234375, 3.87890625, 4.51416015625, 5.1494140625, 5.78466796875, 6.419921875, 7.05517578125, 7.6904296875, 8.32568359375, 8.9609375, 9.59619140625, 10.2314453125, 10.86669921875, 11.501953125, 12.13720703125, 12.7724609375, 13.40771484375, 14.04296875, 14.67822265625, 15.3134765625, 15.94873046875, 16.583984375, 17.21923828125, 17.8544921875, 18.48974609375, 19.125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 10.0, 11.0, 30.0, 53.0, 92.0, 223.0, 1101.0, 1938.0, 340.0, 123.0, 52.0, 37.0, 27.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0, -2.8248291015625, -2.649658203125, -2.4744873046875, -2.29931640625, -2.1241455078125, -1.948974609375, -1.7738037109375, -1.5986328125, -1.4234619140625, -1.248291015625, -1.0731201171875, -0.89794921875, -0.7227783203125, -0.547607421875, -0.3724365234375, -0.197265625, -0.0220947265625, 0.153076171875, 0.3282470703125, 0.50341796875, 0.6785888671875, 0.853759765625, 1.0289306640625, 1.2041015625, 1.3792724609375, 1.554443359375, 1.7296142578125, 1.90478515625, 2.0799560546875, 2.255126953125, 2.4302978515625, 2.60546875, 2.7806396484375, 2.955810546875, 3.1309814453125, 3.30615234375, 3.4813232421875, 3.656494140625, 3.8316650390625, 4.0068359375, 4.1820068359375, 4.357177734375, 4.5323486328125, 4.70751953125, 4.8826904296875, 5.057861328125, 5.2330322265625, 5.408203125, 5.5833740234375, 5.758544921875, 5.9337158203125, 6.10888671875, 6.2840576171875, 6.459228515625, 6.6343994140625, 6.8095703125, 6.9847412109375, 7.159912109375, 7.3350830078125, 7.51025390625, 7.6854248046875, 7.860595703125, 8.0357666015625, 8.2109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 32.0, 113.0, 314.0, 350.0, 128.0, 34.0, 16.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.416046142578125, -61.4929313659668, -59.5698127746582, -57.646697998046875, -55.72357940673828, -53.80046463012695, -51.877349853515625, -49.95423126220703, -48.0311164855957, -46.108001708984375, -44.18488311767578, -42.26176834106445, -40.338653564453125, -38.41553497314453, -36.4924201965332, -34.569305419921875, -32.64618682861328, -30.72307014465332, -28.79995346069336, -26.87683868408203, -24.95372200012207, -23.03060531616211, -21.10749053955078, -19.18437385559082, -17.26125717163086, -15.338140487670898, -13.415024757385254, -11.49190902709961, -9.568792343139648, -7.6456756591796875, -5.722559928894043, -3.7994441986083984, -1.8763275146484375, 0.046788692474365234, 1.969904899597168, 3.8930211067199707, 5.816137313842773, 7.739253997802734, 9.662369728088379, 11.585485458374023, 13.508602142333984, 15.431718826293945, 17.354835510253906, 19.277950286865234, 21.201066970825195, 23.124183654785156, 25.047298431396484, 26.970415115356445, 28.893531799316406, 30.816648483276367, 32.73976516723633, 34.662879943847656, 36.58599853515625, 38.50911331176758, 40.432228088378906, 42.3553466796875, 44.27846145629883, 46.201576232910156, 48.12469482421875, 50.04780960083008, 51.970924377441406, 53.89404296875, 55.81715774536133, 57.740272521972656, 59.66339111328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 12.0, 16.0, 19.0, 29.0, 27.0, 42.0, 58.0, 63.0, 67.0, 73.0, 73.0, 64.0, 55.0, 63.0, 69.0, 51.0, 42.0, 41.0, 37.0, 25.0, 20.0, 14.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.168455123901367, -17.607484817504883, -17.04651641845703, -16.485546112060547, -15.924575805664062, -15.363605499267578, -14.80263614654541, -14.241666793823242, -13.680696487426758, -13.119726181030273, -12.558756828308105, -11.997787475585938, -11.436817169189453, -10.875846862792969, -10.3148775100708, -9.753908157348633, -9.192937850952148, -8.631967544555664, -8.070998191833496, -7.51002836227417, -6.949058532714844, -6.388088703155518, -5.827118873596191, -5.266149044036865, -4.705179214477539, -4.144209384918213, -3.5832395553588867, -3.0222697257995605, -2.4612998962402344, -1.9003300666809082, -1.339360237121582, -0.7783904075622559, -0.21741867065429688, 0.3435511589050293, 0.9045209884643555, 1.4654908180236816, 2.026460647583008, 2.587430477142334, 3.14840030670166, 3.7093701362609863, 4.2703399658203125, 4.831309795379639, 5.392279624938965, 5.953249454498291, 6.514219284057617, 7.075189113616943, 7.6361589431762695, 8.197128295898438, 8.758098602294922, 9.319068908691406, 9.880038261413574, 10.441007614135742, 11.001977920532227, 11.562948226928711, 12.123917579650879, 12.684886932373047, 13.245857238769531, 13.806827545166016, 14.367796897888184, 14.928766250610352, 15.489736557006836, 16.05070686340332, 16.611675262451172, 17.172645568847656, 17.73361587524414]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 9.0, 15.0, 29.0, 27.0, 67.0, 78.0, 141.0, 201.0, 329.0, 651.0, 1159.0, 2999.0, 7990.0, 26536.0, 101836.0, 380550.0, 382686.0, 102724.0, 26597.0, 8179.0, 2971.0, 1259.0, 619.0, 323.0, 222.0, 124.0, 78.0, 48.0, 19.0, 22.0, 16.0, 15.0, 7.0, 0.0, 12.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.6015625, -13.24365234375, -12.8857421875, -12.52783203125, -12.169921875, -11.81201171875, -11.4541015625, -11.09619140625, -10.73828125, -10.38037109375, -10.0224609375, -9.66455078125, -9.306640625, -8.94873046875, -8.5908203125, -8.23291015625, -7.875, -7.51708984375, -7.1591796875, -6.80126953125, -6.443359375, -6.08544921875, -5.7275390625, -5.36962890625, -5.01171875, -4.65380859375, -4.2958984375, -3.93798828125, -3.580078125, -3.22216796875, -2.8642578125, -2.50634765625, -2.1484375, -1.79052734375, -1.4326171875, -1.07470703125, -0.716796875, -0.35888671875, -0.0009765625, 0.35693359375, 0.71484375, 1.07275390625, 1.4306640625, 1.78857421875, 2.146484375, 2.50439453125, 2.8623046875, 3.22021484375, 3.578125, 3.93603515625, 4.2939453125, 4.65185546875, 5.009765625, 5.36767578125, 5.7255859375, 6.08349609375, 6.44140625, 6.79931640625, 7.1572265625, 7.51513671875, 7.873046875, 8.23095703125, 8.5888671875, 8.94677734375, 9.3046875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 11.0, 14.0, 20.0, 28.0, 35.0, 53.0, 48.0, 48.0, 68.0, 80.0, 76.0, 70.0, 77.0, 68.0, 68.0, 39.0, 54.0, 31.0, 29.0, 25.0, 14.0, 11.0, 13.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.138671875, -3.062103271484375, -2.98553466796875, -2.908966064453125, -2.8323974609375, -2.755828857421875, -2.67926025390625, -2.602691650390625, -2.526123046875, -2.449554443359375, -2.37298583984375, -2.296417236328125, -2.2198486328125, -2.143280029296875, -2.06671142578125, -1.990142822265625, -1.91357421875, -1.837005615234375, -1.76043701171875, -1.683868408203125, -1.6072998046875, -1.530731201171875, -1.45416259765625, -1.377593994140625, -1.301025390625, -1.224456787109375, -1.14788818359375, -1.071319580078125, -0.9947509765625, -0.918182373046875, -0.84161376953125, -0.765045166015625, -0.6884765625, -0.611907958984375, -0.53533935546875, -0.458770751953125, -0.3822021484375, -0.305633544921875, -0.22906494140625, -0.152496337890625, -0.075927734375, 0.000640869140625, 0.07720947265625, 0.153778076171875, 0.2303466796875, 0.306915283203125, 0.38348388671875, 0.460052490234375, 0.53662109375, 0.613189697265625, 0.68975830078125, 0.766326904296875, 0.8428955078125, 0.919464111328125, 0.99603271484375, 1.072601318359375, 1.149169921875, 1.225738525390625, 1.30230712890625, 1.378875732421875, 1.4554443359375, 1.532012939453125, 1.60858154296875, 1.685150146484375, 1.76171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 3.0, 11.0, 13.0, 13.0, 17.0, 25.0, 45.0, 60.0, 54.0, 114.0, 122.0, 195.0, 237.0, 362.0, 619.0, 958.0, 1772.0, 3266.0, 6409.0, 13594.0, 31966.0, 76225.0, 176059.0, 306015.0, 236113.0, 109383.0, 46227.0, 19714.0, 9140.0, 4284.0, 2209.0, 1170.0, 718.0, 445.0, 305.0, 197.0, 116.0, 99.0, 66.0, 64.0, 36.0, 32.0, 19.0, 18.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.42578125, -5.26483154296875, -5.1038818359375, -4.94293212890625, -4.781982421875, -4.62103271484375, -4.4600830078125, -4.29913330078125, -4.13818359375, -3.97723388671875, -3.8162841796875, -3.65533447265625, -3.494384765625, -3.33343505859375, -3.1724853515625, -3.01153564453125, -2.8505859375, -2.68963623046875, -2.5286865234375, -2.36773681640625, -2.206787109375, -2.04583740234375, -1.8848876953125, -1.72393798828125, -1.56298828125, -1.40203857421875, -1.2410888671875, -1.08013916015625, -0.919189453125, -0.75823974609375, -0.5972900390625, -0.43634033203125, -0.275390625, -0.11444091796875, 0.0465087890625, 0.20745849609375, 0.368408203125, 0.52935791015625, 0.6903076171875, 0.85125732421875, 1.01220703125, 1.17315673828125, 1.3341064453125, 1.49505615234375, 1.656005859375, 1.81695556640625, 1.9779052734375, 2.13885498046875, 2.2998046875, 2.46075439453125, 2.6217041015625, 2.78265380859375, 2.943603515625, 3.10455322265625, 3.2655029296875, 3.42645263671875, 3.58740234375, 3.74835205078125, 3.9093017578125, 4.07025146484375, 4.231201171875, 4.39215087890625, 4.5531005859375, 4.71405029296875, 4.875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 8.0, 6.0, 9.0, 14.0, 10.0, 15.0, 26.0, 15.0, 20.0, 23.0, 27.0, 30.0, 26.0, 27.0, 29.0, 46.0, 33.0, 48.0, 44.0, 45.0, 50.0, 32.0, 39.0, 40.0, 35.0, 32.0, 42.0, 26.0, 28.0, 26.0, 24.0, 19.0, 21.0, 14.0, 14.0, 15.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4921875, -6.30755615234375, -6.1229248046875, -5.93829345703125, -5.753662109375, -5.56903076171875, -5.3843994140625, -5.19976806640625, -5.01513671875, -4.83050537109375, -4.6458740234375, -4.46124267578125, -4.276611328125, -4.09197998046875, -3.9073486328125, -3.72271728515625, -3.5380859375, -3.35345458984375, -3.1688232421875, -2.98419189453125, -2.799560546875, -2.61492919921875, -2.4302978515625, -2.24566650390625, -2.06103515625, -1.87640380859375, -1.6917724609375, -1.50714111328125, -1.322509765625, -1.13787841796875, -0.9532470703125, -0.76861572265625, -0.583984375, -0.39935302734375, -0.2147216796875, -0.03009033203125, 0.154541015625, 0.33917236328125, 0.5238037109375, 0.70843505859375, 0.89306640625, 1.07769775390625, 1.2623291015625, 1.44696044921875, 1.631591796875, 1.81622314453125, 2.0008544921875, 2.18548583984375, 2.3701171875, 2.55474853515625, 2.7393798828125, 2.92401123046875, 3.108642578125, 3.29327392578125, 3.4779052734375, 3.66253662109375, 3.84716796875, 4.03179931640625, 4.2164306640625, 4.40106201171875, 4.585693359375, 4.77032470703125, 4.9549560546875, 5.13958740234375, 5.32421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 11.0, 9.0, 11.0, 14.0, 17.0, 26.0, 51.0, 52.0, 81.0, 235.0, 772.0, 3483.0, 29679.0, 618373.0, 373354.0, 18852.0, 2503.0, 523.0, 193.0, 84.0, 47.0, 38.0, 30.0, 28.0, 26.0, 13.0, 14.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5625, -10.2314453125, -9.900390625, -9.5693359375, -9.23828125, -8.9072265625, -8.576171875, -8.2451171875, -7.9140625, -7.5830078125, -7.251953125, -6.9208984375, -6.58984375, -6.2587890625, -5.927734375, -5.5966796875, -5.265625, -4.9345703125, -4.603515625, -4.2724609375, -3.94140625, -3.6103515625, -3.279296875, -2.9482421875, -2.6171875, -2.2861328125, -1.955078125, -1.6240234375, -1.29296875, -0.9619140625, -0.630859375, -0.2998046875, 0.03125, 0.3623046875, 0.693359375, 1.0244140625, 1.35546875, 1.6865234375, 2.017578125, 2.3486328125, 2.6796875, 3.0107421875, 3.341796875, 3.6728515625, 4.00390625, 4.3349609375, 4.666015625, 4.9970703125, 5.328125, 5.6591796875, 5.990234375, 6.3212890625, 6.65234375, 6.9833984375, 7.314453125, 7.6455078125, 7.9765625, 8.3076171875, 8.638671875, 8.9697265625, 9.30078125, 9.6318359375, 9.962890625, 10.2939453125, 10.625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 9.0, 16.0, 23.0, 33.0, 44.0, 60.0, 72.0, 93.0, 125.0, 141.0, 93.0, 75.0, 57.0, 46.0, 25.0, 20.0, 15.0, 6.0, 10.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005350112915039062, -0.0005117207765579224, -0.0004884302616119385, -0.0004651397466659546, -0.0004418492317199707, -0.0004185587167739868, -0.00039526820182800293, -0.00037197768688201904, -0.00034868717193603516, -0.00032539665699005127, -0.0003021061420440674, -0.0002788156270980835, -0.0002555251121520996, -0.00023223459720611572, -0.00020894408226013184, -0.00018565356731414795, -0.00016236305236816406, -0.00013907253742218018, -0.00011578202247619629, -9.24915075302124e-05, -6.920099258422852e-05, -4.591047763824463e-05, -2.2619962692260742e-05, 6.705522537231445e-07, 2.396106719970703e-05, 4.725158214569092e-05, 7.05420970916748e-05, 9.383261203765869e-05, 0.00011712312698364258, 0.00014041364192962646, 0.00016370415687561035, 0.00018699467182159424, 0.00021028518676757812, 0.000233575701713562, 0.0002568662166595459, 0.0002801567316055298, 0.00030344724655151367, 0.00032673776149749756, 0.00035002827644348145, 0.00037331879138946533, 0.0003966093063354492, 0.0004198998212814331, 0.000443190336227417, 0.0004664808511734009, 0.0004897713661193848, 0.0005130618810653687, 0.0005363523960113525, 0.0005596429109573364, 0.0005829334259033203, 0.0006062239408493042, 0.0006295144557952881, 0.000652804970741272, 0.0006760954856872559, 0.0006993860006332397, 0.0007226765155792236, 0.0007459670305252075, 0.0007692575454711914, 0.0007925480604171753, 0.0008158385753631592, 0.0008391290903091431, 0.000862419605255127, 0.0008857101202011108, 0.0009090006351470947, 0.0009322911500930786, 0.0009555816650390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 17.0, 11.0, 17.0, 21.0, 34.0, 45.0, 70.0, 94.0, 211.0, 330.0, 625.0, 1210.0, 2753.0, 7040.0, 20416.0, 71723.0, 331182.0, 460989.0, 107404.0, 28211.0, 9398.0, 3541.0, 1504.0, 721.0, 389.0, 211.0, 128.0, 96.0, 45.0, 35.0, 25.0, 14.0, 11.0, 10.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.83203125, -4.68621826171875, -4.5404052734375, -4.39459228515625, -4.248779296875, -4.10296630859375, -3.9571533203125, -3.81134033203125, -3.66552734375, -3.51971435546875, -3.3739013671875, -3.22808837890625, -3.082275390625, -2.93646240234375, -2.7906494140625, -2.64483642578125, -2.4990234375, -2.35321044921875, -2.2073974609375, -2.06158447265625, -1.915771484375, -1.76995849609375, -1.6241455078125, -1.47833251953125, -1.33251953125, -1.18670654296875, -1.0408935546875, -0.89508056640625, -0.749267578125, -0.60345458984375, -0.4576416015625, -0.31182861328125, -0.166015625, -0.02020263671875, 0.1256103515625, 0.27142333984375, 0.417236328125, 0.56304931640625, 0.7088623046875, 0.85467529296875, 1.00048828125, 1.14630126953125, 1.2921142578125, 1.43792724609375, 1.583740234375, 1.72955322265625, 1.8753662109375, 2.02117919921875, 2.1669921875, 2.31280517578125, 2.4586181640625, 2.60443115234375, 2.750244140625, 2.89605712890625, 3.0418701171875, 3.18768310546875, 3.33349609375, 3.47930908203125, 3.6251220703125, 3.77093505859375, 3.916748046875, 4.06256103515625, 4.2083740234375, 4.35418701171875, 4.5]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 12.0, 18.0, 14.0, 23.0, 36.0, 45.0, 46.0, 82.0, 83.0, 107.0, 97.0, 100.0, 80.0, 59.0, 43.0, 35.0, 17.0, 22.0, 17.0, 12.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.625, -6.466827392578125, -6.30865478515625, -6.150482177734375, -5.9923095703125, -5.834136962890625, -5.67596435546875, -5.517791748046875, -5.359619140625, -5.201446533203125, -5.04327392578125, -4.885101318359375, -4.7269287109375, -4.568756103515625, -4.41058349609375, -4.252410888671875, -4.09423828125, -3.936065673828125, -3.77789306640625, -3.619720458984375, -3.4615478515625, -3.303375244140625, -3.14520263671875, -2.987030029296875, -2.828857421875, -2.670684814453125, -2.51251220703125, -2.354339599609375, -2.1961669921875, -2.037994384765625, -1.87982177734375, -1.721649169921875, -1.5634765625, -1.405303955078125, -1.24713134765625, -1.088958740234375, -0.9307861328125, -0.772613525390625, -0.61444091796875, -0.456268310546875, -0.298095703125, -0.139923095703125, 0.01824951171875, 0.176422119140625, 0.3345947265625, 0.492767333984375, 0.65093994140625, 0.809112548828125, 0.96728515625, 1.125457763671875, 1.28363037109375, 1.441802978515625, 1.5999755859375, 1.758148193359375, 1.91632080078125, 2.074493408203125, 2.232666015625, 2.390838623046875, 2.54901123046875, 2.707183837890625, 2.8653564453125, 3.023529052734375, 3.18170166015625, 3.339874267578125, 3.498046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 9.0, 13.0, 27.0, 48.0, 67.0, 129.0, 151.0, 163.0, 153.0, 118.0, 55.0, 33.0, 10.0, 10.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-79.2953109741211, -77.04991149902344, -74.80451202392578, -72.55911254882812, -70.31371307373047, -68.06831359863281, -65.82291412353516, -63.5775146484375, -61.332115173339844, -59.08671569824219, -56.84131622314453, -54.595916748046875, -52.35051727294922, -50.10511779785156, -47.859718322753906, -45.61431884765625, -43.368919372558594, -41.12351989746094, -38.87812042236328, -36.632720947265625, -34.38732147216797, -32.14192199707031, -29.896522521972656, -27.651123046875, -25.405723571777344, -23.160324096679688, -20.91492462158203, -18.669525146484375, -16.42412567138672, -14.178726196289062, -11.933326721191406, -9.68792724609375, -7.4425201416015625, -5.197120666503906, -2.95172119140625, -0.7063217163085938, 1.5390777587890625, 3.7844772338867188, 6.029876708984375, 8.275276184082031, 10.520675659179688, 12.766075134277344, 15.011474609375, 17.256874084472656, 19.502273559570312, 21.74767303466797, 23.993072509765625, 26.23847198486328, 28.483871459960938, 30.729270935058594, 32.97467041015625, 35.220069885253906, 37.46546936035156, 39.71086883544922, 41.956268310546875, 44.20166778564453, 46.44706726074219, 48.692466735839844, 50.9378662109375, 53.183265686035156, 55.42866516113281, 57.67406463623047, 59.919464111328125, 62.16486358642578, 64.41026306152344]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 3.0, 9.0, 7.0, 15.0, 9.0, 9.0, 11.0, 27.0, 21.0, 36.0, 33.0, 34.0, 39.0, 40.0, 49.0, 42.0, 51.0, 52.0, 42.0, 40.0, 51.0, 43.0, 49.0, 41.0, 32.0, 25.0, 23.0, 28.0, 20.0, 25.0, 8.0, 14.0, 20.0, 12.0, 9.0, 5.0, 9.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.67726135253906, -34.480857849121094, -33.284454345703125, -32.08805465698242, -30.891651153564453, -29.695247650146484, -28.49884605407715, -27.302444458007812, -26.106040954589844, -24.909637451171875, -23.71323585510254, -22.516834259033203, -21.320430755615234, -20.124027252197266, -18.92762565612793, -17.731224060058594, -16.534820556640625, -15.338418006896973, -14.14201545715332, -12.945612907409668, -11.749210357666016, -10.552807807922363, -9.356405258178711, -8.160002708435059, -6.963600158691406, -5.767197608947754, -4.570795059204102, -3.374392509460449, -2.177989959716797, -0.9815874099731445, 0.2148151397705078, 1.4112176895141602, 2.607624053955078, 3.8040266036987305, 5.000429153442383, 6.196831703186035, 7.3932342529296875, 8.58963680267334, 9.786039352416992, 10.982441902160645, 12.178844451904297, 13.37524700164795, 14.571649551391602, 15.768052101135254, 16.964454650878906, 18.160858154296875, 19.35725975036621, 20.553661346435547, 21.750064849853516, 22.946468353271484, 24.14286994934082, 25.339271545410156, 26.535675048828125, 27.732078552246094, 28.92848014831543, 30.124881744384766, 31.321285247802734, 32.5176887512207, 33.714088439941406, 34.910491943359375, 36.106895446777344, 37.30329895019531, 38.49970245361328, 39.696102142333984, 40.89250564575195]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 14.0, 24.0, 23.0, 35.0, 42.0, 62.0, 80.0, 101.0, 139.0, 204.0, 380.0, 569.0, 1106.0, 2186.0, 4545.0, 11193.0, 33560.0, 172385.0, 3643209.0, 259693.0, 41064.0, 13209.0, 5385.0, 2346.0, 1173.0, 600.0, 335.0, 200.0, 126.0, 79.0, 57.0, 32.0, 22.0, 23.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.953125, -13.5914306640625, -13.229736328125, -12.8680419921875, -12.50634765625, -12.1446533203125, -11.782958984375, -11.4212646484375, -11.0595703125, -10.6978759765625, -10.336181640625, -9.9744873046875, -9.61279296875, -9.2510986328125, -8.889404296875, -8.5277099609375, -8.166015625, -7.8043212890625, -7.442626953125, -7.0809326171875, -6.71923828125, -6.3575439453125, -5.995849609375, -5.6341552734375, -5.2724609375, -4.9107666015625, -4.549072265625, -4.1873779296875, -3.82568359375, -3.4639892578125, -3.102294921875, -2.7406005859375, -2.37890625, -2.0172119140625, -1.655517578125, -1.2938232421875, -0.93212890625, -0.5704345703125, -0.208740234375, 0.1529541015625, 0.5146484375, 0.8763427734375, 1.238037109375, 1.5997314453125, 1.96142578125, 2.3231201171875, 2.684814453125, 3.0465087890625, 3.408203125, 3.7698974609375, 4.131591796875, 4.4932861328125, 4.85498046875, 5.2166748046875, 5.578369140625, 5.9400634765625, 6.3017578125, 6.6634521484375, 7.025146484375, 7.3868408203125, 7.74853515625, 8.1102294921875, 8.471923828125, 8.8336181640625, 9.1953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 9.0, 2.0, 9.0, 14.0, 15.0, 12.0, 16.0, 18.0, 27.0, 29.0, 29.0, 38.0, 50.0, 49.0, 57.0, 59.0, 64.0, 55.0, 51.0, 47.0, 60.0, 50.0, 35.0, 37.0, 29.0, 29.0, 17.0, 25.0, 22.0, 12.0, 13.0, 6.0, 11.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.197265625, -2.134765625, -2.072265625, -2.009765625, -1.947265625, -1.884765625, -1.822265625, -1.759765625, -1.697265625, -1.634765625, -1.572265625, -1.509765625, -1.447265625, -1.384765625, -1.322265625, -1.259765625, -1.197265625, -1.134765625, -1.072265625, -1.009765625, -0.947265625, -0.884765625, -0.822265625, -0.759765625, -0.697265625, -0.634765625, -0.572265625, -0.509765625, -0.447265625, -0.384765625, -0.322265625, -0.259765625, -0.197265625, -0.134765625, -0.072265625, -0.009765625, 0.052734375, 0.115234375, 0.177734375, 0.240234375, 0.302734375, 0.365234375, 0.427734375, 0.490234375, 0.552734375, 0.615234375, 0.677734375, 0.740234375, 0.802734375, 0.865234375, 0.927734375, 0.990234375, 1.052734375, 1.115234375, 1.177734375, 1.240234375, 1.302734375, 1.365234375, 1.427734375, 1.490234375, 1.552734375, 1.615234375, 1.677734375, 1.740234375, 1.802734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 9.0, 21.0, 29.0, 33.0, 34.0, 55.0, 98.0, 152.0, 294.0, 801.0, 2672.0, 12172.0, 99499.0, 3738967.0, 308942.0, 23842.0, 4505.0, 1199.0, 396.0, 180.0, 106.0, 70.0, 53.0, 44.0, 23.0, 17.0, 9.0, 13.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.109375, -17.6287841796875, -17.148193359375, -16.6676025390625, -16.18701171875, -15.7064208984375, -15.225830078125, -14.7452392578125, -14.2646484375, -13.7840576171875, -13.303466796875, -12.8228759765625, -12.34228515625, -11.8616943359375, -11.381103515625, -10.9005126953125, -10.419921875, -9.9393310546875, -9.458740234375, -8.9781494140625, -8.49755859375, -8.0169677734375, -7.536376953125, -7.0557861328125, -6.5751953125, -6.0946044921875, -5.614013671875, -5.1334228515625, -4.65283203125, -4.1722412109375, -3.691650390625, -3.2110595703125, -2.73046875, -2.2498779296875, -1.769287109375, -1.2886962890625, -0.80810546875, -0.3275146484375, 0.153076171875, 0.6336669921875, 1.1142578125, 1.5948486328125, 2.075439453125, 2.5560302734375, 3.03662109375, 3.5172119140625, 3.997802734375, 4.4783935546875, 4.958984375, 5.4395751953125, 5.920166015625, 6.4007568359375, 6.88134765625, 7.3619384765625, 7.842529296875, 8.3231201171875, 8.8037109375, 9.2843017578125, 9.764892578125, 10.2454833984375, 10.72607421875, 11.2066650390625, 11.687255859375, 12.1678466796875, 12.6484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 7.0, 9.0, 14.0, 26.0, 52.0, 72.0, 131.0, 294.0, 1102.0, 1569.0, 388.0, 160.0, 89.0, 49.0, 40.0, 18.0, 16.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.779296875, -3.608306884765625, -3.43731689453125, -3.266326904296875, -3.0953369140625, -2.924346923828125, -2.75335693359375, -2.582366943359375, -2.411376953125, -2.240386962890625, -2.06939697265625, -1.898406982421875, -1.7274169921875, -1.556427001953125, -1.38543701171875, -1.214447021484375, -1.04345703125, -0.872467041015625, -0.70147705078125, -0.530487060546875, -0.3594970703125, -0.188507080078125, -0.01751708984375, 0.153472900390625, 0.324462890625, 0.495452880859375, 0.66644287109375, 0.837432861328125, 1.0084228515625, 1.179412841796875, 1.35040283203125, 1.521392822265625, 1.6923828125, 1.863372802734375, 2.03436279296875, 2.205352783203125, 2.3763427734375, 2.547332763671875, 2.71832275390625, 2.889312744140625, 3.060302734375, 3.231292724609375, 3.40228271484375, 3.573272705078125, 3.7442626953125, 3.915252685546875, 4.08624267578125, 4.257232666015625, 4.42822265625, 4.599212646484375, 4.77020263671875, 4.941192626953125, 5.1121826171875, 5.283172607421875, 5.45416259765625, 5.625152587890625, 5.796142578125, 5.967132568359375, 6.13812255859375, 6.309112548828125, 6.4801025390625, 6.651092529296875, 6.82208251953125, 6.993072509765625, 7.1640625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 13.0, 17.0, 37.0, 59.0, 96.0, 123.0, 163.0, 150.0, 113.0, 83.0, 62.0, 29.0, 16.0, 13.0, 9.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.84695816040039, -31.923946380615234, -31.000934600830078, -30.07792091369629, -29.154909133911133, -28.231897354125977, -27.30888557434082, -26.38587188720703, -25.462860107421875, -24.53984832763672, -23.616836547851562, -22.693822860717773, -21.770811080932617, -20.84779930114746, -19.924787521362305, -19.001773834228516, -18.07876205444336, -17.155750274658203, -16.232738494873047, -15.309725761413574, -14.386713027954102, -13.463701248168945, -12.540689468383789, -11.617676734924316, -10.694665908813477, -9.77165412902832, -8.848641395568848, -7.925629615783691, -7.002616882324219, -6.0796051025390625, -5.156592845916748, -4.233580589294434, -3.310567855834961, -2.3875555992126465, -1.4645434617996216, -0.5415313243865967, 0.3814809322357178, 1.3044929504394531, 2.2275052070617676, 3.150517463684082, 4.0735297203063965, 4.996541976928711, 5.919554233551025, 6.84256649017334, 7.765578269958496, 8.688591003417969, 9.611602783203125, 10.534614562988281, 11.457627296447754, 12.38063907623291, 13.303651809692383, 14.226663589477539, 15.149676322937012, 16.072689056396484, 16.99570083618164, 17.918712615966797, 18.841724395751953, 19.76473617553711, 20.687747955322266, 21.610761642456055, 22.53377342224121, 23.456785202026367, 24.379796981811523, 25.302810668945312, 26.22582244873047]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 16.0, 20.0, 19.0, 49.0, 52.0, 51.0, 62.0, 83.0, 85.0, 88.0, 57.0, 70.0, 68.0, 54.0, 56.0, 44.0, 41.0, 19.0, 19.0, 11.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.2783260345459, -17.54317855834961, -16.808032989501953, -16.072885513305664, -15.337739944458008, -14.602592468261719, -13.867445945739746, -13.132299423217773, -12.3971529006958, -11.662006378173828, -10.926859855651855, -10.191713333129883, -9.456565856933594, -8.721420288085938, -7.986272811889648, -7.251126289367676, -6.515979766845703, -5.7808332443237305, -5.045686721801758, -4.310539722442627, -3.5753931999206543, -2.8402466773986816, -2.105099678039551, -1.3699531555175781, -0.6348066329956055, 0.10034000873565674, 0.835486650466919, 1.5706334114074707, 2.3057799339294434, 3.040926456451416, 3.776073455810547, 4.5112199783325195, 5.246366500854492, 5.981513023376465, 6.7166595458984375, 7.451806545257568, 8.186952590942383, 8.922100067138672, 9.657246589660645, 10.392393112182617, 11.12753963470459, 11.862686157226562, 12.597832679748535, 13.332979202270508, 14.068126678466797, 14.803272247314453, 15.538419723510742, 16.27356719970703, 17.008712768554688, 17.743860244750977, 18.479005813598633, 19.214153289794922, 19.949298858642578, 20.684446334838867, 21.419593811035156, 22.154739379882812, 22.88988494873047, 23.625032424926758, 24.360177993774414, 25.095325469970703, 25.83047103881836, 26.56561851501465, 27.300765991210938, 28.035911560058594, 28.771059036254883]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 3.0, 16.0, 16.0, 14.0, 21.0, 22.0, 35.0, 67.0, 105.0, 138.0, 246.0, 464.0, 746.0, 1451.0, 2941.0, 6300.0, 15170.0, 40428.0, 123132.0, 411589.0, 303030.0, 89767.0, 30529.0, 11915.0, 5054.0, 2445.0, 1191.0, 687.0, 391.0, 225.0, 133.0, 75.0, 55.0, 48.0, 33.0, 24.0, 11.0, 8.0, 5.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.796875, -8.5118408203125, -8.226806640625, -7.9417724609375, -7.65673828125, -7.3717041015625, -7.086669921875, -6.8016357421875, -6.5166015625, -6.2315673828125, -5.946533203125, -5.6614990234375, -5.37646484375, -5.0914306640625, -4.806396484375, -4.5213623046875, -4.236328125, -3.9512939453125, -3.666259765625, -3.3812255859375, -3.09619140625, -2.8111572265625, -2.526123046875, -2.2410888671875, -1.9560546875, -1.6710205078125, -1.385986328125, -1.1009521484375, -0.81591796875, -0.5308837890625, -0.245849609375, 0.0391845703125, 0.32421875, 0.6092529296875, 0.894287109375, 1.1793212890625, 1.46435546875, 1.7493896484375, 2.034423828125, 2.3194580078125, 2.6044921875, 2.8895263671875, 3.174560546875, 3.4595947265625, 3.74462890625, 4.0296630859375, 4.314697265625, 4.5997314453125, 4.884765625, 5.1697998046875, 5.454833984375, 5.7398681640625, 6.02490234375, 6.3099365234375, 6.594970703125, 6.8800048828125, 7.1650390625, 7.4500732421875, 7.735107421875, 8.0201416015625, 8.30517578125, 8.5902099609375, 8.875244140625, 9.1602783203125, 9.4453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 11.0, 13.0, 12.0, 11.0, 16.0, 27.0, 26.0, 26.0, 34.0, 52.0, 42.0, 44.0, 53.0, 65.0, 56.0, 75.0, 44.0, 50.0, 59.0, 40.0, 35.0, 34.0, 33.0, 39.0, 22.0, 17.0, 18.0, 13.0, 6.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3147125244140625, -2.248565673828125, -2.1824188232421875, -2.11627197265625, -2.0501251220703125, -1.983978271484375, -1.9178314208984375, -1.8516845703125, -1.7855377197265625, -1.719390869140625, -1.6532440185546875, -1.58709716796875, -1.5209503173828125, -1.454803466796875, -1.3886566162109375, -1.322509765625, -1.2563629150390625, -1.190216064453125, -1.1240692138671875, -1.05792236328125, -0.9917755126953125, -0.925628662109375, -0.8594818115234375, -0.7933349609375, -0.7271881103515625, -0.661041259765625, -0.5948944091796875, -0.52874755859375, -0.4626007080078125, -0.396453857421875, -0.3303070068359375, -0.26416015625, -0.1980133056640625, -0.131866455078125, -0.0657196044921875, 0.00042724609375, 0.0665740966796875, 0.132720947265625, 0.1988677978515625, 0.2650146484375, 0.3311614990234375, 0.397308349609375, 0.4634552001953125, 0.52960205078125, 0.5957489013671875, 0.661895751953125, 0.7280426025390625, 0.794189453125, 0.8603363037109375, 0.926483154296875, 0.9926300048828125, 1.05877685546875, 1.1249237060546875, 1.191070556640625, 1.2572174072265625, 1.3233642578125, 1.3895111083984375, 1.455657958984375, 1.5218048095703125, 1.58795166015625, 1.6540985107421875, 1.720245361328125, 1.7863922119140625, 1.8525390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 10.0, 8.0, 8.0, 21.0, 23.0, 27.0, 45.0, 62.0, 99.0, 123.0, 202.0, 280.0, 467.0, 820.0, 1503.0, 2774.0, 6006.0, 13887.0, 36150.0, 99554.0, 324872.0, 374299.0, 116429.0, 41266.0, 15858.0, 6739.0, 3097.0, 1562.0, 844.0, 538.0, 303.0, 214.0, 141.0, 91.0, 55.0, 36.0, 25.0, 30.0, 21.0, 9.0, 15.0, 12.0, 10.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.940673828125, -5.72119140625, -5.501708984375, -5.2822265625, -5.062744140625, -4.84326171875, -4.623779296875, -4.404296875, -4.184814453125, -3.96533203125, -3.745849609375, -3.5263671875, -3.306884765625, -3.08740234375, -2.867919921875, -2.6484375, -2.428955078125, -2.20947265625, -1.989990234375, -1.7705078125, -1.551025390625, -1.33154296875, -1.112060546875, -0.892578125, -0.673095703125, -0.45361328125, -0.234130859375, -0.0146484375, 0.204833984375, 0.42431640625, 0.643798828125, 0.86328125, 1.082763671875, 1.30224609375, 1.521728515625, 1.7412109375, 1.960693359375, 2.18017578125, 2.399658203125, 2.619140625, 2.838623046875, 3.05810546875, 3.277587890625, 3.4970703125, 3.716552734375, 3.93603515625, 4.155517578125, 4.375, 4.594482421875, 4.81396484375, 5.033447265625, 5.2529296875, 5.472412109375, 5.69189453125, 5.911376953125, 6.130859375, 6.350341796875, 6.56982421875, 6.789306640625, 7.0087890625, 7.228271484375, 7.44775390625, 7.667236328125, 7.88671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 8.0, 17.0, 14.0, 16.0, 24.0, 16.0, 24.0, 35.0, 36.0, 45.0, 54.0, 57.0, 60.0, 52.0, 68.0, 60.0, 75.0, 44.0, 66.0, 49.0, 26.0, 30.0, 29.0, 21.0, 14.0, 16.0, 10.0, 5.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.5498046875, -8.255859375, -7.9619140625, -7.66796875, -7.3740234375, -7.080078125, -6.7861328125, -6.4921875, -6.1982421875, -5.904296875, -5.6103515625, -5.31640625, -5.0224609375, -4.728515625, -4.4345703125, -4.140625, -3.8466796875, -3.552734375, -3.2587890625, -2.96484375, -2.6708984375, -2.376953125, -2.0830078125, -1.7890625, -1.4951171875, -1.201171875, -0.9072265625, -0.61328125, -0.3193359375, -0.025390625, 0.2685546875, 0.5625, 0.8564453125, 1.150390625, 1.4443359375, 1.73828125, 2.0322265625, 2.326171875, 2.6201171875, 2.9140625, 3.2080078125, 3.501953125, 3.7958984375, 4.08984375, 4.3837890625, 4.677734375, 4.9716796875, 5.265625, 5.5595703125, 5.853515625, 6.1474609375, 6.44140625, 6.7353515625, 7.029296875, 7.3232421875, 7.6171875, 7.9111328125, 8.205078125, 8.4990234375, 8.79296875, 9.0869140625, 9.380859375, 9.6748046875, 9.96875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 6.0, 5.0, 15.0, 28.0, 67.0, 131.0, 324.0, 891.0, 6888.0, 185621.0, 831688.0, 20286.0, 1794.0, 442.0, 185.0, 96.0, 40.0, 21.0, 7.0, 10.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.1998291015625, -11.751220703125, -11.3026123046875, -10.85400390625, -10.4053955078125, -9.956787109375, -9.5081787109375, -9.0595703125, -8.6109619140625, -8.162353515625, -7.7137451171875, -7.26513671875, -6.8165283203125, -6.367919921875, -5.9193115234375, -5.470703125, -5.0220947265625, -4.573486328125, -4.1248779296875, -3.67626953125, -3.2276611328125, -2.779052734375, -2.3304443359375, -1.8818359375, -1.4332275390625, -0.984619140625, -0.5360107421875, -0.08740234375, 0.3612060546875, 0.809814453125, 1.2584228515625, 1.70703125, 2.1556396484375, 2.604248046875, 3.0528564453125, 3.50146484375, 3.9500732421875, 4.398681640625, 4.8472900390625, 5.2958984375, 5.7445068359375, 6.193115234375, 6.6417236328125, 7.09033203125, 7.5389404296875, 7.987548828125, 8.4361572265625, 8.884765625, 9.3333740234375, 9.781982421875, 10.2305908203125, 10.67919921875, 11.1278076171875, 11.576416015625, 12.0250244140625, 12.4736328125, 12.9222412109375, 13.370849609375, 13.8194580078125, 14.26806640625, 14.7166748046875, 15.165283203125, 15.6138916015625, 16.0625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 15.0, 5.0, 5.0, 8.0, 17.0, 26.0, 35.0, 37.0, 53.0, 104.0, 152.0, 148.0, 110.0, 68.0, 49.0, 26.0, 29.0, 17.0, 8.0, 13.0, 17.0, 8.0, 5.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005354881286621094, -0.0005183145403862, -0.0005011409521102905, -0.0004839673638343811, -0.0004667937755584717, -0.00044962018728256226, -0.00043244659900665283, -0.0004152730107307434, -0.000398099422454834, -0.00038092583417892456, -0.00036375224590301514, -0.0003465786576271057, -0.0003294050693511963, -0.00031223148107528687, -0.00029505789279937744, -0.000277884304523468, -0.0002607107162475586, -0.00024353712797164917, -0.00022636353969573975, -0.00020918995141983032, -0.0001920163631439209, -0.00017484277486801147, -0.00015766918659210205, -0.00014049559831619263, -0.0001233220100402832, -0.00010614842176437378, -8.897483348846436e-05, -7.180124521255493e-05, -5.462765693664551e-05, -3.7454068660736084e-05, -2.028048038482666e-05, -3.1068921089172363e-06, 1.4066696166992188e-05, 3.124028444290161e-05, 4.8413872718811035e-05, 6.558746099472046e-05, 8.276104927062988e-05, 9.99346375465393e-05, 0.00011710822582244873, 0.00013428181409835815, 0.00015145540237426758, 0.000168628990650177, 0.00018580257892608643, 0.00020297616720199585, 0.00022014975547790527, 0.0002373233437538147, 0.0002544969320297241, 0.00027167052030563354, 0.00028884410858154297, 0.0003060176968574524, 0.0003231912851333618, 0.00034036487340927124, 0.00035753846168518066, 0.0003747120499610901, 0.0003918856382369995, 0.00040905922651290894, 0.00042623281478881836, 0.0004434064030647278, 0.0004605799913406372, 0.00047775357961654663, 0.0004949271678924561, 0.0005121007561683655, 0.0005292743444442749, 0.0005464479327201843, 0.0005636215209960938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 13.0, 19.0, 26.0, 41.0, 60.0, 78.0, 127.0, 216.0, 560.0, 2440.0, 24959.0, 863647.0, 147290.0, 7140.0, 1124.0, 332.0, 157.0, 104.0, 73.0, 47.0, 36.0, 24.0, 7.0, 10.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.1171875, -14.6944580078125, -14.271728515625, -13.8489990234375, -13.42626953125, -13.0035400390625, -12.580810546875, -12.1580810546875, -11.7353515625, -11.3126220703125, -10.889892578125, -10.4671630859375, -10.04443359375, -9.6217041015625, -9.198974609375, -8.7762451171875, -8.353515625, -7.9307861328125, -7.508056640625, -7.0853271484375, -6.66259765625, -6.2398681640625, -5.817138671875, -5.3944091796875, -4.9716796875, -4.5489501953125, -4.126220703125, -3.7034912109375, -3.28076171875, -2.8580322265625, -2.435302734375, -2.0125732421875, -1.58984375, -1.1671142578125, -0.744384765625, -0.3216552734375, 0.10107421875, 0.5238037109375, 0.946533203125, 1.3692626953125, 1.7919921875, 2.2147216796875, 2.637451171875, 3.0601806640625, 3.48291015625, 3.9056396484375, 4.328369140625, 4.7510986328125, 5.173828125, 5.5965576171875, 6.019287109375, 6.4420166015625, 6.86474609375, 7.2874755859375, 7.710205078125, 8.1329345703125, 8.5556640625, 8.9783935546875, 9.401123046875, 9.8238525390625, 10.24658203125, 10.6693115234375, 11.092041015625, 11.5147705078125, 11.9375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 15.0, 12.0, 30.0, 73.0, 134.0, 300.0, 228.0, 121.0, 33.0, 21.0, 19.0, 14.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.9371337890625, -15.514892578125, -15.0926513671875, -14.67041015625, -14.2481689453125, -13.825927734375, -13.4036865234375, -12.9814453125, -12.5592041015625, -12.136962890625, -11.7147216796875, -11.29248046875, -10.8702392578125, -10.447998046875, -10.0257568359375, -9.603515625, -9.1812744140625, -8.759033203125, -8.3367919921875, -7.91455078125, -7.4923095703125, -7.070068359375, -6.6478271484375, -6.2255859375, -5.8033447265625, -5.381103515625, -4.9588623046875, -4.53662109375, -4.1143798828125, -3.692138671875, -3.2698974609375, -2.84765625, -2.4254150390625, -2.003173828125, -1.5809326171875, -1.15869140625, -0.7364501953125, -0.314208984375, 0.1080322265625, 0.5302734375, 0.9525146484375, 1.374755859375, 1.7969970703125, 2.21923828125, 2.6414794921875, 3.063720703125, 3.4859619140625, 3.908203125, 4.3304443359375, 4.752685546875, 5.1749267578125, 5.59716796875, 6.0194091796875, 6.441650390625, 6.8638916015625, 7.2861328125, 7.7083740234375, 8.130615234375, 8.5528564453125, 8.97509765625, 9.3973388671875, 9.819580078125, 10.2418212890625, 10.6640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 21.0, 56.0, 119.0, 214.0, 226.0, 183.0, 93.0, 47.0, 19.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-154.6444854736328, -151.14031982421875, -147.6361541748047, -144.13197326660156, -140.6278076171875, -137.12364196777344, -133.61947631835938, -130.11529541015625, -126.61112976074219, -123.10696411132812, -119.60279083251953, -116.09862518310547, -112.59445190429688, -109.09028625488281, -105.58612060546875, -102.08194732666016, -98.5777816772461, -95.07361602783203, -91.56944274902344, -88.06527709960938, -84.56110382080078, -81.05693817138672, -77.55276489257812, -74.04859924316406, -70.54443359375, -67.04026794433594, -63.536094665527344, -60.03192901611328, -56.52775573730469, -53.023590087890625, -49.5194206237793, -46.01525115966797, -42.511085510253906, -39.00691604614258, -35.50274658203125, -31.998579025268555, -28.494409561157227, -24.9902400970459, -21.486072540283203, -17.981903076171875, -14.477733612060547, -10.973564147949219, -7.469395637512207, -3.9652271270751953, -0.4610576629638672, 3.043111801147461, 6.547279357910156, 10.051448822021484, 13.555618286132812, 17.05978775024414, 20.56395721435547, 24.068124771118164, 27.572294235229492, 31.07646369934082, 34.580631256103516, 38.084800720214844, 41.58897018432617, 45.0931396484375, 48.59730911254883, 52.101478576660156, 55.60564422607422, 59.10981750488281, 62.613983154296875, 66.11814880371094, 69.62232208251953]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 11.0, 2.0, 8.0, 8.0, 8.0, 11.0, 11.0, 10.0, 20.0, 28.0, 27.0, 34.0, 24.0, 29.0, 36.0, 36.0, 42.0, 45.0, 36.0, 37.0, 36.0, 51.0, 28.0, 40.0, 34.0, 38.0, 32.0, 26.0, 25.0, 30.0, 23.0, 22.0, 27.0, 16.0, 13.0, 17.0, 8.0, 14.0, 10.0, 9.0, 6.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-35.76211929321289, -34.684757232666016, -33.60739517211914, -32.530029296875, -31.452667236328125, -30.37530517578125, -29.297943115234375, -28.2205810546875, -27.143217086791992, -26.065855026245117, -24.98849105834961, -23.911128997802734, -22.83376693725586, -21.75640296936035, -20.679040908813477, -19.60167694091797, -18.524314880371094, -17.44695281982422, -16.36958885192871, -15.292226791381836, -14.214863777160645, -13.137500762939453, -12.060138702392578, -10.982775688171387, -9.905412673950195, -8.828049659729004, -7.750687122344971, -6.6733245849609375, -5.595961570739746, -4.518598556518555, -3.4412360191345215, -2.3638734817504883, -1.2865142822265625, -0.2091515064239502, 0.8682112693786621, 1.9455740451812744, 3.0229368209838867, 4.100299835205078, 5.177662372589111, 6.2550249099731445, 7.332387924194336, 8.409750938415527, 9.487113952636719, 10.564476013183594, 11.641839027404785, 12.719202041625977, 13.796564102172852, 14.873927116394043, 15.951290130615234, 17.02865219116211, 18.106016159057617, 19.183378219604492, 20.2607421875, 21.338104248046875, 22.41546630859375, 23.492828369140625, 24.570192337036133, 25.647554397583008, 26.724918365478516, 27.80228042602539, 28.879642486572266, 29.957006454467773, 31.03436851501465, 32.111732482910156, 33.18909454345703]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 7.0, 5.0, 11.0, 12.0, 18.0, 18.0, 28.0, 40.0, 61.0, 84.0, 110.0, 217.0, 393.0, 704.0, 1547.0, 3783.0, 10331.0, 39118.0, 957446.0, 3112999.0, 47889.0, 11847.0, 4223.0, 1726.0, 782.0, 370.0, 204.0, 127.0, 65.0, 47.0, 23.0, 14.0, 11.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.0625, -20.523193359375, -19.98388671875, -19.444580078125, -18.9052734375, -18.365966796875, -17.82666015625, -17.287353515625, -16.748046875, -16.208740234375, -15.66943359375, -15.130126953125, -14.5908203125, -14.051513671875, -13.51220703125, -12.972900390625, -12.43359375, -11.894287109375, -11.35498046875, -10.815673828125, -10.2763671875, -9.737060546875, -9.19775390625, -8.658447265625, -8.119140625, -7.579833984375, -7.04052734375, -6.501220703125, -5.9619140625, -5.422607421875, -4.88330078125, -4.343994140625, -3.8046875, -3.265380859375, -2.72607421875, -2.186767578125, -1.6474609375, -1.108154296875, -0.56884765625, -0.029541015625, 0.509765625, 1.049072265625, 1.58837890625, 2.127685546875, 2.6669921875, 3.206298828125, 3.74560546875, 4.284912109375, 4.82421875, 5.363525390625, 5.90283203125, 6.442138671875, 6.9814453125, 7.520751953125, 8.06005859375, 8.599365234375, 9.138671875, 9.677978515625, 10.21728515625, 10.756591796875, 11.2958984375, 11.835205078125, 12.37451171875, 12.913818359375, 13.453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 8.0, 18.0, 16.0, 18.0, 24.0, 26.0, 39.0, 37.0, 51.0, 39.0, 39.0, 58.0, 56.0, 51.0, 67.0, 69.0, 63.0, 46.0, 40.0, 36.0, 27.0, 32.0, 33.0, 32.0, 16.0, 11.0, 12.0, 5.0, 10.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.382781982421875, -2.31048583984375, -2.238189697265625, -2.1658935546875, -2.093597412109375, -2.02130126953125, -1.949005126953125, -1.876708984375, -1.804412841796875, -1.73211669921875, -1.659820556640625, -1.5875244140625, -1.515228271484375, -1.44293212890625, -1.370635986328125, -1.29833984375, -1.226043701171875, -1.15374755859375, -1.081451416015625, -1.0091552734375, -0.936859130859375, -0.86456298828125, -0.792266845703125, -0.719970703125, -0.647674560546875, -0.57537841796875, -0.503082275390625, -0.4307861328125, -0.358489990234375, -0.28619384765625, -0.213897705078125, -0.1416015625, -0.069305419921875, 0.00299072265625, 0.075286865234375, 0.1475830078125, 0.219879150390625, 0.29217529296875, 0.364471435546875, 0.436767578125, 0.509063720703125, 0.58135986328125, 0.653656005859375, 0.7259521484375, 0.798248291015625, 0.87054443359375, 0.942840576171875, 1.01513671875, 1.087432861328125, 1.15972900390625, 1.232025146484375, 1.3043212890625, 1.376617431640625, 1.44891357421875, 1.521209716796875, 1.593505859375, 1.665802001953125, 1.73809814453125, 1.810394287109375, 1.8826904296875, 1.954986572265625, 2.02728271484375, 2.099578857421875, 2.171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 17.0, 11.0, 9.0, 18.0, 20.0, 27.0, 29.0, 25.0, 39.0, 24.0, 40.0, 39.0, 117.0, 520.0, 4362.0, 132227.0, 4035950.0, 18718.0, 1447.0, 204.0, 88.0, 56.0, 45.0, 32.0, 40.0, 31.0, 24.0, 13.0, 19.0, 17.0, 13.0, 16.0, 3.0, 7.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.875, -34.79638671875, -33.7177734375, -32.63916015625, -31.560546875, -30.48193359375, -29.4033203125, -28.32470703125, -27.24609375, -26.16748046875, -25.0888671875, -24.01025390625, -22.931640625, -21.85302734375, -20.7744140625, -19.69580078125, -18.6171875, -17.53857421875, -16.4599609375, -15.38134765625, -14.302734375, -13.22412109375, -12.1455078125, -11.06689453125, -9.98828125, -8.90966796875, -7.8310546875, -6.75244140625, -5.673828125, -4.59521484375, -3.5166015625, -2.43798828125, -1.359375, -0.28076171875, 0.7978515625, 1.87646484375, 2.955078125, 4.03369140625, 5.1123046875, 6.19091796875, 7.26953125, 8.34814453125, 9.4267578125, 10.50537109375, 11.583984375, 12.66259765625, 13.7412109375, 14.81982421875, 15.8984375, 16.97705078125, 18.0556640625, 19.13427734375, 20.212890625, 21.29150390625, 22.3701171875, 23.44873046875, 24.52734375, 25.60595703125, 26.6845703125, 27.76318359375, 28.841796875, 29.92041015625, 30.9990234375, 32.07763671875, 33.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 15.0, 37.0, 68.0, 289.0, 3045.0, 481.0, 91.0, 20.0, 16.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.6832275390625, -4.280517578125, -3.8778076171875, -3.47509765625, -3.0723876953125, -2.669677734375, -2.2669677734375, -1.8642578125, -1.4615478515625, -1.058837890625, -0.6561279296875, -0.25341796875, 0.1492919921875, 0.552001953125, 0.9547119140625, 1.357421875, 1.7601318359375, 2.162841796875, 2.5655517578125, 2.96826171875, 3.3709716796875, 3.773681640625, 4.1763916015625, 4.5791015625, 4.9818115234375, 5.384521484375, 5.7872314453125, 6.18994140625, 6.5926513671875, 6.995361328125, 7.3980712890625, 7.80078125, 8.2034912109375, 8.606201171875, 9.0089111328125, 9.41162109375, 9.8143310546875, 10.217041015625, 10.6197509765625, 11.0224609375, 11.4251708984375, 11.827880859375, 12.2305908203125, 12.63330078125, 13.0360107421875, 13.438720703125, 13.8414306640625, 14.244140625, 14.6468505859375, 15.049560546875, 15.4522705078125, 15.85498046875, 16.2576904296875, 16.660400390625, 17.0631103515625, 17.4658203125, 17.8685302734375, 18.271240234375, 18.6739501953125, 19.07666015625, 19.4793701171875, 19.882080078125, 20.2847900390625, 20.6875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 11.0, 34.0, 95.0, 194.0, 251.0, 207.0, 112.0, 41.0, 21.0, 13.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.70167541503906, -56.17005157470703, -54.638427734375, -53.1068000793457, -51.57517623901367, -50.04355239868164, -48.51192855834961, -46.98030090332031, -45.44867706298828, -43.91705322265625, -42.38542938232422, -40.85380172729492, -39.32217788696289, -37.79055404663086, -36.25893020629883, -34.72730255126953, -33.1956787109375, -31.66405487060547, -30.132429122924805, -28.600805282592773, -27.06917953491211, -25.537555694580078, -24.005931854248047, -22.474306106567383, -20.942684173583984, -19.411060333251953, -17.87943458557129, -16.347810745239258, -14.816184997558594, -13.284561157226562, -11.752936363220215, -10.221311569213867, -8.689685821533203, -7.1580610275268555, -5.626436233520508, -4.094811916351318, -2.5631871223449707, -1.031562328338623, 0.5000619888305664, 2.031686782836914, 3.5633115768432617, 5.094936370849609, 6.626561164855957, 8.158185958862305, 9.689809799194336, 11.221435546875, 12.753059387207031, 14.284684181213379, 15.816308975219727, 17.347932815551758, 18.879558563232422, 20.411182403564453, 21.942808151245117, 23.47443199157715, 25.006057739257812, 26.537681579589844, 28.069305419921875, 29.600929260253906, 31.13255500793457, 32.664180755615234, 34.195804595947266, 35.7274284362793, 37.25905227661133, 38.790679931640625, 40.322303771972656]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 15.0, 23.0, 35.0, 34.0, 55.0, 73.0, 82.0, 97.0, 94.0, 89.0, 90.0, 64.0, 72.0, 35.0, 43.0, 28.0, 22.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.79719924926758, -32.89847183227539, -31.99974822998047, -31.10102081298828, -30.202295303344727, -29.303569793701172, -28.404842376708984, -27.50611686706543, -26.607391357421875, -25.70866584777832, -24.809940338134766, -23.911212921142578, -23.012487411499023, -22.11376190185547, -21.21503448486328, -20.316308975219727, -19.417583465576172, -18.518857955932617, -17.620132446289062, -16.721405029296875, -15.82267951965332, -14.923954010009766, -14.025227546691895, -13.126501083374023, -12.227775573730469, -11.329050064086914, -10.430323600769043, -9.531597137451172, -8.632871627807617, -7.734145641326904, -6.835419654846191, -5.9366936683654785, -5.037969589233398, -4.1392436027526855, -3.2405176162719727, -2.3417916297912598, -1.4430656433105469, -0.544339656829834, 0.3543863296508789, 1.2531123161315918, 2.1518383026123047, 3.0505642890930176, 3.9492902755737305, 4.848016262054443, 5.746742248535156, 6.645468235015869, 7.544194221496582, 8.442920684814453, 9.341646194458008, 10.240371704101562, 11.139098167419434, 12.037824630737305, 12.93655014038086, 13.835275650024414, 14.734002113342285, 15.632728576660156, 16.53145408630371, 17.430179595947266, 18.328907012939453, 19.227632522583008, 20.126358032226562, 21.025083541870117, 21.923809051513672, 22.82253646850586, 23.721261978149414]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 12.0, 28.0, 29.0, 46.0, 55.0, 83.0, 97.0, 181.0, 284.0, 482.0, 854.0, 1638.0, 3728.0, 9086.0, 25575.0, 86872.0, 370593.0, 409083.0, 94626.0, 27835.0, 9495.0, 3866.0, 1724.0, 908.0, 460.0, 307.0, 197.0, 110.0, 83.0, 46.0, 39.0, 44.0, 20.0, 12.0, 10.0, 13.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.078125, -10.7322998046875, -10.386474609375, -10.0406494140625, -9.69482421875, -9.3489990234375, -9.003173828125, -8.6573486328125, -8.3115234375, -7.9656982421875, -7.619873046875, -7.2740478515625, -6.92822265625, -6.5823974609375, -6.236572265625, -5.8907470703125, -5.544921875, -5.1990966796875, -4.853271484375, -4.5074462890625, -4.16162109375, -3.8157958984375, -3.469970703125, -3.1241455078125, -2.7783203125, -2.4324951171875, -2.086669921875, -1.7408447265625, -1.39501953125, -1.0491943359375, -0.703369140625, -0.3575439453125, -0.01171875, 0.3341064453125, 0.679931640625, 1.0257568359375, 1.37158203125, 1.7174072265625, 2.063232421875, 2.4090576171875, 2.7548828125, 3.1007080078125, 3.446533203125, 3.7923583984375, 4.13818359375, 4.4840087890625, 4.829833984375, 5.1756591796875, 5.521484375, 5.8673095703125, 6.213134765625, 6.5589599609375, 6.90478515625, 7.2506103515625, 7.596435546875, 7.9422607421875, 8.2880859375, 8.6339111328125, 8.979736328125, 9.3255615234375, 9.67138671875, 10.0172119140625, 10.363037109375, 10.7088623046875, 11.0546875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 10.0, 10.0, 8.0, 12.0, 26.0, 25.0, 30.0, 35.0, 35.0, 41.0, 64.0, 50.0, 61.0, 62.0, 64.0, 86.0, 49.0, 57.0, 47.0, 44.0, 38.0, 29.0, 31.0, 21.0, 16.0, 16.0, 9.0, 10.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.751495361328125, -2.66900634765625, -2.586517333984375, -2.5040283203125, -2.421539306640625, -2.33905029296875, -2.256561279296875, -2.174072265625, -2.091583251953125, -2.00909423828125, -1.926605224609375, -1.8441162109375, -1.761627197265625, -1.67913818359375, -1.596649169921875, -1.51416015625, -1.431671142578125, -1.34918212890625, -1.266693115234375, -1.1842041015625, -1.101715087890625, -1.01922607421875, -0.936737060546875, -0.854248046875, -0.771759033203125, -0.68927001953125, -0.606781005859375, -0.5242919921875, -0.441802978515625, -0.35931396484375, -0.276824951171875, -0.1943359375, -0.111846923828125, -0.02935791015625, 0.053131103515625, 0.1356201171875, 0.218109130859375, 0.30059814453125, 0.383087158203125, 0.465576171875, 0.548065185546875, 0.63055419921875, 0.713043212890625, 0.7955322265625, 0.878021240234375, 0.96051025390625, 1.042999267578125, 1.12548828125, 1.207977294921875, 1.29046630859375, 1.372955322265625, 1.4554443359375, 1.537933349609375, 1.62042236328125, 1.702911376953125, 1.785400390625, 1.867889404296875, 1.95037841796875, 2.032867431640625, 2.1153564453125, 2.197845458984375, 2.28033447265625, 2.362823486328125, 2.4453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 14.0, 20.0, 39.0, 53.0, 69.0, 109.0, 149.0, 277.0, 503.0, 873.0, 2005.0, 4402.0, 11109.0, 30157.0, 89268.0, 318217.0, 412664.0, 116464.0, 37992.0, 13774.0, 5449.0, 2347.0, 1074.0, 552.0, 327.0, 194.0, 143.0, 69.0, 71.0, 42.0, 21.0, 19.0, 12.0, 11.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.671875, -7.440185546875, -7.20849609375, -6.976806640625, -6.7451171875, -6.513427734375, -6.28173828125, -6.050048828125, -5.818359375, -5.586669921875, -5.35498046875, -5.123291015625, -4.8916015625, -4.659912109375, -4.42822265625, -4.196533203125, -3.96484375, -3.733154296875, -3.50146484375, -3.269775390625, -3.0380859375, -2.806396484375, -2.57470703125, -2.343017578125, -2.111328125, -1.879638671875, -1.64794921875, -1.416259765625, -1.1845703125, -0.952880859375, -0.72119140625, -0.489501953125, -0.2578125, -0.026123046875, 0.20556640625, 0.437255859375, 0.6689453125, 0.900634765625, 1.13232421875, 1.364013671875, 1.595703125, 1.827392578125, 2.05908203125, 2.290771484375, 2.5224609375, 2.754150390625, 2.98583984375, 3.217529296875, 3.44921875, 3.680908203125, 3.91259765625, 4.144287109375, 4.3759765625, 4.607666015625, 4.83935546875, 5.071044921875, 5.302734375, 5.534423828125, 5.76611328125, 5.997802734375, 6.2294921875, 6.461181640625, 6.69287109375, 6.924560546875, 7.15625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 7.0, 9.0, 12.0, 16.0, 20.0, 21.0, 28.0, 39.0, 39.0, 43.0, 38.0, 54.0, 33.0, 51.0, 43.0, 55.0, 42.0, 49.0, 46.0, 45.0, 49.0, 31.0, 25.0, 32.0, 32.0, 14.0, 27.0, 14.0, 13.0, 12.0, 12.0, 7.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0703125, -7.815185546875, -7.56005859375, -7.304931640625, -7.0498046875, -6.794677734375, -6.53955078125, -6.284423828125, -6.029296875, -5.774169921875, -5.51904296875, -5.263916015625, -5.0087890625, -4.753662109375, -4.49853515625, -4.243408203125, -3.98828125, -3.733154296875, -3.47802734375, -3.222900390625, -2.9677734375, -2.712646484375, -2.45751953125, -2.202392578125, -1.947265625, -1.692138671875, -1.43701171875, -1.181884765625, -0.9267578125, -0.671630859375, -0.41650390625, -0.161376953125, 0.09375, 0.348876953125, 0.60400390625, 0.859130859375, 1.1142578125, 1.369384765625, 1.62451171875, 1.879638671875, 2.134765625, 2.389892578125, 2.64501953125, 2.900146484375, 3.1552734375, 3.410400390625, 3.66552734375, 3.920654296875, 4.17578125, 4.430908203125, 4.68603515625, 4.941162109375, 5.1962890625, 5.451416015625, 5.70654296875, 5.961669921875, 6.216796875, 6.471923828125, 6.72705078125, 6.982177734375, 7.2373046875, 7.492431640625, 7.74755859375, 8.002685546875, 8.2578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 9.0, 8.0, 39.0, 42.0, 83.0, 154.0, 232.0, 435.0, 979.0, 2839.0, 9527.0, 43356.0, 339188.0, 566847.0, 65345.0, 13314.0, 3673.0, 1275.0, 519.0, 265.0, 159.0, 89.0, 60.0, 30.0, 29.0, 16.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.25390625, -6.08984375, -5.92578125, -5.76171875, -5.59765625, -5.43359375, -5.26953125, -5.10546875, -4.94140625, -4.77734375, -4.61328125, -4.44921875, -4.28515625, -4.12109375, -3.95703125, -3.79296875, -3.62890625, -3.46484375, -3.30078125, -3.13671875, -2.97265625, -2.80859375, -2.64453125, -2.48046875, -2.31640625, -2.15234375, -1.98828125, -1.82421875, -1.66015625, -1.49609375, -1.33203125, -1.16796875, -1.00390625, -0.83984375, -0.67578125, -0.51171875, -0.34765625, -0.18359375, -0.01953125, 0.14453125, 0.30859375, 0.47265625, 0.63671875, 0.80078125, 0.96484375, 1.12890625, 1.29296875, 1.45703125, 1.62109375, 1.78515625, 1.94921875, 2.11328125, 2.27734375, 2.44140625, 2.60546875, 2.76953125, 2.93359375, 3.09765625, 3.26171875, 3.42578125, 3.58984375, 3.75390625, 3.91796875, 4.08203125, 4.24609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 6.0, 6.0, 11.0, 10.0, 12.0, 16.0, 25.0, 26.0, 41.0, 58.0, 117.0, 184.0, 161.0, 94.0, 61.0, 32.0, 24.0, 26.0, 12.0, 12.0, 7.0, 5.0, 4.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004949569702148438, -0.0004772096872329712, -0.00045946240425109863, -0.0004417151212692261, -0.0004239678382873535, -0.00040622055530548096, -0.0003884732723236084, -0.00037072598934173584, -0.0003529787063598633, -0.0003352314233779907, -0.00031748414039611816, -0.0002997368574142456, -0.00028198957443237305, -0.0002642422914505005, -0.00024649500846862793, -0.00022874772548675537, -0.0002110004425048828, -0.00019325315952301025, -0.0001755058765411377, -0.00015775859355926514, -0.00014001131057739258, -0.00012226402759552002, -0.00010451674461364746, -8.67694616317749e-05, -6.902217864990234e-05, -5.1274895668029785e-05, -3.3527612686157227e-05, -1.5780329704284668e-05, 1.9669532775878906e-06, 1.971423625946045e-05, 3.746151924133301e-05, 5.5208802223205566e-05, 7.295608520507812e-05, 9.070336818695068e-05, 0.00010845065116882324, 0.0001261979341506958, 0.00014394521713256836, 0.00016169250011444092, 0.00017943978309631348, 0.00019718706607818604, 0.0002149343490600586, 0.00023268163204193115, 0.0002504289150238037, 0.00026817619800567627, 0.00028592348098754883, 0.0003036707639694214, 0.00032141804695129395, 0.0003391653299331665, 0.00035691261291503906, 0.0003746598958969116, 0.0003924071788787842, 0.00041015446186065674, 0.0004279017448425293, 0.00044564902782440186, 0.0004633963108062744, 0.00048114359378814697, 0.0004988908767700195, 0.0005166381597518921, 0.0005343854427337646, 0.0005521327257156372, 0.0005698800086975098, 0.0005876272916793823, 0.0006053745746612549, 0.0006231218576431274, 0.000640869140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 14.0, 11.0, 21.0, 51.0, 45.0, 78.0, 119.0, 203.0, 375.0, 760.0, 1981.0, 6549.0, 29999.0, 296162.0, 646507.0, 51357.0, 9582.0, 2640.0, 962.0, 464.0, 223.0, 164.0, 91.0, 68.0, 43.0, 25.0, 16.0, 12.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.7265625, -5.54840087890625, -5.3702392578125, -5.19207763671875, -5.013916015625, -4.83575439453125, -4.6575927734375, -4.47943115234375, -4.30126953125, -4.12310791015625, -3.9449462890625, -3.76678466796875, -3.588623046875, -3.41046142578125, -3.2322998046875, -3.05413818359375, -2.8759765625, -2.69781494140625, -2.5196533203125, -2.34149169921875, -2.163330078125, -1.98516845703125, -1.8070068359375, -1.62884521484375, -1.45068359375, -1.27252197265625, -1.0943603515625, -0.91619873046875, -0.738037109375, -0.55987548828125, -0.3817138671875, -0.20355224609375, -0.025390625, 0.15277099609375, 0.3309326171875, 0.50909423828125, 0.687255859375, 0.86541748046875, 1.0435791015625, 1.22174072265625, 1.39990234375, 1.57806396484375, 1.7562255859375, 1.93438720703125, 2.112548828125, 2.29071044921875, 2.4688720703125, 2.64703369140625, 2.8251953125, 3.00335693359375, 3.1815185546875, 3.35968017578125, 3.537841796875, 3.71600341796875, 3.8941650390625, 4.07232666015625, 4.25048828125, 4.42864990234375, 4.6068115234375, 4.78497314453125, 4.963134765625, 5.14129638671875, 5.3194580078125, 5.49761962890625, 5.67578125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 12.0, 17.0, 28.0, 46.0, 102.0, 209.0, 227.0, 165.0, 68.0, 40.0, 36.0, 17.0, 13.0, 11.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.51715087890625, -5.2803955078125, -5.04364013671875, -4.806884765625, -4.57012939453125, -4.3333740234375, -4.09661865234375, -3.85986328125, -3.62310791015625, -3.3863525390625, -3.14959716796875, -2.912841796875, -2.67608642578125, -2.4393310546875, -2.20257568359375, -1.9658203125, -1.72906494140625, -1.4923095703125, -1.25555419921875, -1.018798828125, -0.78204345703125, -0.5452880859375, -0.30853271484375, -0.07177734375, 0.16497802734375, 0.4017333984375, 0.63848876953125, 0.875244140625, 1.11199951171875, 1.3487548828125, 1.58551025390625, 1.822265625, 2.05902099609375, 2.2957763671875, 2.53253173828125, 2.769287109375, 3.00604248046875, 3.2427978515625, 3.47955322265625, 3.71630859375, 3.95306396484375, 4.1898193359375, 4.42657470703125, 4.663330078125, 4.90008544921875, 5.1368408203125, 5.37359619140625, 5.6103515625, 5.84710693359375, 6.0838623046875, 6.32061767578125, 6.557373046875, 6.79412841796875, 7.0308837890625, 7.26763916015625, 7.50439453125, 7.74114990234375, 7.9779052734375, 8.21466064453125, 8.451416015625, 8.68817138671875, 8.9249267578125, 9.16168212890625, 9.3984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 23.0, 66.0, 132.0, 225.0, 264.0, 143.0, 77.0, 29.0, 19.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.70284271240234, -124.26227569580078, -120.82170104980469, -117.38113403320312, -113.94056701660156, -110.5, -107.05943298339844, -103.61885833740234, -100.17829132080078, -96.73772430419922, -93.29714965820312, -89.85658264160156, -86.416015625, -82.97544860839844, -79.53488159179688, -76.09430694580078, -72.65373992919922, -69.21317291259766, -65.77259826660156, -62.33203125, -58.89146423339844, -55.450897216796875, -52.01032638549805, -48.56975555419922, -45.129188537597656, -41.688621520996094, -38.248050689697266, -34.80747985839844, -31.366912841796875, -27.92634391784668, -24.485774993896484, -21.04520606994629, -17.604644775390625, -14.16407585144043, -10.723506927490234, -7.282938003540039, -3.8423690795898438, -0.40180015563964844, 3.038768768310547, 6.479337692260742, 9.919906616210938, 13.360475540161133, 16.801044464111328, 20.241613388061523, 23.68218231201172, 27.122751235961914, 30.56332015991211, 34.00389099121094, 37.4444580078125, 40.88502502441406, 44.32559585571289, 47.76616668701172, 51.20673370361328, 54.647300720214844, 58.08787155151367, 61.5284423828125, 64.96900939941406, 68.40957641601562, 71.85014343261719, 75.29071807861328, 78.73128509521484, 82.1718521118164, 85.6124267578125, 89.05299377441406, 92.49356079101562]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 7.0, 6.0, 8.0, 12.0, 11.0, 17.0, 15.0, 15.0, 28.0, 22.0, 23.0, 19.0, 22.0, 35.0, 29.0, 30.0, 35.0, 39.0, 38.0, 50.0, 37.0, 47.0, 43.0, 45.0, 41.0, 39.0, 31.0, 32.0, 22.0, 25.0, 21.0, 19.0, 17.0, 17.0, 11.0, 12.0, 11.0, 14.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.669301986694336, -30.62922477722168, -29.589147567749023, -28.549070358276367, -27.50899314880371, -26.468915939331055, -25.4288387298584, -24.388761520385742, -23.348684310913086, -22.30860710144043, -21.268529891967773, -20.228452682495117, -19.18837547302246, -18.148298263549805, -17.10822105407715, -16.068143844604492, -15.028066635131836, -13.98798942565918, -12.947912216186523, -11.907835006713867, -10.867757797241211, -9.827680587768555, -8.787603378295898, -7.747526168823242, -6.707448959350586, -5.66737174987793, -4.627294540405273, -3.587217330932617, -2.547140121459961, -1.5070629119873047, -0.46698570251464844, 0.5730915069580078, 1.6131668090820312, 2.6532440185546875, 3.6933212280273438, 4.7333984375, 5.773475646972656, 6.8135528564453125, 7.853630065917969, 8.893707275390625, 9.933784484863281, 10.973861694335938, 12.013938903808594, 13.05401611328125, 14.094093322753906, 15.134170532226562, 16.17424774169922, 17.214324951171875, 18.25440216064453, 19.294479370117188, 20.334556579589844, 21.3746337890625, 22.414710998535156, 23.454788208007812, 24.49486541748047, 25.534942626953125, 26.57501983642578, 27.615097045898438, 28.655174255371094, 29.69525146484375, 30.735328674316406, 31.775405883789062, 32.81548309326172, 33.855560302734375, 34.89563751220703]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 10.0, 8.0, 11.0, 16.0, 24.0, 34.0, 39.0, 53.0, 83.0, 100.0, 133.0, 173.0, 250.0, 392.0, 719.0, 948.0, 1679.0, 3092.0, 6044.0, 12734.0, 33577.0, 178796.0, 3776922.0, 125404.0, 28696.0, 11549.0, 5617.0, 2857.0, 1583.0, 968.0, 572.0, 360.0, 265.0, 176.0, 112.0, 75.0, 62.0, 38.0, 28.0, 13.0, 12.0, 12.0, 13.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-16.625, -16.14208984375, -15.6591796875, -15.17626953125, -14.693359375, -14.21044921875, -13.7275390625, -13.24462890625, -12.76171875, -12.27880859375, -11.7958984375, -11.31298828125, -10.830078125, -10.34716796875, -9.8642578125, -9.38134765625, -8.8984375, -8.41552734375, -7.9326171875, -7.44970703125, -6.966796875, -6.48388671875, -6.0009765625, -5.51806640625, -5.03515625, -4.55224609375, -4.0693359375, -3.58642578125, -3.103515625, -2.62060546875, -2.1376953125, -1.65478515625, -1.171875, -0.68896484375, -0.2060546875, 0.27685546875, 0.759765625, 1.24267578125, 1.7255859375, 2.20849609375, 2.69140625, 3.17431640625, 3.6572265625, 4.14013671875, 4.623046875, 5.10595703125, 5.5888671875, 6.07177734375, 6.5546875, 7.03759765625, 7.5205078125, 8.00341796875, 8.486328125, 8.96923828125, 9.4521484375, 9.93505859375, 10.41796875, 10.90087890625, 11.3837890625, 11.86669921875, 12.349609375, 12.83251953125, 13.3154296875, 13.79833984375, 14.28125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 14.0, 7.0, 6.0, 6.0, 26.0, 17.0, 24.0, 43.0, 36.0, 61.0, 58.0, 36.0, 62.0, 62.0, 65.0, 67.0, 53.0, 63.0, 44.0, 43.0, 34.0, 56.0, 26.0, 21.0, 17.0, 15.0, 12.0, 14.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.7479248046875, -2.663818359375, -2.5797119140625, -2.49560546875, -2.4114990234375, -2.327392578125, -2.2432861328125, -2.1591796875, -2.0750732421875, -1.990966796875, -1.9068603515625, -1.82275390625, -1.7386474609375, -1.654541015625, -1.5704345703125, -1.486328125, -1.4022216796875, -1.318115234375, -1.2340087890625, -1.14990234375, -1.0657958984375, -0.981689453125, -0.8975830078125, -0.8134765625, -0.7293701171875, -0.645263671875, -0.5611572265625, -0.47705078125, -0.3929443359375, -0.308837890625, -0.2247314453125, -0.140625, -0.0565185546875, 0.027587890625, 0.1116943359375, 0.19580078125, 0.2799072265625, 0.364013671875, 0.4481201171875, 0.5322265625, 0.6163330078125, 0.700439453125, 0.7845458984375, 0.86865234375, 0.9527587890625, 1.036865234375, 1.1209716796875, 1.205078125, 1.2891845703125, 1.373291015625, 1.4573974609375, 1.54150390625, 1.6256103515625, 1.709716796875, 1.7938232421875, 1.8779296875, 1.9620361328125, 2.046142578125, 2.1302490234375, 2.21435546875, 2.2984619140625, 2.382568359375, 2.4666748046875, 2.55078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 19.0, 27.0, 34.0, 79.0, 150.0, 247.0, 519.0, 1082.0, 2281.0, 5228.0, 13568.0, 41093.0, 207949.0, 3660590.0, 198074.0, 40088.0, 13414.0, 5296.0, 2248.0, 1084.0, 511.0, 275.0, 160.0, 108.0, 56.0, 29.0, 25.0, 11.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8046875, -9.4345703125, -9.064453125, -8.6943359375, -8.32421875, -7.9541015625, -7.583984375, -7.2138671875, -6.84375, -6.4736328125, -6.103515625, -5.7333984375, -5.36328125, -4.9931640625, -4.623046875, -4.2529296875, -3.8828125, -3.5126953125, -3.142578125, -2.7724609375, -2.40234375, -2.0322265625, -1.662109375, -1.2919921875, -0.921875, -0.5517578125, -0.181640625, 0.1884765625, 0.55859375, 0.9287109375, 1.298828125, 1.6689453125, 2.0390625, 2.4091796875, 2.779296875, 3.1494140625, 3.51953125, 3.8896484375, 4.259765625, 4.6298828125, 5.0, 5.3701171875, 5.740234375, 6.1103515625, 6.48046875, 6.8505859375, 7.220703125, 7.5908203125, 7.9609375, 8.3310546875, 8.701171875, 9.0712890625, 9.44140625, 9.8115234375, 10.181640625, 10.5517578125, 10.921875, 11.2919921875, 11.662109375, 12.0322265625, 12.40234375, 12.7724609375, 13.142578125, 13.5126953125, 13.8828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 2.0, 4.0, 9.0, 6.0, 12.0, 14.0, 12.0, 14.0, 25.0, 31.0, 59.0, 64.0, 106.0, 216.0, 913.0, 1906.0, 297.0, 112.0, 71.0, 46.0, 26.0, 22.0, 29.0, 15.0, 8.0, 7.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.246307373046875, -3.11175537109375, -2.977203369140625, -2.8426513671875, -2.708099365234375, -2.57354736328125, -2.438995361328125, -2.304443359375, -2.169891357421875, -2.03533935546875, -1.900787353515625, -1.7662353515625, -1.631683349609375, -1.49713134765625, -1.362579345703125, -1.22802734375, -1.093475341796875, -0.95892333984375, -0.824371337890625, -0.6898193359375, -0.555267333984375, -0.42071533203125, -0.286163330078125, -0.151611328125, -0.017059326171875, 0.11749267578125, 0.252044677734375, 0.3865966796875, 0.521148681640625, 0.65570068359375, 0.790252685546875, 0.9248046875, 1.059356689453125, 1.19390869140625, 1.328460693359375, 1.4630126953125, 1.597564697265625, 1.73211669921875, 1.866668701171875, 2.001220703125, 2.135772705078125, 2.27032470703125, 2.404876708984375, 2.5394287109375, 2.673980712890625, 2.80853271484375, 2.943084716796875, 3.07763671875, 3.212188720703125, 3.34674072265625, 3.481292724609375, 3.6158447265625, 3.750396728515625, 3.88494873046875, 4.019500732421875, 4.154052734375, 4.288604736328125, 4.42315673828125, 4.557708740234375, 4.6922607421875, 4.826812744140625, 4.96136474609375, 5.095916748046875, 5.23046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 13.0, 64.0, 228.0, 348.0, 224.0, 83.0, 32.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.54302978515625, -71.5330581665039, -69.52307891845703, -67.51310729980469, -65.50312805175781, -63.49315643310547, -61.483184814453125, -59.473209381103516, -57.463233947753906, -55.4532585144043, -53.44328308105469, -51.433311462402344, -49.423336029052734, -47.413360595703125, -45.40338897705078, -43.39341354370117, -41.38343811035156, -39.37346267700195, -37.363487243652344, -35.353515625, -33.34354019165039, -31.33356475830078, -29.323591232299805, -27.313617706298828, -25.30364227294922, -23.29366683959961, -21.283693313598633, -19.273719787597656, -17.263744354248047, -15.253769874572754, -13.243795394897461, -11.233820915222168, -9.223838806152344, -7.213864326477051, -5.203889846801758, -3.193915367126465, -1.1839408874511719, 0.8260335922241211, 2.836008071899414, 4.845982551574707, 6.85595703125, 8.865931510925293, 10.875905990600586, 12.885880470275879, 14.895854949951172, 16.90583038330078, 18.915803909301758, 20.925777435302734, 22.935752868652344, 24.945728302001953, 26.95570182800293, 28.965675354003906, 30.975650787353516, 32.985626220703125, 34.99559783935547, 37.00557327270508, 39.01554870605469, 41.0255241394043, 43.035499572753906, 45.04547119140625, 47.05544662475586, 49.06542205810547, 51.07539367675781, 53.08536911010742, 55.09534454345703]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 6.0, 15.0, 16.0, 18.0, 26.0, 26.0, 27.0, 36.0, 29.0, 41.0, 46.0, 47.0, 48.0, 37.0, 52.0, 52.0, 57.0, 47.0, 47.0, 43.0, 41.0, 41.0, 30.0, 34.0, 28.0, 20.0, 15.0, 10.0, 10.0, 12.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.950754165649414, -14.505043983459473, -14.059333801269531, -13.613622665405273, -13.167912483215332, -12.72220230102539, -12.276491165161133, -11.830780982971191, -11.38507080078125, -10.939360618591309, -10.493650436401367, -10.04793930053711, -9.602229118347168, -9.156518936157227, -8.710807800292969, -8.265097618103027, -7.819387435913086, -7.3736772537231445, -6.927966594696045, -6.482255935668945, -6.036545753479004, -5.5908355712890625, -5.145124912261963, -4.699414253234863, -4.253704071044922, -3.8079936504364014, -3.362283229827881, -2.9165728092193604, -2.47086238861084, -2.0251519680023193, -1.5794415473937988, -1.1337311267852783, -0.6880216598510742, -0.2423112392425537, 0.2033991813659668, 0.6491096019744873, 1.0948200225830078, 1.5405304431915283, 1.9862408638000488, 2.4319512844085693, 2.87766170501709, 3.3233721256256104, 3.769082546234131, 4.2147932052612305, 4.660503387451172, 5.106213569641113, 5.551924228668213, 5.9976348876953125, 6.443345069885254, 6.889055252075195, 7.334765911102295, 7.7804765701293945, 8.226186752319336, 8.671896934509277, 9.117607116699219, 9.563318252563477, 10.009028434753418, 10.45473861694336, 10.900449752807617, 11.346159934997559, 11.7918701171875, 12.237580299377441, 12.683290481567383, 13.12900161743164, 13.574711799621582]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 10.0, 16.0, 16.0, 18.0, 20.0, 52.0, 58.0, 98.0, 138.0, 216.0, 350.0, 505.0, 958.0, 1686.0, 3491.0, 7833.0, 18624.0, 49902.0, 151262.0, 408756.0, 264768.0, 87244.0, 30020.0, 11745.0, 5121.0, 2441.0, 1256.0, 723.0, 423.0, 268.0, 189.0, 116.0, 75.0, 43.0, 35.0, 11.0, 12.0, 12.0, 9.0, 11.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.280029296875, -7.95849609375, -7.636962890625, -7.3154296875, -6.993896484375, -6.67236328125, -6.350830078125, -6.029296875, -5.707763671875, -5.38623046875, -5.064697265625, -4.7431640625, -4.421630859375, -4.10009765625, -3.778564453125, -3.45703125, -3.135498046875, -2.81396484375, -2.492431640625, -2.1708984375, -1.849365234375, -1.52783203125, -1.206298828125, -0.884765625, -0.563232421875, -0.24169921875, 0.079833984375, 0.4013671875, 0.722900390625, 1.04443359375, 1.365966796875, 1.6875, 2.009033203125, 2.33056640625, 2.652099609375, 2.9736328125, 3.295166015625, 3.61669921875, 3.938232421875, 4.259765625, 4.581298828125, 4.90283203125, 5.224365234375, 5.5458984375, 5.867431640625, 6.18896484375, 6.510498046875, 6.83203125, 7.153564453125, 7.47509765625, 7.796630859375, 8.1181640625, 8.439697265625, 8.76123046875, 9.082763671875, 9.404296875, 9.725830078125, 10.04736328125, 10.368896484375, 10.6904296875, 11.011962890625, 11.33349609375, 11.655029296875, 11.9765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 14.0, 10.0, 17.0, 21.0, 28.0, 28.0, 29.0, 43.0, 59.0, 61.0, 48.0, 61.0, 52.0, 68.0, 60.0, 44.0, 49.0, 53.0, 43.0, 49.0, 44.0, 29.0, 21.0, 13.0, 16.0, 11.0, 6.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0, -2.914886474609375, -2.82977294921875, -2.744659423828125, -2.6595458984375, -2.574432373046875, -2.48931884765625, -2.404205322265625, -2.319091796875, -2.233978271484375, -2.14886474609375, -2.063751220703125, -1.9786376953125, -1.893524169921875, -1.80841064453125, -1.723297119140625, -1.63818359375, -1.553070068359375, -1.46795654296875, -1.382843017578125, -1.2977294921875, -1.212615966796875, -1.12750244140625, -1.042388916015625, -0.957275390625, -0.872161865234375, -0.78704833984375, -0.701934814453125, -0.6168212890625, -0.531707763671875, -0.44659423828125, -0.361480712890625, -0.2763671875, -0.191253662109375, -0.10614013671875, -0.021026611328125, 0.0640869140625, 0.149200439453125, 0.23431396484375, 0.319427490234375, 0.404541015625, 0.489654541015625, 0.57476806640625, 0.659881591796875, 0.7449951171875, 0.830108642578125, 0.91522216796875, 1.000335693359375, 1.08544921875, 1.170562744140625, 1.25567626953125, 1.340789794921875, 1.4259033203125, 1.511016845703125, 1.59613037109375, 1.681243896484375, 1.766357421875, 1.851470947265625, 1.93658447265625, 2.021697998046875, 2.1068115234375, 2.191925048828125, 2.27703857421875, 2.362152099609375, 2.447265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 0.0, 5.0, 7.0, 2.0, 5.0, 7.0, 9.0, 26.0, 21.0, 36.0, 48.0, 53.0, 98.0, 127.0, 195.0, 293.0, 499.0, 882.0, 1843.0, 4371.0, 12549.0, 42685.0, 162588.0, 490174.0, 239661.0, 63383.0, 17588.0, 6051.0, 2471.0, 1063.0, 610.0, 395.0, 247.0, 154.0, 105.0, 79.0, 59.0, 34.0, 29.0, 28.0, 22.0, 14.0, 14.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796875, -7.5042724609375, -7.211669921875, -6.9190673828125, -6.62646484375, -6.3338623046875, -6.041259765625, -5.7486572265625, -5.4560546875, -5.1634521484375, -4.870849609375, -4.5782470703125, -4.28564453125, -3.9930419921875, -3.700439453125, -3.4078369140625, -3.115234375, -2.8226318359375, -2.530029296875, -2.2374267578125, -1.94482421875, -1.6522216796875, -1.359619140625, -1.0670166015625, -0.7744140625, -0.4818115234375, -0.189208984375, 0.1033935546875, 0.39599609375, 0.6885986328125, 0.981201171875, 1.2738037109375, 1.56640625, 1.8590087890625, 2.151611328125, 2.4442138671875, 2.73681640625, 3.0294189453125, 3.322021484375, 3.6146240234375, 3.9072265625, 4.1998291015625, 4.492431640625, 4.7850341796875, 5.07763671875, 5.3702392578125, 5.662841796875, 5.9554443359375, 6.248046875, 6.5406494140625, 6.833251953125, 7.1258544921875, 7.41845703125, 7.7110595703125, 8.003662109375, 8.2962646484375, 8.5888671875, 8.8814697265625, 9.174072265625, 9.4666748046875, 9.75927734375, 10.0518798828125, 10.344482421875, 10.6370849609375, 10.9296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 5.0, 10.0, 5.0, 15.0, 13.0, 21.0, 24.0, 26.0, 35.0, 31.0, 41.0, 46.0, 49.0, 48.0, 42.0, 53.0, 46.0, 43.0, 39.0, 52.0, 53.0, 46.0, 36.0, 33.0, 33.0, 29.0, 18.0, 14.0, 22.0, 14.0, 13.0, 6.0, 4.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.8690185546875, -8.550537109375, -8.2320556640625, -7.91357421875, -7.5950927734375, -7.276611328125, -6.9581298828125, -6.6396484375, -6.3211669921875, -6.002685546875, -5.6842041015625, -5.36572265625, -5.0472412109375, -4.728759765625, -4.4102783203125, -4.091796875, -3.7733154296875, -3.454833984375, -3.1363525390625, -2.81787109375, -2.4993896484375, -2.180908203125, -1.8624267578125, -1.5439453125, -1.2254638671875, -0.906982421875, -0.5885009765625, -0.27001953125, 0.0484619140625, 0.366943359375, 0.6854248046875, 1.00390625, 1.3223876953125, 1.640869140625, 1.9593505859375, 2.27783203125, 2.5963134765625, 2.914794921875, 3.2332763671875, 3.5517578125, 3.8702392578125, 4.188720703125, 4.5072021484375, 4.82568359375, 5.1441650390625, 5.462646484375, 5.7811279296875, 6.099609375, 6.4180908203125, 6.736572265625, 7.0550537109375, 7.37353515625, 7.6920166015625, 8.010498046875, 8.3289794921875, 8.6474609375, 8.9659423828125, 9.284423828125, 9.6029052734375, 9.92138671875, 10.2398681640625, 10.558349609375, 10.8768310546875, 11.1953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 4.0, 9.0, 14.0, 20.0, 42.0, 61.0, 104.0, 167.0, 315.0, 698.0, 1461.0, 3474.0, 8918.0, 31473.0, 251853.0, 670989.0, 57251.0, 13053.0, 4816.0, 1923.0, 898.0, 459.0, 230.0, 115.0, 84.0, 34.0, 24.0, 26.0, 14.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.515625, -12.2188720703125, -11.922119140625, -11.6253662109375, -11.32861328125, -11.0318603515625, -10.735107421875, -10.4383544921875, -10.1416015625, -9.8448486328125, -9.548095703125, -9.2513427734375, -8.95458984375, -8.6578369140625, -8.361083984375, -8.0643310546875, -7.767578125, -7.4708251953125, -7.174072265625, -6.8773193359375, -6.58056640625, -6.2838134765625, -5.987060546875, -5.6903076171875, -5.3935546875, -5.0968017578125, -4.800048828125, -4.5032958984375, -4.20654296875, -3.9097900390625, -3.613037109375, -3.3162841796875, -3.01953125, -2.7227783203125, -2.426025390625, -2.1292724609375, -1.83251953125, -1.5357666015625, -1.239013671875, -0.9422607421875, -0.6455078125, -0.3487548828125, -0.052001953125, 0.2447509765625, 0.54150390625, 0.8382568359375, 1.135009765625, 1.4317626953125, 1.728515625, 2.0252685546875, 2.322021484375, 2.6187744140625, 2.91552734375, 3.2122802734375, 3.509033203125, 3.8057861328125, 4.1025390625, 4.3992919921875, 4.696044921875, 4.9927978515625, 5.28955078125, 5.5863037109375, 5.883056640625, 6.1798095703125, 6.4765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 8.0, 7.0, 15.0, 27.0, 39.0, 41.0, 62.0, 70.0, 132.0, 229.0, 101.0, 71.0, 69.0, 36.0, 30.0, 11.0, 15.0, 9.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00069427490234375, -0.0006656348705291748, -0.0006369948387145996, -0.0006083548069000244, -0.0005797147750854492, -0.000551074743270874, -0.0005224347114562988, -0.0004937946796417236, -0.00046515464782714844, -0.00043651461601257324, -0.00040787458419799805, -0.00037923455238342285, -0.00035059452056884766, -0.00032195448875427246, -0.00029331445693969727, -0.00026467442512512207, -0.00023603439331054688, -0.00020739436149597168, -0.00017875432968139648, -0.0001501142978668213, -0.0001214742660522461, -9.28342342376709e-05, -6.41942024230957e-05, -3.555417060852051e-05, -6.9141387939453125e-06, 2.1725893020629883e-05, 5.036592483520508e-05, 7.900595664978027e-05, 0.00010764598846435547, 0.00013628602027893066, 0.00016492605209350586, 0.00019356608390808105, 0.00022220611572265625, 0.00025084614753723145, 0.00027948617935180664, 0.00030812621116638184, 0.00033676624298095703, 0.0003654062747955322, 0.0003940463066101074, 0.0004226863384246826, 0.0004513263702392578, 0.000479966402053833, 0.0005086064338684082, 0.0005372464656829834, 0.0005658864974975586, 0.0005945265293121338, 0.000623166561126709, 0.0006518065929412842, 0.0006804466247558594, 0.0007090866565704346, 0.0007377266883850098, 0.000766366720199585, 0.0007950067520141602, 0.0008236467838287354, 0.0008522868156433105, 0.0008809268474578857, 0.0009095668792724609, 0.0009382069110870361, 0.0009668469429016113, 0.0009954869747161865, 0.0010241270065307617, 0.001052767038345337, 0.0010814070701599121, 0.0011100471019744873, 0.0011386871337890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 9.0, 7.0, 13.0, 32.0, 30.0, 50.0, 108.0, 238.0, 679.0, 3069.0, 42761.0, 961202.0, 36439.0, 2867.0, 609.0, 207.0, 101.0, 56.0, 23.0, 18.0, 16.0, 11.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.65625, -13.90380859375, -13.1513671875, -12.39892578125, -11.646484375, -10.89404296875, -10.1416015625, -9.38916015625, -8.63671875, -7.88427734375, -7.1318359375, -6.37939453125, -5.626953125, -4.87451171875, -4.1220703125, -3.36962890625, -2.6171875, -1.86474609375, -1.1123046875, -0.35986328125, 0.392578125, 1.14501953125, 1.8974609375, 2.64990234375, 3.40234375, 4.15478515625, 4.9072265625, 5.65966796875, 6.412109375, 7.16455078125, 7.9169921875, 8.66943359375, 9.421875, 10.17431640625, 10.9267578125, 11.67919921875, 12.431640625, 13.18408203125, 13.9365234375, 14.68896484375, 15.44140625, 16.19384765625, 16.9462890625, 17.69873046875, 18.451171875, 19.20361328125, 19.9560546875, 20.70849609375, 21.4609375, 22.21337890625, 22.9658203125, 23.71826171875, 24.470703125, 25.22314453125, 25.9755859375, 26.72802734375, 27.48046875, 28.23291015625, 28.9853515625, 29.73779296875, 30.490234375, 31.24267578125, 31.9951171875, 32.74755859375, 33.5]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 15.0, 15.0, 27.0, 34.0, 60.0, 92.0, 211.0, 260.0, 112.0, 63.0, 35.0, 26.0, 14.0, 7.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.152587890625, -14.57080078125, -13.989013671875, -13.4072265625, -12.825439453125, -12.24365234375, -11.661865234375, -11.080078125, -10.498291015625, -9.91650390625, -9.334716796875, -8.7529296875, -8.171142578125, -7.58935546875, -7.007568359375, -6.42578125, -5.843994140625, -5.26220703125, -4.680419921875, -4.0986328125, -3.516845703125, -2.93505859375, -2.353271484375, -1.771484375, -1.189697265625, -0.60791015625, -0.026123046875, 0.5556640625, 1.137451171875, 1.71923828125, 2.301025390625, 2.8828125, 3.464599609375, 4.04638671875, 4.628173828125, 5.2099609375, 5.791748046875, 6.37353515625, 6.955322265625, 7.537109375, 8.118896484375, 8.70068359375, 9.282470703125, 9.8642578125, 10.446044921875, 11.02783203125, 11.609619140625, 12.19140625, 12.773193359375, 13.35498046875, 13.936767578125, 14.5185546875, 15.100341796875, 15.68212890625, 16.263916015625, 16.845703125, 17.427490234375, 18.00927734375, 18.591064453125, 19.1728515625, 19.754638671875, 20.33642578125, 20.918212890625, 21.5]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 12.0, 41.0, 118.0, 267.0, 342.0, 167.0, 38.0, 11.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.1201629638672, -174.6456298828125, -167.17111206054688, -159.6965789794922, -152.2220458984375, -144.7475128173828, -137.27297973632812, -129.7984619140625, -122.32392883300781, -114.84939575195312, -107.37487030029297, -99.90034484863281, -92.42581176757812, -84.95127868652344, -77.47675323486328, -70.00222778320312, -62.52769470214844, -55.053165435791016, -47.578636169433594, -40.10410690307617, -32.62957763671875, -25.155048370361328, -17.680519104003906, -10.205989837646484, -2.7314605712890625, 4.743068695068359, 12.217597961425781, 19.692127227783203, 27.166656494140625, 34.64118576049805, 42.11571502685547, 49.59024429321289, 57.064788818359375, 64.53932189941406, 72.01384735107422, 79.48837280273438, 86.96290588378906, 94.43743896484375, 101.9119644165039, 109.38648986816406, 116.86102294921875, 124.33555603027344, 131.81008911132812, 139.28460693359375, 146.75914001464844, 154.23367309570312, 161.70819091796875, 169.18272399902344, 176.65725708007812, 184.1317901611328, 191.6063232421875, 199.08084106445312, 206.5553741455078, 214.0299072265625, 221.50442504882812, 228.9789581298828, 236.4534912109375, 243.9280242919922, 251.40255737304688, 258.8770751953125, 266.35162353515625, 273.8261413574219, 281.3006591796875, 288.77520751953125, 296.2497253417969]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 7.0, 5.0, 6.0, 13.0, 13.0, 11.0, 8.0, 18.0, 21.0, 16.0, 29.0, 26.0, 42.0, 32.0, 37.0, 39.0, 37.0, 48.0, 35.0, 53.0, 38.0, 42.0, 40.0, 39.0, 42.0, 31.0, 25.0, 38.0, 26.0, 28.0, 27.0, 21.0, 15.0, 16.0, 10.0, 12.0, 13.0, 14.0, 5.0, 6.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-67.58433532714844, -65.66551208496094, -63.74668502807617, -61.82786178588867, -59.90903854370117, -57.990211486816406, -56.071388244628906, -54.152565002441406, -52.23373794555664, -50.31491470336914, -48.396087646484375, -46.477264404296875, -44.558441162109375, -42.63961410522461, -40.72079086303711, -38.801963806152344, -36.883140563964844, -34.964317321777344, -33.04549026489258, -31.126667022705078, -29.207841873168945, -27.289016723632812, -25.370193481445312, -23.45136833190918, -21.532546997070312, -19.61372184753418, -17.69489860534668, -15.776073455810547, -13.857248306274414, -11.938424110412598, -10.019599914550781, -8.100774765014648, -6.181949615478516, -4.263124942779541, -2.3443005084991455, -0.42547607421875, 1.4933485984802246, 3.412173271179199, 5.330997467041016, 7.249822616577148, 9.168646812438965, 11.087471008300781, 13.006296157836914, 14.92512035369873, 16.843944549560547, 18.76276969909668, 20.681594848632812, 22.600418090820312, 24.519243240356445, 26.438068389892578, 28.356891632080078, 30.27571678161621, 32.194541931152344, 34.113365173339844, 36.032188415527344, 37.95101547241211, 39.86983871459961, 41.78866195678711, 43.707489013671875, 45.626312255859375, 47.545135498046875, 49.46396255493164, 51.38278579711914, 53.301612854003906, 55.220436096191406]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 12.0, 29.0, 31.0, 46.0, 93.0, 131.0, 219.0, 427.0, 931.0, 2359.0, 7652.0, 38431.0, 2638768.0, 1456087.0, 37016.0, 7780.0, 2421.0, 921.0, 426.0, 203.0, 105.0, 65.0, 41.0, 18.0, 15.0, 7.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.802734375, -24.02734375, -23.251953125, -22.4765625, -21.701171875, -20.92578125, -20.150390625, -19.375, -18.599609375, -17.82421875, -17.048828125, -16.2734375, -15.498046875, -14.72265625, -13.947265625, -13.171875, -12.396484375, -11.62109375, -10.845703125, -10.0703125, -9.294921875, -8.51953125, -7.744140625, -6.96875, -6.193359375, -5.41796875, -4.642578125, -3.8671875, -3.091796875, -2.31640625, -1.541015625, -0.765625, 0.009765625, 0.78515625, 1.560546875, 2.3359375, 3.111328125, 3.88671875, 4.662109375, 5.4375, 6.212890625, 6.98828125, 7.763671875, 8.5390625, 9.314453125, 10.08984375, 10.865234375, 11.640625, 12.416015625, 13.19140625, 13.966796875, 14.7421875, 15.517578125, 16.29296875, 17.068359375, 17.84375, 18.619140625, 19.39453125, 20.169921875, 20.9453125, 21.720703125, 22.49609375, 23.271484375, 24.046875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 19.0, 14.0, 30.0, 11.0, 29.0, 31.0, 42.0, 35.0, 46.0, 52.0, 60.0, 68.0, 47.0, 45.0, 49.0, 43.0, 36.0, 45.0, 44.0, 45.0, 24.0, 26.0, 21.0, 20.0, 20.0, 17.0, 15.0, 5.0, 5.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.048828125, -2.959503173828125, -2.87017822265625, -2.780853271484375, -2.6915283203125, -2.602203369140625, -2.51287841796875, -2.423553466796875, -2.334228515625, -2.244903564453125, -2.15557861328125, -2.066253662109375, -1.9769287109375, -1.887603759765625, -1.79827880859375, -1.708953857421875, -1.61962890625, -1.530303955078125, -1.44097900390625, -1.351654052734375, -1.2623291015625, -1.173004150390625, -1.08367919921875, -0.994354248046875, -0.905029296875, -0.815704345703125, -0.72637939453125, -0.637054443359375, -0.5477294921875, -0.458404541015625, -0.36907958984375, -0.279754638671875, -0.1904296875, -0.101104736328125, -0.01177978515625, 0.077545166015625, 0.1668701171875, 0.256195068359375, 0.34552001953125, 0.434844970703125, 0.524169921875, 0.613494873046875, 0.70281982421875, 0.792144775390625, 0.8814697265625, 0.970794677734375, 1.06011962890625, 1.149444580078125, 1.23876953125, 1.328094482421875, 1.41741943359375, 1.506744384765625, 1.5960693359375, 1.685394287109375, 1.77471923828125, 1.864044189453125, 1.953369140625, 2.042694091796875, 2.13201904296875, 2.221343994140625, 2.3106689453125, 2.399993896484375, 2.48931884765625, 2.578643798828125, 2.66796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 5.0, 9.0, 19.0, 20.0, 38.0, 67.0, 107.0, 223.0, 405.0, 927.0, 1909.0, 4746.0, 14327.0, 62371.0, 1756738.0, 2264660.0, 64305.0, 14721.0, 4841.0, 2033.0, 872.0, 438.0, 211.0, 118.0, 78.0, 46.0, 16.0, 8.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2109375, -14.6678466796875, -14.124755859375, -13.5816650390625, -13.03857421875, -12.4954833984375, -11.952392578125, -11.4093017578125, -10.8662109375, -10.3231201171875, -9.780029296875, -9.2369384765625, -8.69384765625, -8.1507568359375, -7.607666015625, -7.0645751953125, -6.521484375, -5.9783935546875, -5.435302734375, -4.8922119140625, -4.34912109375, -3.8060302734375, -3.262939453125, -2.7198486328125, -2.1767578125, -1.6336669921875, -1.090576171875, -0.5474853515625, -0.00439453125, 0.5386962890625, 1.081787109375, 1.6248779296875, 2.16796875, 2.7110595703125, 3.254150390625, 3.7972412109375, 4.34033203125, 4.8834228515625, 5.426513671875, 5.9696044921875, 6.5126953125, 7.0557861328125, 7.598876953125, 8.1419677734375, 8.68505859375, 9.2281494140625, 9.771240234375, 10.3143310546875, 10.857421875, 11.4005126953125, 11.943603515625, 12.4866943359375, 13.02978515625, 13.5728759765625, 14.115966796875, 14.6590576171875, 15.2021484375, 15.7452392578125, 16.288330078125, 16.8314208984375, 17.37451171875, 17.9176025390625, 18.460693359375, 19.0037841796875, 19.546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 16.0, 6.0, 17.0, 12.0, 26.0, 39.0, 54.0, 132.0, 313.0, 2241.0, 789.0, 190.0, 77.0, 63.0, 30.0, 18.0, 16.0, 8.0, 5.0, 2.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.484375, -7.1693115234375, -6.854248046875, -6.5391845703125, -6.22412109375, -5.9090576171875, -5.593994140625, -5.2789306640625, -4.9638671875, -4.6488037109375, -4.333740234375, -4.0186767578125, -3.70361328125, -3.3885498046875, -3.073486328125, -2.7584228515625, -2.443359375, -2.1282958984375, -1.813232421875, -1.4981689453125, -1.18310546875, -0.8680419921875, -0.552978515625, -0.2379150390625, 0.0771484375, 0.3922119140625, 0.707275390625, 1.0223388671875, 1.33740234375, 1.6524658203125, 1.967529296875, 2.2825927734375, 2.59765625, 2.9127197265625, 3.227783203125, 3.5428466796875, 3.85791015625, 4.1729736328125, 4.488037109375, 4.8031005859375, 5.1181640625, 5.4332275390625, 5.748291015625, 6.0633544921875, 6.37841796875, 6.6934814453125, 7.008544921875, 7.3236083984375, 7.638671875, 7.9537353515625, 8.268798828125, 8.5838623046875, 8.89892578125, 9.2139892578125, 9.529052734375, 9.8441162109375, 10.1591796875, 10.4742431640625, 10.789306640625, 11.1043701171875, 11.41943359375, 11.7344970703125, 12.049560546875, 12.3646240234375, 12.6796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 25.0, 51.0, 141.0, 223.0, 255.0, 176.0, 73.0, 34.0, 11.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.861888885498047, -25.419986724853516, -22.978084564208984, -20.53618049621582, -18.09427833557129, -15.652376174926758, -13.21047306060791, -10.768569946289062, -8.326667785644531, -5.884765148162842, -3.4428625106811523, -1.000959873199463, 1.4409427642822266, 3.882844924926758, 6.3247480392456055, 8.766651153564453, 11.208553314208984, 13.650455474853516, 16.092357635498047, 18.53426170349121, 20.976163864135742, 23.418066024780273, 25.859970092773438, 28.30187225341797, 30.7437744140625, 33.18567657470703, 35.62757873535156, 38.069480895996094, 40.511383056640625, 42.953285217285156, 45.39519119262695, 47.837093353271484, 50.27899169921875, 52.72089385986328, 55.16279602050781, 57.604698181152344, 60.046600341796875, 62.488502502441406, 64.93040466308594, 67.372314453125, 69.814208984375, 72.25611114501953, 74.69801330566406, 77.1399154663086, 79.58181762695312, 82.02371978759766, 84.46562194824219, 86.90753173828125, 89.34943389892578, 91.79133605957031, 94.23323822021484, 96.67514038085938, 99.1170425415039, 101.55894470214844, 104.00084686279297, 106.4427490234375, 108.88465881347656, 111.3265609741211, 113.76846313476562, 116.21036529541016, 118.65226745605469, 121.09416961669922, 123.53607177734375, 125.97798156738281, 128.4198760986328]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 5.0, 7.0, 13.0, 9.0, 12.0, 16.0, 10.0, 20.0, 27.0, 28.0, 28.0, 33.0, 39.0, 37.0, 26.0, 38.0, 36.0, 48.0, 50.0, 58.0, 48.0, 37.0, 41.0, 45.0, 30.0, 34.0, 34.0, 22.0, 33.0, 14.0, 23.0, 18.0, 11.0, 20.0, 12.0, 9.0, 9.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.93290138244629, -24.19645881652832, -23.46001434326172, -22.72357177734375, -21.98712921142578, -21.250686645507812, -20.51424217224121, -19.777799606323242, -19.04135513305664, -18.304912567138672, -17.56846809387207, -16.8320255279541, -16.095582962036133, -15.359139442443848, -14.622695922851562, -13.886253356933594, -13.149810791015625, -12.41336727142334, -11.676924705505371, -10.940481185913086, -10.204038619995117, -9.467595100402832, -8.731151580810547, -7.99470853805542, -7.258265495300293, -6.521822452545166, -5.785379409790039, -5.048935890197754, -4.312492847442627, -3.5760498046875, -2.839606285095215, -2.103163242340088, -1.3667221069335938, -0.6302789449691772, 0.10616421699523926, 0.8426074981689453, 1.5790505409240723, 2.315493583679199, 3.0519371032714844, 3.7883801460266113, 4.524823188781738, 5.261266231536865, 5.997709274291992, 6.734152793884277, 7.470595836639404, 8.207038879394531, 8.943482398986816, 9.679925918579102, 10.41636848449707, 11.152812004089355, 11.889254570007324, 12.62569808959961, 13.362140655517578, 14.098584175109863, 14.835027694702148, 15.571470260620117, 16.30791473388672, 17.044357299804688, 17.78080177307129, 18.517244338989258, 19.253686904907227, 19.990131378173828, 20.726573944091797, 21.463016510009766, 22.199459075927734]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 11.0, 7.0, 10.0, 17.0, 15.0, 15.0, 29.0, 35.0, 32.0, 76.0, 122.0, 187.0, 300.0, 527.0, 943.0, 1883.0, 3860.0, 8592.0, 21761.0, 60550.0, 175081.0, 360216.0, 262002.0, 95490.0, 33265.0, 12550.0, 5430.0, 2587.0, 1239.0, 657.0, 345.0, 224.0, 136.0, 89.0, 51.0, 53.0, 35.0, 15.0, 21.0, 13.0, 8.0, 12.0, 14.0, 3.0, 6.0, 5.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0], "bins": [-11.296875, -10.9617919921875, -10.626708984375, -10.2916259765625, -9.95654296875, -9.6214599609375, -9.286376953125, -8.9512939453125, -8.6162109375, -8.2811279296875, -7.946044921875, -7.6109619140625, -7.27587890625, -6.9407958984375, -6.605712890625, -6.2706298828125, -5.935546875, -5.6004638671875, -5.265380859375, -4.9302978515625, -4.59521484375, -4.2601318359375, -3.925048828125, -3.5899658203125, -3.2548828125, -2.9197998046875, -2.584716796875, -2.2496337890625, -1.91455078125, -1.5794677734375, -1.244384765625, -0.9093017578125, -0.57421875, -0.2391357421875, 0.095947265625, 0.4310302734375, 0.76611328125, 1.1011962890625, 1.436279296875, 1.7713623046875, 2.1064453125, 2.4415283203125, 2.776611328125, 3.1116943359375, 3.44677734375, 3.7818603515625, 4.116943359375, 4.4520263671875, 4.787109375, 5.1221923828125, 5.457275390625, 5.7923583984375, 6.12744140625, 6.4625244140625, 6.797607421875, 7.1326904296875, 7.4677734375, 7.8028564453125, 8.137939453125, 8.4730224609375, 8.80810546875, 9.1431884765625, 9.478271484375, 9.8133544921875, 10.1484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 4.0, 7.0, 8.0, 12.0, 14.0, 11.0, 16.0, 24.0, 30.0, 17.0, 34.0, 30.0, 44.0, 41.0, 67.0, 44.0, 41.0, 43.0, 40.0, 40.0, 44.0, 40.0, 51.0, 45.0, 34.0, 29.0, 38.0, 29.0, 19.0, 19.0, 11.0, 9.0, 12.0, 10.0, 12.0, 8.0, 10.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.38671875, -3.296051025390625, -3.20538330078125, -3.114715576171875, -3.0240478515625, -2.933380126953125, -2.84271240234375, -2.752044677734375, -2.661376953125, -2.570709228515625, -2.48004150390625, -2.389373779296875, -2.2987060546875, -2.208038330078125, -2.11737060546875, -2.026702880859375, -1.93603515625, -1.845367431640625, -1.75469970703125, -1.664031982421875, -1.5733642578125, -1.482696533203125, -1.39202880859375, -1.301361083984375, -1.210693359375, -1.120025634765625, -1.02935791015625, -0.938690185546875, -0.8480224609375, -0.757354736328125, -0.66668701171875, -0.576019287109375, -0.4853515625, -0.394683837890625, -0.30401611328125, -0.213348388671875, -0.1226806640625, -0.032012939453125, 0.05865478515625, 0.149322509765625, 0.239990234375, 0.330657958984375, 0.42132568359375, 0.511993408203125, 0.6026611328125, 0.693328857421875, 0.78399658203125, 0.874664306640625, 0.96533203125, 1.055999755859375, 1.14666748046875, 1.237335205078125, 1.3280029296875, 1.418670654296875, 1.50933837890625, 1.600006103515625, 1.690673828125, 1.781341552734375, 1.87200927734375, 1.962677001953125, 2.0533447265625, 2.144012451171875, 2.23468017578125, 2.325347900390625, 2.416015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 11.0, 17.0, 25.0, 35.0, 42.0, 63.0, 78.0, 134.0, 162.0, 350.0, 562.0, 1111.0, 2437.0, 6697.0, 23100.0, 111741.0, 494524.0, 323613.0, 61372.0, 14278.0, 4339.0, 1794.0, 821.0, 437.0, 281.0, 178.0, 91.0, 73.0, 44.0, 40.0, 27.0, 11.0, 17.0, 9.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.703125, -16.209228515625, -15.71533203125, -15.221435546875, -14.7275390625, -14.233642578125, -13.73974609375, -13.245849609375, -12.751953125, -12.258056640625, -11.76416015625, -11.270263671875, -10.7763671875, -10.282470703125, -9.78857421875, -9.294677734375, -8.80078125, -8.306884765625, -7.81298828125, -7.319091796875, -6.8251953125, -6.331298828125, -5.83740234375, -5.343505859375, -4.849609375, -4.355712890625, -3.86181640625, -3.367919921875, -2.8740234375, -2.380126953125, -1.88623046875, -1.392333984375, -0.8984375, -0.404541015625, 0.08935546875, 0.583251953125, 1.0771484375, 1.571044921875, 2.06494140625, 2.558837890625, 3.052734375, 3.546630859375, 4.04052734375, 4.534423828125, 5.0283203125, 5.522216796875, 6.01611328125, 6.510009765625, 7.00390625, 7.497802734375, 7.99169921875, 8.485595703125, 8.9794921875, 9.473388671875, 9.96728515625, 10.461181640625, 10.955078125, 11.448974609375, 11.94287109375, 12.436767578125, 12.9306640625, 13.424560546875, 13.91845703125, 14.412353515625, 14.90625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 5.0, 6.0, 11.0, 11.0, 20.0, 23.0, 19.0, 16.0, 31.0, 24.0, 37.0, 27.0, 44.0, 38.0, 46.0, 39.0, 44.0, 45.0, 41.0, 42.0, 48.0, 48.0, 50.0, 40.0, 34.0, 35.0, 29.0, 19.0, 25.0, 13.0, 14.0, 9.0, 11.0, 13.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.46875, -16.93408203125, -16.3994140625, -15.86474609375, -15.330078125, -14.79541015625, -14.2607421875, -13.72607421875, -13.19140625, -12.65673828125, -12.1220703125, -11.58740234375, -11.052734375, -10.51806640625, -9.9833984375, -9.44873046875, -8.9140625, -8.37939453125, -7.8447265625, -7.31005859375, -6.775390625, -6.24072265625, -5.7060546875, -5.17138671875, -4.63671875, -4.10205078125, -3.5673828125, -3.03271484375, -2.498046875, -1.96337890625, -1.4287109375, -0.89404296875, -0.359375, 0.17529296875, 0.7099609375, 1.24462890625, 1.779296875, 2.31396484375, 2.8486328125, 3.38330078125, 3.91796875, 4.45263671875, 4.9873046875, 5.52197265625, 6.056640625, 6.59130859375, 7.1259765625, 7.66064453125, 8.1953125, 8.72998046875, 9.2646484375, 9.79931640625, 10.333984375, 10.86865234375, 11.4033203125, 11.93798828125, 12.47265625, 13.00732421875, 13.5419921875, 14.07666015625, 14.611328125, 15.14599609375, 15.6806640625, 16.21533203125, 16.75]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 12.0, 13.0, 16.0, 45.0, 67.0, 126.0, 228.0, 450.0, 916.0, 2466.0, 7283.0, 27122.0, 141073.0, 584680.0, 227369.0, 41150.0, 10002.0, 3189.0, 1208.0, 572.0, 265.0, 108.0, 78.0, 58.0, 26.0, 16.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.142822265625, -7.84814453125, -7.553466796875, -7.2587890625, -6.964111328125, -6.66943359375, -6.374755859375, -6.080078125, -5.785400390625, -5.49072265625, -5.196044921875, -4.9013671875, -4.606689453125, -4.31201171875, -4.017333984375, -3.72265625, -3.427978515625, -3.13330078125, -2.838623046875, -2.5439453125, -2.249267578125, -1.95458984375, -1.659912109375, -1.365234375, -1.070556640625, -0.77587890625, -0.481201171875, -0.1865234375, 0.108154296875, 0.40283203125, 0.697509765625, 0.9921875, 1.286865234375, 1.58154296875, 1.876220703125, 2.1708984375, 2.465576171875, 2.76025390625, 3.054931640625, 3.349609375, 3.644287109375, 3.93896484375, 4.233642578125, 4.5283203125, 4.822998046875, 5.11767578125, 5.412353515625, 5.70703125, 6.001708984375, 6.29638671875, 6.591064453125, 6.8857421875, 7.180419921875, 7.47509765625, 7.769775390625, 8.064453125, 8.359130859375, 8.65380859375, 8.948486328125, 9.2431640625, 9.537841796875, 9.83251953125, 10.127197265625, 10.421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 17.0, 16.0, 19.0, 12.0, 28.0, 40.0, 47.0, 57.0, 78.0, 77.0, 91.0, 78.0, 75.0, 72.0, 56.0, 45.0, 32.0, 31.0, 23.0, 25.0, 14.0, 11.0, 7.0, 11.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007424354553222656, -0.0007156208157539368, -0.0006888061761856079, -0.000661991536617279, -0.0006351768970489502, -0.0006083622574806213, -0.0005815476179122925, -0.0005547329783439636, -0.0005279183387756348, -0.0005011036992073059, -0.00047428905963897705, -0.0004474744200706482, -0.00042065978050231934, -0.0003938451409339905, -0.0003670305013656616, -0.00034021586179733276, -0.0003134012222290039, -0.00028658658266067505, -0.0002597719430923462, -0.00023295730352401733, -0.00020614266395568848, -0.00017932802438735962, -0.00015251338481903076, -0.0001256987452507019, -9.888410568237305e-05, -7.206946611404419e-05, -4.525482654571533e-05, -1.8440186977386475e-05, 8.374452590942383e-06, 3.518909215927124e-05, 6.20037317276001e-05, 8.881837129592896e-05, 0.00011563301086425781, 0.00014244765043258667, 0.00016926229000091553, 0.00019607692956924438, 0.00022289156913757324, 0.0002497062087059021, 0.00027652084827423096, 0.0003033354878425598, 0.00033015012741088867, 0.00035696476697921753, 0.0003837794065475464, 0.00041059404611587524, 0.0004374086856842041, 0.00046422332525253296, 0.0004910379648208618, 0.0005178526043891907, 0.0005446672439575195, 0.0005714818835258484, 0.0005982965230941772, 0.0006251111626625061, 0.000651925802230835, 0.0006787404417991638, 0.0007055550813674927, 0.0007323697209358215, 0.0007591843605041504, 0.0007859990000724792, 0.0008128136396408081, 0.000839628279209137, 0.0008664429187774658, 0.0008932575583457947, 0.0009200721979141235, 0.0009468868374824524, 0.0009737014770507812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 5.0, 5.0, 22.0, 18.0, 27.0, 33.0, 44.0, 57.0, 130.0, 177.0, 316.0, 624.0, 1218.0, 3183.0, 11270.0, 69915.0, 514961.0, 383541.0, 49050.0, 8882.0, 2636.0, 1108.0, 526.0, 286.0, 159.0, 122.0, 62.0, 45.0, 40.0, 26.0, 9.0, 9.0, 9.0, 7.0, 4.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-11.7109375, -11.37548828125, -11.0400390625, -10.70458984375, -10.369140625, -10.03369140625, -9.6982421875, -9.36279296875, -9.02734375, -8.69189453125, -8.3564453125, -8.02099609375, -7.685546875, -7.35009765625, -7.0146484375, -6.67919921875, -6.34375, -6.00830078125, -5.6728515625, -5.33740234375, -5.001953125, -4.66650390625, -4.3310546875, -3.99560546875, -3.66015625, -3.32470703125, -2.9892578125, -2.65380859375, -2.318359375, -1.98291015625, -1.6474609375, -1.31201171875, -0.9765625, -0.64111328125, -0.3056640625, 0.02978515625, 0.365234375, 0.70068359375, 1.0361328125, 1.37158203125, 1.70703125, 2.04248046875, 2.3779296875, 2.71337890625, 3.048828125, 3.38427734375, 3.7197265625, 4.05517578125, 4.390625, 4.72607421875, 5.0615234375, 5.39697265625, 5.732421875, 6.06787109375, 6.4033203125, 6.73876953125, 7.07421875, 7.40966796875, 7.7451171875, 8.08056640625, 8.416015625, 8.75146484375, 9.0869140625, 9.42236328125, 9.7578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 8.0, 9.0, 19.0, 40.0, 43.0, 61.0, 74.0, 78.0, 81.0, 117.0, 112.0, 94.0, 60.0, 53.0, 35.0, 34.0, 15.0, 17.0, 14.0, 15.0, 3.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.964111328125, -15.53759765625, -15.111083984375, -14.6845703125, -14.258056640625, -13.83154296875, -13.405029296875, -12.978515625, -12.552001953125, -12.12548828125, -11.698974609375, -11.2724609375, -10.845947265625, -10.41943359375, -9.992919921875, -9.56640625, -9.139892578125, -8.71337890625, -8.286865234375, -7.8603515625, -7.433837890625, -7.00732421875, -6.580810546875, -6.154296875, -5.727783203125, -5.30126953125, -4.874755859375, -4.4482421875, -4.021728515625, -3.59521484375, -3.168701171875, -2.7421875, -2.315673828125, -1.88916015625, -1.462646484375, -1.0361328125, -0.609619140625, -0.18310546875, 0.243408203125, 0.669921875, 1.096435546875, 1.52294921875, 1.949462890625, 2.3759765625, 2.802490234375, 3.22900390625, 3.655517578125, 4.08203125, 4.508544921875, 4.93505859375, 5.361572265625, 5.7880859375, 6.214599609375, 6.64111328125, 7.067626953125, 7.494140625, 7.920654296875, 8.34716796875, 8.773681640625, 9.2001953125, 9.626708984375, 10.05322265625, 10.479736328125, 10.90625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 20.0, 78.0, 471.0, 369.0, 54.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.98785400390625, -253.12005615234375, -237.2522735595703, -221.38449096679688, -205.51669311523438, -189.64889526367188, -173.78111267089844, -157.913330078125, -142.0455322265625, -126.17774200439453, -110.30995178222656, -94.4421615600586, -78.57437133789062, -62.706581115722656, -46.83879089355469, -30.97100067138672, -15.10321044921875, 0.7645797729492188, 16.632369995117188, 32.500160217285156, 48.367950439453125, 64.2357406616211, 80.10353088378906, 95.97132110595703, 111.839111328125, 127.70690155029297, 143.57469177246094, 159.44247436523438, 175.31027221679688, 191.17807006835938, 207.0458526611328, 222.91363525390625, 238.78143310546875, 254.64923095703125, 270.51702880859375, 286.3847961425781, 302.2525939941406, 318.1203918457031, 333.9881591796875, 349.85595703125, 365.7237548828125, 381.591552734375, 397.4593505859375, 413.3271179199219, 429.1949157714844, 445.0627136230469, 460.93048095703125, 476.79827880859375, 492.66607666015625, 508.53387451171875, 524.4016723632812, 540.2694702148438, 556.13720703125, 572.0050048828125, 587.872802734375, 603.7406005859375, 619.6083984375, 635.4761962890625, 651.343994140625, 667.2117919921875, 683.07958984375, 698.9473266601562, 714.8151245117188, 730.6829223632812, 746.5507202148438]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 7.0, 14.0, 5.0, 10.0, 4.0, 15.0, 11.0, 18.0, 22.0, 28.0, 28.0, 28.0, 25.0, 32.0, 40.0, 38.0, 52.0, 51.0, 43.0, 37.0, 57.0, 47.0, 40.0, 39.0, 53.0, 36.0, 35.0, 30.0, 24.0, 26.0, 17.0, 19.0, 13.0, 13.0, 9.0, 11.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.45722961425781, -88.45296478271484, -85.44869995117188, -82.4444351196289, -79.44017028808594, -76.4359130859375, -73.43164825439453, -70.42738342285156, -67.4231185913086, -64.41885375976562, -61.414588928222656, -58.41032791137695, -55.406063079833984, -52.401798248291016, -49.39753723144531, -46.393272399902344, -43.389007568359375, -40.384742736816406, -37.38047790527344, -34.376216888427734, -31.371952056884766, -28.367687225341797, -25.36342430114746, -22.359161376953125, -19.354896545410156, -16.350631713867188, -13.346368789672852, -10.3421049118042, -7.337841033935547, -4.3335771560668945, -1.3293132781982422, 1.6749496459960938, 4.679222106933594, 7.683485984802246, 10.687749862670898, 13.69201374053955, 16.696277618408203, 19.700542449951172, 22.704805374145508, 25.709068298339844, 28.713333129882812, 31.71759796142578, 34.72186279296875, 37.72612380981445, 40.73038864135742, 43.73465347290039, 46.738914489746094, 49.74317932128906, 52.74744415283203, 55.751708984375, 58.75597381591797, 61.76023483276367, 64.76449584960938, 67.76876068115234, 70.77302551269531, 73.77729034423828, 76.78155517578125, 79.78582000732422, 82.79008483886719, 85.79434967041016, 88.79861450195312, 91.80287170410156, 94.80713653564453, 97.8114013671875, 100.81566619873047]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 3.0, 9.0, 14.0, 14.0, 12.0, 36.0, 31.0, 56.0, 111.0, 201.0, 361.0, 659.0, 1460.0, 4126.0, 18964.0, 4078698.0, 77376.0, 7696.0, 2383.0, 976.0, 428.0, 246.0, 162.0, 95.0, 57.0, 34.0, 18.0, 14.0, 8.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-40.3125, -39.244384765625, -38.17626953125, -37.108154296875, -36.0400390625, -34.971923828125, -33.90380859375, -32.835693359375, -31.767578125, -30.699462890625, -29.63134765625, -28.563232421875, -27.4951171875, -26.427001953125, -25.35888671875, -24.290771484375, -23.22265625, -22.154541015625, -21.08642578125, -20.018310546875, -18.9501953125, -17.882080078125, -16.81396484375, -15.745849609375, -14.677734375, -13.609619140625, -12.54150390625, -11.473388671875, -10.4052734375, -9.337158203125, -8.26904296875, -7.200927734375, -6.1328125, -5.064697265625, -3.99658203125, -2.928466796875, -1.8603515625, -0.792236328125, 0.27587890625, 1.343994140625, 2.412109375, 3.480224609375, 4.54833984375, 5.616455078125, 6.6845703125, 7.752685546875, 8.82080078125, 9.888916015625, 10.95703125, 12.025146484375, 13.09326171875, 14.161376953125, 15.2294921875, 16.297607421875, 17.36572265625, 18.433837890625, 19.501953125, 20.570068359375, 21.63818359375, 22.706298828125, 23.7744140625, 24.842529296875, 25.91064453125, 26.978759765625, 28.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 1.0, 7.0, 6.0, 8.0, 10.0, 16.0, 19.0, 23.0, 23.0, 33.0, 47.0, 42.0, 51.0, 65.0, 59.0, 56.0, 61.0, 65.0, 44.0, 60.0, 35.0, 54.0, 36.0, 34.0, 33.0, 19.0, 21.0, 13.0, 11.0, 5.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0390625, -3.89605712890625, -3.7530517578125, -3.61004638671875, -3.467041015625, -3.32403564453125, -3.1810302734375, -3.03802490234375, -2.89501953125, -2.75201416015625, -2.6090087890625, -2.46600341796875, -2.322998046875, -2.17999267578125, -2.0369873046875, -1.89398193359375, -1.7509765625, -1.60797119140625, -1.4649658203125, -1.32196044921875, -1.178955078125, -1.03594970703125, -0.8929443359375, -0.74993896484375, -0.60693359375, -0.46392822265625, -0.3209228515625, -0.17791748046875, -0.034912109375, 0.10809326171875, 0.2510986328125, 0.39410400390625, 0.537109375, 0.68011474609375, 0.8231201171875, 0.96612548828125, 1.109130859375, 1.25213623046875, 1.3951416015625, 1.53814697265625, 1.68115234375, 1.82415771484375, 1.9671630859375, 2.11016845703125, 2.253173828125, 2.39617919921875, 2.5391845703125, 2.68218994140625, 2.8251953125, 2.96820068359375, 3.1112060546875, 3.25421142578125, 3.397216796875, 3.54022216796875, 3.6832275390625, 3.82623291015625, 3.96923828125, 4.11224365234375, 4.2552490234375, 4.39825439453125, 4.541259765625, 4.68426513671875, 4.8272705078125, 4.97027587890625, 5.11328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 14.0, 18.0, 31.0, 34.0, 54.0, 76.0, 105.0, 159.0, 345.0, 617.0, 1306.0, 2909.0, 9042.0, 57472.0, 4065500.0, 43392.0, 7670.0, 2764.0, 1204.0, 605.0, 351.0, 192.0, 99.0, 79.0, 39.0, 40.0, 33.0, 22.0, 14.0, 17.0, 16.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.625, -22.873779296875, -22.12255859375, -21.371337890625, -20.6201171875, -19.868896484375, -19.11767578125, -18.366455078125, -17.615234375, -16.864013671875, -16.11279296875, -15.361572265625, -14.6103515625, -13.859130859375, -13.10791015625, -12.356689453125, -11.60546875, -10.854248046875, -10.10302734375, -9.351806640625, -8.6005859375, -7.849365234375, -7.09814453125, -6.346923828125, -5.595703125, -4.844482421875, -4.09326171875, -3.342041015625, -2.5908203125, -1.839599609375, -1.08837890625, -0.337158203125, 0.4140625, 1.165283203125, 1.91650390625, 2.667724609375, 3.4189453125, 4.170166015625, 4.92138671875, 5.672607421875, 6.423828125, 7.175048828125, 7.92626953125, 8.677490234375, 9.4287109375, 10.179931640625, 10.93115234375, 11.682373046875, 12.43359375, 13.184814453125, 13.93603515625, 14.687255859375, 15.4384765625, 16.189697265625, 16.94091796875, 17.692138671875, 18.443359375, 19.194580078125, 19.94580078125, 20.697021484375, 21.4482421875, 22.199462890625, 22.95068359375, 23.701904296875, 24.453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 18.0, 26.0, 74.0, 3305.0, 543.0, 55.0, 18.0, 8.0, 6.0, 2.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.52459716796875, -3.3031005859375, -3.08160400390625, -2.860107421875, -2.63861083984375, -2.4171142578125, -2.19561767578125, -1.97412109375, -1.75262451171875, -1.5311279296875, -1.30963134765625, -1.088134765625, -0.86663818359375, -0.6451416015625, -0.42364501953125, -0.2021484375, 0.01934814453125, 0.2408447265625, 0.46234130859375, 0.683837890625, 0.90533447265625, 1.1268310546875, 1.34832763671875, 1.56982421875, 1.79132080078125, 2.0128173828125, 2.23431396484375, 2.455810546875, 2.67730712890625, 2.8988037109375, 3.12030029296875, 3.341796875, 3.56329345703125, 3.7847900390625, 4.00628662109375, 4.227783203125, 4.44927978515625, 4.6707763671875, 4.89227294921875, 5.11376953125, 5.33526611328125, 5.5567626953125, 5.77825927734375, 5.999755859375, 6.22125244140625, 6.4427490234375, 6.66424560546875, 6.8857421875, 7.10723876953125, 7.3287353515625, 7.55023193359375, 7.771728515625, 7.99322509765625, 8.2147216796875, 8.43621826171875, 8.65771484375, 8.87921142578125, 9.1007080078125, 9.32220458984375, 9.543701171875, 9.76519775390625, 9.9866943359375, 10.20819091796875, 10.4296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 12.0, 16.0, 39.0, 89.0, 152.0, 200.0, 195.0, 126.0, 76.0, 42.0, 27.0, 14.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.069580078125, -23.43726921081543, -22.80495834350586, -22.17264747619629, -21.54033660888672, -20.90802574157715, -20.275714874267578, -19.64340591430664, -19.011093139648438, -18.378782272338867, -17.746471405029297, -17.114160537719727, -16.481849670410156, -15.849538803100586, -15.217228889465332, -14.584918022155762, -13.952608108520508, -13.320297241210938, -12.687986373901367, -12.055675506591797, -11.423364639282227, -10.791053771972656, -10.158743858337402, -9.526432991027832, -8.894122123718262, -8.261811256408691, -7.629500389099121, -6.997189998626709, -6.364879131317139, -5.732568264007568, -5.100257873535156, -4.467947006225586, -3.8356380462646484, -3.203327178955078, -2.571016550064087, -1.9387058019638062, -1.3063950538635254, -0.6740841865539551, -0.04177355766296387, 0.5905370712280273, 1.2228479385375977, 1.8551586866378784, 2.487469434738159, 3.1197800636291504, 3.7520909309387207, 4.384401798248291, 5.016712188720703, 5.649023056030273, 6.281333923339844, 6.913644790649414, 7.545955657958984, 8.178266525268555, 8.810577392578125, 9.442888259887695, 10.07519817352295, 10.70750904083252, 11.33981990814209, 11.97213077545166, 12.60444164276123, 13.2367525100708, 13.869062423706055, 14.501373291015625, 15.133684158325195, 15.765995025634766, 16.398305892944336]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 7.0, 12.0, 12.0, 15.0, 21.0, 24.0, 28.0, 31.0, 28.0, 43.0, 49.0, 38.0, 53.0, 50.0, 62.0, 38.0, 52.0, 55.0, 44.0, 30.0, 37.0, 35.0, 19.0, 32.0, 33.0, 25.0, 11.0, 16.0, 18.0, 18.0, 11.0, 7.0, 9.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.743284225463867, -7.49510383605957, -7.246923446655273, -6.998743057250977, -6.75056266784668, -6.502382278442383, -6.254201412200928, -6.006021022796631, -5.757840633392334, -5.509660243988037, -5.26147985458374, -5.013299465179443, -4.765118598937988, -4.516938209533691, -4.2687578201293945, -4.020577430725098, -3.772397041320801, -3.524216651916504, -3.276036262512207, -3.027855634689331, -2.779675245285034, -2.5314948558807373, -2.2833142280578613, -2.0351338386535645, -1.7869534492492676, -1.5387730598449707, -1.2905925512313843, -1.0424120426177979, -0.794231653213501, -0.5460512638092041, -0.2978707551956177, -0.04969024658203125, 0.19849014282226562, 0.4466705918312073, 0.6948510408401489, 0.9430314898490906, 1.1912119388580322, 1.439392328262329, 1.6875728368759155, 1.935753345489502, 2.183933734893799, 2.4321141242980957, 2.6802945137023926, 2.9284751415252686, 3.1766555309295654, 3.4248359203338623, 3.6730165481567383, 3.921196937561035, 4.169377326965332, 4.417557716369629, 4.665738105773926, 4.913918495178223, 5.1620988845825195, 5.410279273986816, 5.6584601402282715, 5.906640529632568, 6.154820919036865, 6.403001308441162, 6.651181697845459, 6.899362087249756, 7.147542953491211, 7.395723342895508, 7.643903732299805, 7.892084121704102, 8.140264511108398]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 10.0, 11.0, 17.0, 23.0, 41.0, 42.0, 75.0, 98.0, 162.0, 270.0, 432.0, 670.0, 1096.0, 1865.0, 3631.0, 7119.0, 15009.0, 34957.0, 84668.0, 199001.0, 313148.0, 217391.0, 96094.0, 38938.0, 16741.0, 7869.0, 4019.0, 2029.0, 1203.0, 653.0, 448.0, 280.0, 173.0, 105.0, 68.0, 53.0, 36.0, 35.0, 18.0, 13.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.796875, -8.5181884765625, -8.239501953125, -7.9608154296875, -7.68212890625, -7.4034423828125, -7.124755859375, -6.8460693359375, -6.5673828125, -6.2886962890625, -6.010009765625, -5.7313232421875, -5.45263671875, -5.1739501953125, -4.895263671875, -4.6165771484375, -4.337890625, -4.0592041015625, -3.780517578125, -3.5018310546875, -3.22314453125, -2.9444580078125, -2.665771484375, -2.3870849609375, -2.1083984375, -1.8297119140625, -1.551025390625, -1.2723388671875, -0.99365234375, -0.7149658203125, -0.436279296875, -0.1575927734375, 0.12109375, 0.3997802734375, 0.678466796875, 0.9571533203125, 1.23583984375, 1.5145263671875, 1.793212890625, 2.0718994140625, 2.3505859375, 2.6292724609375, 2.907958984375, 3.1866455078125, 3.46533203125, 3.7440185546875, 4.022705078125, 4.3013916015625, 4.580078125, 4.8587646484375, 5.137451171875, 5.4161376953125, 5.69482421875, 5.9735107421875, 6.252197265625, 6.5308837890625, 6.8095703125, 7.0882568359375, 7.366943359375, 7.6456298828125, 7.92431640625, 8.2030029296875, 8.481689453125, 8.7603759765625, 9.0390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 7.0, 14.0, 20.0, 14.0, 25.0, 22.0, 27.0, 44.0, 41.0, 56.0, 49.0, 67.0, 52.0, 60.0, 51.0, 60.0, 48.0, 57.0, 48.0, 45.0, 31.0, 32.0, 15.0, 19.0, 13.0, 14.0, 6.0, 9.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.9432373046875, -3.800537109375, -3.6578369140625, -3.51513671875, -3.3724365234375, -3.229736328125, -3.0870361328125, -2.9443359375, -2.8016357421875, -2.658935546875, -2.5162353515625, -2.37353515625, -2.2308349609375, -2.088134765625, -1.9454345703125, -1.802734375, -1.6600341796875, -1.517333984375, -1.3746337890625, -1.23193359375, -1.0892333984375, -0.946533203125, -0.8038330078125, -0.6611328125, -0.5184326171875, -0.375732421875, -0.2330322265625, -0.09033203125, 0.0523681640625, 0.195068359375, 0.3377685546875, 0.48046875, 0.6231689453125, 0.765869140625, 0.9085693359375, 1.05126953125, 1.1939697265625, 1.336669921875, 1.4793701171875, 1.6220703125, 1.7647705078125, 1.907470703125, 2.0501708984375, 2.19287109375, 2.3355712890625, 2.478271484375, 2.6209716796875, 2.763671875, 2.9063720703125, 3.049072265625, 3.1917724609375, 3.33447265625, 3.4771728515625, 3.619873046875, 3.7625732421875, 3.9052734375, 4.0479736328125, 4.190673828125, 4.3333740234375, 4.47607421875, 4.6187744140625, 4.761474609375, 4.9041748046875, 5.046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 14.0, 8.0, 15.0, 16.0, 26.0, 33.0, 45.0, 65.0, 85.0, 127.0, 165.0, 253.0, 353.0, 659.0, 1254.0, 3110.0, 9647.0, 41420.0, 257274.0, 587574.0, 114974.0, 21172.0, 5845.0, 1994.0, 913.0, 485.0, 318.0, 186.0, 125.0, 108.0, 74.0, 39.0, 31.0, 27.0, 28.0, 22.0, 19.0, 14.0, 5.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.96875, -18.41552734375, -17.8623046875, -17.30908203125, -16.755859375, -16.20263671875, -15.6494140625, -15.09619140625, -14.54296875, -13.98974609375, -13.4365234375, -12.88330078125, -12.330078125, -11.77685546875, -11.2236328125, -10.67041015625, -10.1171875, -9.56396484375, -9.0107421875, -8.45751953125, -7.904296875, -7.35107421875, -6.7978515625, -6.24462890625, -5.69140625, -5.13818359375, -4.5849609375, -4.03173828125, -3.478515625, -2.92529296875, -2.3720703125, -1.81884765625, -1.265625, -0.71240234375, -0.1591796875, 0.39404296875, 0.947265625, 1.50048828125, 2.0537109375, 2.60693359375, 3.16015625, 3.71337890625, 4.2666015625, 4.81982421875, 5.373046875, 5.92626953125, 6.4794921875, 7.03271484375, 7.5859375, 8.13916015625, 8.6923828125, 9.24560546875, 9.798828125, 10.35205078125, 10.9052734375, 11.45849609375, 12.01171875, 12.56494140625, 13.1181640625, 13.67138671875, 14.224609375, 14.77783203125, 15.3310546875, 15.88427734375, 16.4375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 10.0, 8.0, 12.0, 15.0, 21.0, 23.0, 24.0, 28.0, 34.0, 47.0, 46.0, 41.0, 54.0, 53.0, 52.0, 57.0, 40.0, 36.0, 45.0, 54.0, 40.0, 42.0, 26.0, 30.0, 26.0, 28.0, 15.0, 17.0, 18.0, 7.0, 11.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.625, -22.8583984375, -22.091796875, -21.3251953125, -20.55859375, -19.7919921875, -19.025390625, -18.2587890625, -17.4921875, -16.7255859375, -15.958984375, -15.1923828125, -14.42578125, -13.6591796875, -12.892578125, -12.1259765625, -11.359375, -10.5927734375, -9.826171875, -9.0595703125, -8.29296875, -7.5263671875, -6.759765625, -5.9931640625, -5.2265625, -4.4599609375, -3.693359375, -2.9267578125, -2.16015625, -1.3935546875, -0.626953125, 0.1396484375, 0.90625, 1.6728515625, 2.439453125, 3.2060546875, 3.97265625, 4.7392578125, 5.505859375, 6.2724609375, 7.0390625, 7.8056640625, 8.572265625, 9.3388671875, 10.10546875, 10.8720703125, 11.638671875, 12.4052734375, 13.171875, 13.9384765625, 14.705078125, 15.4716796875, 16.23828125, 17.0048828125, 17.771484375, 18.5380859375, 19.3046875, 20.0712890625, 20.837890625, 21.6044921875, 22.37109375, 23.1376953125, 23.904296875, 24.6708984375, 25.4375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 12.0, 12.0, 30.0, 44.0, 40.0, 87.0, 110.0, 217.0, 473.0, 1026.0, 2716.0, 9179.0, 41856.0, 278077.0, 584643.0, 103627.0, 18611.0, 4692.0, 1666.0, 638.0, 315.0, 169.0, 98.0, 58.0, 48.0, 32.0, 20.0, 14.0, 13.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.31988525390625, -7.0928955078125, -6.86590576171875, -6.638916015625, -6.41192626953125, -6.1849365234375, -5.95794677734375, -5.73095703125, -5.50396728515625, -5.2769775390625, -5.04998779296875, -4.822998046875, -4.59600830078125, -4.3690185546875, -4.14202880859375, -3.9150390625, -3.68804931640625, -3.4610595703125, -3.23406982421875, -3.007080078125, -2.78009033203125, -2.5531005859375, -2.32611083984375, -2.09912109375, -1.87213134765625, -1.6451416015625, -1.41815185546875, -1.191162109375, -0.96417236328125, -0.7371826171875, -0.51019287109375, -0.283203125, -0.05621337890625, 0.1707763671875, 0.39776611328125, 0.624755859375, 0.85174560546875, 1.0787353515625, 1.30572509765625, 1.53271484375, 1.75970458984375, 1.9866943359375, 2.21368408203125, 2.440673828125, 2.66766357421875, 2.8946533203125, 3.12164306640625, 3.3486328125, 3.57562255859375, 3.8026123046875, 4.02960205078125, 4.256591796875, 4.48358154296875, 4.7105712890625, 4.93756103515625, 5.16455078125, 5.39154052734375, 5.6185302734375, 5.84552001953125, 6.072509765625, 6.29949951171875, 6.5264892578125, 6.75347900390625, 6.98046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 7.0, 8.0, 14.0, 10.0, 20.0, 32.0, 44.0, 58.0, 82.0, 83.0, 100.0, 107.0, 81.0, 92.0, 75.0, 55.0, 34.0, 25.0, 17.0, 15.0, 16.0, 7.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00115966796875, -0.0011277943849563599, -0.0010959208011627197, -0.0010640472173690796, -0.0010321736335754395, -0.0010003000497817993, -0.0009684264659881592, -0.000936552882194519, -0.0009046792984008789, -0.0008728057146072388, -0.0008409321308135986, -0.0008090585470199585, -0.0007771849632263184, -0.0007453113794326782, -0.0007134377956390381, -0.000681564211845398, -0.0006496906280517578, -0.0006178170442581177, -0.0005859434604644775, -0.0005540698766708374, -0.0005221962928771973, -0.0004903227090835571, -0.000458449125289917, -0.00042657554149627686, -0.0003947019577026367, -0.0003628283739089966, -0.00033095479011535645, -0.0002990812063217163, -0.00026720762252807617, -0.00023533403873443604, -0.0002034604549407959, -0.00017158687114715576, -0.00013971328735351562, -0.00010783970355987549, -7.596611976623535e-05, -4.4092535972595215e-05, -1.2218952178955078e-05, 1.965463161468506e-05, 5.1528215408325195e-05, 8.340179920196533e-05, 0.00011527538299560547, 0.0001471489667892456, 0.00017902255058288574, 0.00021089613437652588, 0.00024276971817016602, 0.00027464330196380615, 0.0003065168857574463, 0.0003383904695510864, 0.00037026405334472656, 0.0004021376371383667, 0.00043401122093200684, 0.00046588480472564697, 0.0004977583885192871, 0.0005296319723129272, 0.0005615055561065674, 0.0005933791399002075, 0.0006252527236938477, 0.0006571263074874878, 0.0006889998912811279, 0.0007208734750747681, 0.0007527470588684082, 0.0007846206426620483, 0.0008164942264556885, 0.0008483678102493286, 0.0008802413940429688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 7.0, 3.0, 10.0, 11.0, 11.0, 25.0, 17.0, 32.0, 47.0, 88.0, 171.0, 261.0, 504.0, 944.0, 2101.0, 6754.0, 36605.0, 338562.0, 578625.0, 68202.0, 10221.0, 2800.0, 1165.0, 544.0, 295.0, 197.0, 118.0, 65.0, 52.0, 23.0, 31.0, 17.0, 13.0, 6.0, 7.0, 6.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-9.5859375, -9.32073974609375, -9.0555419921875, -8.79034423828125, -8.525146484375, -8.25994873046875, -7.9947509765625, -7.72955322265625, -7.46435546875, -7.19915771484375, -6.9339599609375, -6.66876220703125, -6.403564453125, -6.13836669921875, -5.8731689453125, -5.60797119140625, -5.3427734375, -5.07757568359375, -4.8123779296875, -4.54718017578125, -4.281982421875, -4.01678466796875, -3.7515869140625, -3.48638916015625, -3.22119140625, -2.95599365234375, -2.6907958984375, -2.42559814453125, -2.160400390625, -1.89520263671875, -1.6300048828125, -1.36480712890625, -1.099609375, -0.83441162109375, -0.5692138671875, -0.30401611328125, -0.038818359375, 0.22637939453125, 0.4915771484375, 0.75677490234375, 1.02197265625, 1.28717041015625, 1.5523681640625, 1.81756591796875, 2.082763671875, 2.34796142578125, 2.6131591796875, 2.87835693359375, 3.1435546875, 3.40875244140625, 3.6739501953125, 3.93914794921875, 4.204345703125, 4.46954345703125, 4.7347412109375, 4.99993896484375, 5.26513671875, 5.53033447265625, 5.7955322265625, 6.06072998046875, 6.325927734375, 6.59112548828125, 6.8563232421875, 7.12152099609375, 7.38671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 6.0, 3.0, 4.0, 9.0, 10.0, 9.0, 11.0, 38.0, 24.0, 36.0, 56.0, 68.0, 64.0, 77.0, 64.0, 90.0, 87.0, 61.0, 52.0, 56.0, 41.0, 33.0, 21.0, 19.0, 11.0, 15.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.98516845703125, -8.7359619140625, -8.48675537109375, -8.237548828125, -7.98834228515625, -7.7391357421875, -7.48992919921875, -7.24072265625, -6.99151611328125, -6.7423095703125, -6.49310302734375, -6.243896484375, -5.99468994140625, -5.7454833984375, -5.49627685546875, -5.2470703125, -4.99786376953125, -4.7486572265625, -4.49945068359375, -4.250244140625, -4.00103759765625, -3.7518310546875, -3.50262451171875, -3.25341796875, -3.00421142578125, -2.7550048828125, -2.50579833984375, -2.256591796875, -2.00738525390625, -1.7581787109375, -1.50897216796875, -1.259765625, -1.01055908203125, -0.7613525390625, -0.51214599609375, -0.262939453125, -0.01373291015625, 0.2354736328125, 0.48468017578125, 0.73388671875, 0.98309326171875, 1.2322998046875, 1.48150634765625, 1.730712890625, 1.97991943359375, 2.2291259765625, 2.47833251953125, 2.7275390625, 2.97674560546875, 3.2259521484375, 3.47515869140625, 3.724365234375, 3.97357177734375, 4.2227783203125, 4.47198486328125, 4.72119140625, 4.97039794921875, 5.2196044921875, 5.46881103515625, 5.718017578125, 5.96722412109375, 6.2164306640625, 6.46563720703125, 6.71484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 20.0, 130.0, 516.0, 297.0, 32.0, 10.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.62188720703125, -186.0924530029297, -171.56300354003906, -157.0335693359375, -142.50413513183594, -127.97469329833984, -113.44525146484375, -98.91581726074219, -84.3863754272461, -69.85693359375, -55.32749938964844, -40.798057556152344, -26.268619537353516, -11.739181518554688, 2.7902603149414062, 17.31969451904297, 31.849136352539062, 46.37857437133789, 60.90801239013672, 75.43745422363281, 89.96688842773438, 104.49633026123047, 119.02577209472656, 133.55520629882812, 148.08465576171875, 162.6140899658203, 177.14353942871094, 191.6729736328125, 206.20240783691406, 220.73184204101562, 235.26129150390625, 249.7907257080078, 264.3201599121094, 278.849609375, 293.3790283203125, 307.9084777832031, 322.43792724609375, 336.96734619140625, 351.4967956542969, 366.0262451171875, 380.5556640625, 395.0851135253906, 409.6145324707031, 424.14398193359375, 438.6734313964844, 453.2028503417969, 467.7322998046875, 482.26171875, 496.79119873046875, 511.3206481933594, 525.85009765625, 540.3795166015625, 554.908935546875, 569.4384155273438, 583.9678344726562, 598.4972534179688, 613.0266723632812, 627.5560913085938, 642.0855712890625, 656.614990234375, 671.1444091796875, 685.6738891601562, 700.2033081054688, 714.7327270507812, 729.26220703125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 10.0, 16.0, 9.0, 16.0, 13.0, 21.0, 19.0, 21.0, 26.0, 49.0, 44.0, 33.0, 57.0, 46.0, 52.0, 53.0, 64.0, 54.0, 56.0, 49.0, 40.0, 28.0, 33.0, 31.0, 30.0, 18.0, 17.0, 22.0, 6.0, 14.0, 12.0, 6.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-98.25900268554688, -94.96586608886719, -91.67272186279297, -88.37958526611328, -85.0864486694336, -81.79330444335938, -78.50016784667969, -75.20703125, -71.91389465332031, -68.62075805664062, -65.3276138305664, -62.03447723388672, -58.74134063720703, -55.44820022583008, -52.155059814453125, -48.86192321777344, -45.568782806396484, -42.27564239501953, -38.982505798339844, -35.68936538696289, -32.3962287902832, -29.10308837890625, -25.80994987487793, -22.51681137084961, -19.22367286682129, -15.930534362792969, -12.637395858764648, -9.344256401062012, -6.051117897033691, -2.7579784393310547, 0.5351600646972656, 3.828298568725586, 7.121437072753906, 10.414575576782227, 13.707714080810547, 17.0008544921875, 20.293991088867188, 23.58713150024414, 26.88027000427246, 30.17340850830078, 33.46654510498047, 36.75968551635742, 40.05282211303711, 43.34596252441406, 46.63909912109375, 49.9322395324707, 53.225379943847656, 56.518516540527344, 59.8116569519043, 63.10479736328125, 66.39793395996094, 69.69107055664062, 72.98421478271484, 76.27735137939453, 79.57048797607422, 82.86363220214844, 86.15676879882812, 89.44990539550781, 92.74304962158203, 96.03618621826172, 99.3293228149414, 102.62246704101562, 105.91560363769531, 109.208740234375, 112.50187683105469]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 5.0, 14.0, 22.0, 39.0, 81.0, 119.0, 208.0, 488.0, 1118.0, 3428.0, 14687.0, 661999.0, 3490648.0, 15555.0, 3520.0, 1240.0, 513.0, 265.0, 136.0, 71.0, 39.0, 30.0, 13.0, 5.0, 9.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.612060546875, -22.97412109375, -22.336181640625, -21.6982421875, -21.060302734375, -20.42236328125, -19.784423828125, -19.146484375, -18.508544921875, -17.87060546875, -17.232666015625, -16.5947265625, -15.956787109375, -15.31884765625, -14.680908203125, -14.04296875, -13.405029296875, -12.76708984375, -12.129150390625, -11.4912109375, -10.853271484375, -10.21533203125, -9.577392578125, -8.939453125, -8.301513671875, -7.66357421875, -7.025634765625, -6.3876953125, -5.749755859375, -5.11181640625, -4.473876953125, -3.8359375, -3.197998046875, -2.56005859375, -1.922119140625, -1.2841796875, -0.646240234375, -0.00830078125, 0.629638671875, 1.267578125, 1.905517578125, 2.54345703125, 3.181396484375, 3.8193359375, 4.457275390625, 5.09521484375, 5.733154296875, 6.37109375, 7.009033203125, 7.64697265625, 8.284912109375, 8.9228515625, 9.560791015625, 10.19873046875, 10.836669921875, 11.474609375, 12.112548828125, 12.75048828125, 13.388427734375, 14.0263671875, 14.664306640625, 15.30224609375, 15.940185546875, 16.578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 1.0, 4.0, 13.0, 16.0, 16.0, 26.0, 19.0, 26.0, 31.0, 36.0, 39.0, 46.0, 52.0, 50.0, 74.0, 65.0, 56.0, 47.0, 54.0, 46.0, 59.0, 39.0, 36.0, 34.0, 24.0, 20.0, 17.0, 12.0, 5.0, 9.0, 4.0, 7.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.1629638671875, -4.013427734375, -3.8638916015625, -3.71435546875, -3.5648193359375, -3.415283203125, -3.2657470703125, -3.1162109375, -2.9666748046875, -2.817138671875, -2.6676025390625, -2.51806640625, -2.3685302734375, -2.218994140625, -2.0694580078125, -1.919921875, -1.7703857421875, -1.620849609375, -1.4713134765625, -1.32177734375, -1.1722412109375, -1.022705078125, -0.8731689453125, -0.7236328125, -0.5740966796875, -0.424560546875, -0.2750244140625, -0.12548828125, 0.0240478515625, 0.173583984375, 0.3231201171875, 0.47265625, 0.6221923828125, 0.771728515625, 0.9212646484375, 1.07080078125, 1.2203369140625, 1.369873046875, 1.5194091796875, 1.6689453125, 1.8184814453125, 1.968017578125, 2.1175537109375, 2.26708984375, 2.4166259765625, 2.566162109375, 2.7156982421875, 2.865234375, 3.0147705078125, 3.164306640625, 3.3138427734375, 3.46337890625, 3.6129150390625, 3.762451171875, 3.9119873046875, 4.0615234375, 4.2110595703125, 4.360595703125, 4.5101318359375, 4.65966796875, 4.8092041015625, 4.958740234375, 5.1082763671875, 5.2578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 13.0, 6.0, 4.0, 23.0, 38.0, 29.0, 44.0, 70.0, 66.0, 107.0, 149.0, 226.0, 291.0, 418.0, 524.0, 744.0, 1046.0, 1429.0, 2338.0, 3780.0, 6411.0, 11819.0, 26993.0, 82712.0, 3315647.0, 619629.0, 68510.0, 23630.0, 10897.0, 5844.0, 3501.0, 2228.0, 1506.0, 1010.0, 752.0, 482.0, 347.0, 258.0, 185.0, 159.0, 116.0, 80.0, 52.0, 51.0, 41.0, 16.0, 18.0, 12.0, 8.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.0078125, -5.82537841796875, -5.6429443359375, -5.46051025390625, -5.278076171875, -5.09564208984375, -4.9132080078125, -4.73077392578125, -4.54833984375, -4.36590576171875, -4.1834716796875, -4.00103759765625, -3.818603515625, -3.63616943359375, -3.4537353515625, -3.27130126953125, -3.0888671875, -2.90643310546875, -2.7239990234375, -2.54156494140625, -2.359130859375, -2.17669677734375, -1.9942626953125, -1.81182861328125, -1.62939453125, -1.44696044921875, -1.2645263671875, -1.08209228515625, -0.899658203125, -0.71722412109375, -0.5347900390625, -0.35235595703125, -0.169921875, 0.01251220703125, 0.1949462890625, 0.37738037109375, 0.559814453125, 0.74224853515625, 0.9246826171875, 1.10711669921875, 1.28955078125, 1.47198486328125, 1.6544189453125, 1.83685302734375, 2.019287109375, 2.20172119140625, 2.3841552734375, 2.56658935546875, 2.7490234375, 2.93145751953125, 3.1138916015625, 3.29632568359375, 3.478759765625, 3.66119384765625, 3.8436279296875, 4.02606201171875, 4.20849609375, 4.39093017578125, 4.5733642578125, 4.75579833984375, 4.938232421875, 5.12066650390625, 5.3031005859375, 5.48553466796875, 5.66796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 11.0, 15.0, 30.0, 43.0, 70.0, 162.0, 2773.0, 589.0, 128.0, 73.0, 45.0, 23.0, 15.0, 12.0, 12.0, 6.0, 5.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.537109375, -2.464385986328125, -2.39166259765625, -2.318939208984375, -2.2462158203125, -2.173492431640625, -2.10076904296875, -2.028045654296875, -1.955322265625, -1.882598876953125, -1.80987548828125, -1.737152099609375, -1.6644287109375, -1.591705322265625, -1.51898193359375, -1.446258544921875, -1.37353515625, -1.300811767578125, -1.22808837890625, -1.155364990234375, -1.0826416015625, -1.009918212890625, -0.93719482421875, -0.864471435546875, -0.791748046875, -0.719024658203125, -0.64630126953125, -0.573577880859375, -0.5008544921875, -0.428131103515625, -0.35540771484375, -0.282684326171875, -0.2099609375, -0.137237548828125, -0.06451416015625, 0.008209228515625, 0.0809326171875, 0.153656005859375, 0.22637939453125, 0.299102783203125, 0.371826171875, 0.444549560546875, 0.51727294921875, 0.589996337890625, 0.6627197265625, 0.735443115234375, 0.80816650390625, 0.880889892578125, 0.95361328125, 1.026336669921875, 1.09906005859375, 1.171783447265625, 1.2445068359375, 1.317230224609375, 1.38995361328125, 1.462677001953125, 1.535400390625, 1.608123779296875, 1.68084716796875, 1.753570556640625, 1.8262939453125, 1.899017333984375, 1.97174072265625, 2.044464111328125, 2.1171875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 14.0, 21.0, 29.0, 55.0, 72.0, 102.0, 127.0, 129.0, 108.0, 111.0, 83.0, 50.0, 39.0, 19.0, 16.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.549036026000977, -14.209025382995605, -13.869013786315918, -13.529003143310547, -13.18899154663086, -12.848980903625488, -12.508970260620117, -12.16895866394043, -11.828948020935059, -11.488937377929688, -11.14892578125, -10.808915138244629, -10.468904495239258, -10.12889289855957, -9.7888822555542, -9.448871612548828, -9.10886001586914, -8.76884937286377, -8.428837776184082, -8.088827133178711, -7.748816013336182, -7.408804893493652, -7.068794250488281, -6.728783130645752, -6.388772010803223, -6.048760890960693, -5.708749771118164, -5.368739128112793, -5.028728008270264, -4.688716888427734, -4.348706245422363, -4.008695125579834, -3.6686840057373047, -3.3286728858947754, -2.988662004470825, -2.648651123046875, -2.3086400032043457, -1.968629002571106, -1.6286180019378662, -1.288607120513916, -0.9485960006713867, -0.608585000038147, -0.2685739994049072, 0.07143700122833252, 0.41144800186157227, 0.751459002494812, 1.0914700031280518, 1.431480884552002, 1.7714920043945312, 2.1115031242370605, 2.4515140056610107, 2.791524887084961, 3.1315360069274902, 3.4715471267700195, 3.8115580081939697, 4.15156888961792, 4.491580009460449, 4.8315911293029785, 5.171602249145508, 5.511612892150879, 5.851624011993408, 6.1916351318359375, 6.531645774841309, 6.871656894683838, 7.211668014526367]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 5.0, 6.0, 10.0, 6.0, 12.0, 17.0, 15.0, 20.0, 25.0, 34.0, 32.0, 30.0, 31.0, 47.0, 38.0, 39.0, 39.0, 37.0, 38.0, 43.0, 54.0, 52.0, 40.0, 33.0, 36.0, 34.0, 27.0, 32.0, 26.0, 16.0, 25.0, 22.0, 15.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-6.172049522399902, -5.989982604980469, -5.807915210723877, -5.625848293304443, -5.443780899047852, -5.261713981628418, -5.079646587371826, -4.897579669952393, -4.715512275695801, -4.533445358276367, -4.351377964019775, -4.169311046600342, -3.98724365234375, -3.8051764965057373, -3.6231093406677246, -3.441042423248291, -3.2589752674102783, -3.0769081115722656, -2.894840955734253, -2.7127737998962402, -2.5307066440582275, -2.348639488220215, -2.1665725708007812, -1.984505295753479, -1.8024381399154663, -1.6203709840774536, -1.438303828239441, -1.2562367916107178, -1.074169635772705, -0.8921024203300476, -0.7100353240966797, -0.527968168258667, -0.3459010124206543, -0.1638338714838028, 0.018233269453048706, 0.200300395488739, 0.3823675513267517, 0.5644347071647644, 0.7465018033981323, 0.928568959236145, 1.1106361150741577, 1.2927032709121704, 1.474770426750183, 1.6568374633789062, 1.838904619216919, 2.0209717750549316, 2.2030389308929443, 2.385106086730957, 2.5671732425689697, 2.7492403984069824, 2.931307554244995, 3.113374710083008, 3.2954418659210205, 3.477509021759033, 3.659575939178467, 3.8416433334350586, 4.023710250854492, 4.205777168273926, 4.387844562530518, 4.569911479949951, 4.751978874206543, 4.934045791625977, 5.116113185882568, 5.298180103302002, 5.480247497558594]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 9.0, 2.0, 8.0, 20.0, 23.0, 22.0, 52.0, 84.0, 120.0, 199.0, 318.0, 551.0, 1122.0, 2302.0, 5496.0, 14091.0, 42501.0, 137472.0, 350625.0, 320383.0, 115924.0, 35868.0, 12197.0, 4803.0, 2070.0, 980.0, 534.0, 312.0, 163.0, 99.0, 62.0, 45.0, 28.0, 18.0, 15.0, 12.0, 7.0, 4.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.8828125, -9.599853515625, -9.31689453125, -9.033935546875, -8.7509765625, -8.468017578125, -8.18505859375, -7.902099609375, -7.619140625, -7.336181640625, -7.05322265625, -6.770263671875, -6.4873046875, -6.204345703125, -5.92138671875, -5.638427734375, -5.35546875, -5.072509765625, -4.78955078125, -4.506591796875, -4.2236328125, -3.940673828125, -3.65771484375, -3.374755859375, -3.091796875, -2.808837890625, -2.52587890625, -2.242919921875, -1.9599609375, -1.677001953125, -1.39404296875, -1.111083984375, -0.828125, -0.545166015625, -0.26220703125, 0.020751953125, 0.3037109375, 0.586669921875, 0.86962890625, 1.152587890625, 1.435546875, 1.718505859375, 2.00146484375, 2.284423828125, 2.5673828125, 2.850341796875, 3.13330078125, 3.416259765625, 3.69921875, 3.982177734375, 4.26513671875, 4.548095703125, 4.8310546875, 5.114013671875, 5.39697265625, 5.679931640625, 5.962890625, 6.245849609375, 6.52880859375, 6.811767578125, 7.0947265625, 7.377685546875, 7.66064453125, 7.943603515625, 8.2265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 9.0, 11.0, 9.0, 23.0, 22.0, 14.0, 33.0, 40.0, 27.0, 44.0, 65.0, 43.0, 68.0, 66.0, 68.0, 51.0, 60.0, 64.0, 52.0, 36.0, 43.0, 35.0, 22.0, 22.0, 15.0, 14.0, 5.0, 7.0, 4.0, 9.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.19403076171875, -4.0404052734375, -3.88677978515625, -3.733154296875, -3.57952880859375, -3.4259033203125, -3.27227783203125, -3.11865234375, -2.96502685546875, -2.8114013671875, -2.65777587890625, -2.504150390625, -2.35052490234375, -2.1968994140625, -2.04327392578125, -1.8896484375, -1.73602294921875, -1.5823974609375, -1.42877197265625, -1.275146484375, -1.12152099609375, -0.9678955078125, -0.81427001953125, -0.66064453125, -0.50701904296875, -0.3533935546875, -0.19976806640625, -0.046142578125, 0.10748291015625, 0.2611083984375, 0.41473388671875, 0.568359375, 0.72198486328125, 0.8756103515625, 1.02923583984375, 1.182861328125, 1.33648681640625, 1.4901123046875, 1.64373779296875, 1.79736328125, 1.95098876953125, 2.1046142578125, 2.25823974609375, 2.411865234375, 2.56549072265625, 2.7191162109375, 2.87274169921875, 3.0263671875, 3.17999267578125, 3.3336181640625, 3.48724365234375, 3.640869140625, 3.79449462890625, 3.9481201171875, 4.10174560546875, 4.25537109375, 4.40899658203125, 4.5626220703125, 4.71624755859375, 4.869873046875, 5.02349853515625, 5.1771240234375, 5.33074951171875, 5.484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 14.0, 7.0, 26.0, 27.0, 34.0, 41.0, 78.0, 103.0, 151.0, 262.0, 430.0, 817.0, 1934.0, 6354.0, 32456.0, 329840.0, 599477.0, 61446.0, 9793.0, 2727.0, 1093.0, 548.0, 309.0, 194.0, 135.0, 66.0, 41.0, 42.0, 23.0, 15.0, 14.0, 7.0, 12.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.171875, -17.606689453125, -17.04150390625, -16.476318359375, -15.9111328125, -15.345947265625, -14.78076171875, -14.215576171875, -13.650390625, -13.085205078125, -12.52001953125, -11.954833984375, -11.3896484375, -10.824462890625, -10.25927734375, -9.694091796875, -9.12890625, -8.563720703125, -7.99853515625, -7.433349609375, -6.8681640625, -6.302978515625, -5.73779296875, -5.172607421875, -4.607421875, -4.042236328125, -3.47705078125, -2.911865234375, -2.3466796875, -1.781494140625, -1.21630859375, -0.651123046875, -0.0859375, 0.479248046875, 1.04443359375, 1.609619140625, 2.1748046875, 2.739990234375, 3.30517578125, 3.870361328125, 4.435546875, 5.000732421875, 5.56591796875, 6.131103515625, 6.6962890625, 7.261474609375, 7.82666015625, 8.391845703125, 8.95703125, 9.522216796875, 10.08740234375, 10.652587890625, 11.2177734375, 11.782958984375, 12.34814453125, 12.913330078125, 13.478515625, 14.043701171875, 14.60888671875, 15.174072265625, 15.7392578125, 16.304443359375, 16.86962890625, 17.434814453125, 18.0]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 0.0, 4.0, 4.0, 11.0, 13.0, 11.0, 10.0, 15.0, 21.0, 23.0, 32.0, 38.0, 44.0, 52.0, 40.0, 52.0, 68.0, 50.0, 45.0, 47.0, 54.0, 48.0, 44.0, 42.0, 49.0, 39.0, 24.0, 24.0, 15.0, 18.0, 13.0, 12.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.546875, -22.837890625, -22.12890625, -21.419921875, -20.7109375, -20.001953125, -19.29296875, -18.583984375, -17.875, -17.166015625, -16.45703125, -15.748046875, -15.0390625, -14.330078125, -13.62109375, -12.912109375, -12.203125, -11.494140625, -10.78515625, -10.076171875, -9.3671875, -8.658203125, -7.94921875, -7.240234375, -6.53125, -5.822265625, -5.11328125, -4.404296875, -3.6953125, -2.986328125, -2.27734375, -1.568359375, -0.859375, -0.150390625, 0.55859375, 1.267578125, 1.9765625, 2.685546875, 3.39453125, 4.103515625, 4.8125, 5.521484375, 6.23046875, 6.939453125, 7.6484375, 8.357421875, 9.06640625, 9.775390625, 10.484375, 11.193359375, 11.90234375, 12.611328125, 13.3203125, 14.029296875, 14.73828125, 15.447265625, 16.15625, 16.865234375, 17.57421875, 18.283203125, 18.9921875, 19.701171875, 20.41015625, 21.119140625, 21.828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 16.0, 19.0, 26.0, 42.0, 61.0, 84.0, 139.0, 219.0, 394.0, 867.0, 2085.0, 7024.0, 36330.0, 360686.0, 569389.0, 56799.0, 9660.0, 2576.0, 941.0, 450.0, 262.0, 140.0, 107.0, 76.0, 39.0, 21.0, 16.0, 17.0, 10.0, 11.0, 12.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37890625, -6.13458251953125, -5.8902587890625, -5.64593505859375, -5.401611328125, -5.15728759765625, -4.9129638671875, -4.66864013671875, -4.42431640625, -4.17999267578125, -3.9356689453125, -3.69134521484375, -3.447021484375, -3.20269775390625, -2.9583740234375, -2.71405029296875, -2.4697265625, -2.22540283203125, -1.9810791015625, -1.73675537109375, -1.492431640625, -1.24810791015625, -1.0037841796875, -0.75946044921875, -0.51513671875, -0.27081298828125, -0.0264892578125, 0.21783447265625, 0.462158203125, 0.70648193359375, 0.9508056640625, 1.19512939453125, 1.439453125, 1.68377685546875, 1.9281005859375, 2.17242431640625, 2.416748046875, 2.66107177734375, 2.9053955078125, 3.14971923828125, 3.39404296875, 3.63836669921875, 3.8826904296875, 4.12701416015625, 4.371337890625, 4.61566162109375, 4.8599853515625, 5.10430908203125, 5.3486328125, 5.59295654296875, 5.8372802734375, 6.08160400390625, 6.325927734375, 6.57025146484375, 6.8145751953125, 7.05889892578125, 7.30322265625, 7.54754638671875, 7.7918701171875, 8.03619384765625, 8.280517578125, 8.52484130859375, 8.7691650390625, 9.01348876953125, 9.2578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 9.0, 2.0, 2.0, 7.0, 4.0, 9.0, 8.0, 18.0, 18.0, 21.0, 20.0, 41.0, 42.0, 65.0, 65.0, 84.0, 94.0, 89.0, 82.0, 56.0, 59.0, 50.0, 34.0, 23.0, 27.0, 19.0, 10.0, 16.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007691383361816406, -0.0007465332746505737, -0.0007239282131195068, -0.0007013231515884399, -0.000678718090057373, -0.0006561130285263062, -0.0006335079669952393, -0.0006109029054641724, -0.0005882978439331055, -0.0005656927824020386, -0.0005430877208709717, -0.0005204826593399048, -0.0004978775978088379, -0.000475272536277771, -0.0004526674747467041, -0.0004300624132156372, -0.0004074573516845703, -0.0003848522901535034, -0.0003622472286224365, -0.00033964216709136963, -0.00031703710556030273, -0.00029443204402923584, -0.00027182698249816895, -0.00024922192096710205, -0.00022661685943603516, -0.00020401179790496826, -0.00018140673637390137, -0.00015880167484283447, -0.00013619661331176758, -0.00011359155178070068, -9.098649024963379e-05, -6.83814287185669e-05, -4.57763671875e-05, -2.3171305656433105e-05, -5.662441253662109e-07, 2.2038817405700684e-05, 4.464387893676758e-05, 6.724894046783447e-05, 8.985400199890137e-05, 0.00011245906352996826, 0.00013506412506103516, 0.00015766918659210205, 0.00018027424812316895, 0.00020287930965423584, 0.00022548437118530273, 0.00024808943271636963, 0.0002706944942474365, 0.0002932995557785034, 0.0003159046173095703, 0.0003385096788406372, 0.0003611147403717041, 0.000383719801902771, 0.0004063248634338379, 0.0004289299249649048, 0.0004515349864959717, 0.0004741400480270386, 0.0004967451095581055, 0.0005193501710891724, 0.0005419552326202393, 0.0005645602941513062, 0.000587165355682373, 0.0006097704172134399, 0.0006323754787445068, 0.0006549805402755737, 0.0006775856018066406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 7.0, 10.0, 19.0, 32.0, 40.0, 63.0, 109.0, 211.0, 353.0, 796.0, 1949.0, 6926.0, 47198.0, 645921.0, 313488.0, 24029.0, 4451.0, 1522.0, 661.0, 326.0, 193.0, 97.0, 47.0, 30.0, 22.0, 16.0, 11.0, 7.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4266357421875, -8.134521484375, -7.8424072265625, -7.55029296875, -7.2581787109375, -6.966064453125, -6.6739501953125, -6.3818359375, -6.0897216796875, -5.797607421875, -5.5054931640625, -5.21337890625, -4.9212646484375, -4.629150390625, -4.3370361328125, -4.044921875, -3.7528076171875, -3.460693359375, -3.1685791015625, -2.87646484375, -2.5843505859375, -2.292236328125, -2.0001220703125, -1.7080078125, -1.4158935546875, -1.123779296875, -0.8316650390625, -0.53955078125, -0.2474365234375, 0.044677734375, 0.3367919921875, 0.62890625, 0.9210205078125, 1.213134765625, 1.5052490234375, 1.79736328125, 2.0894775390625, 2.381591796875, 2.6737060546875, 2.9658203125, 3.2579345703125, 3.550048828125, 3.8421630859375, 4.13427734375, 4.4263916015625, 4.718505859375, 5.0106201171875, 5.302734375, 5.5948486328125, 5.886962890625, 6.1790771484375, 6.47119140625, 6.7633056640625, 7.055419921875, 7.3475341796875, 7.6396484375, 7.9317626953125, 8.223876953125, 8.5159912109375, 8.80810546875, 9.1002197265625, 9.392333984375, 9.6844482421875, 9.9765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 7.0, 4.0, 10.0, 10.0, 22.0, 43.0, 28.0, 56.0, 52.0, 105.0, 145.0, 108.0, 87.0, 81.0, 66.0, 46.0, 43.0, 40.0, 15.0, 15.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.50921630859375, -5.2254638671875, -4.94171142578125, -4.657958984375, -4.37420654296875, -4.0904541015625, -3.80670166015625, -3.52294921875, -3.23919677734375, -2.9554443359375, -2.67169189453125, -2.387939453125, -2.10418701171875, -1.8204345703125, -1.53668212890625, -1.2529296875, -0.96917724609375, -0.6854248046875, -0.40167236328125, -0.117919921875, 0.16583251953125, 0.4495849609375, 0.73333740234375, 1.01708984375, 1.30084228515625, 1.5845947265625, 1.86834716796875, 2.152099609375, 2.43585205078125, 2.7196044921875, 3.00335693359375, 3.287109375, 3.57086181640625, 3.8546142578125, 4.13836669921875, 4.422119140625, 4.70587158203125, 4.9896240234375, 5.27337646484375, 5.55712890625, 5.84088134765625, 6.1246337890625, 6.40838623046875, 6.692138671875, 6.97589111328125, 7.2596435546875, 7.54339599609375, 7.8271484375, 8.11090087890625, 8.3946533203125, 8.67840576171875, 8.962158203125, 9.24591064453125, 9.5296630859375, 9.81341552734375, 10.09716796875, 10.38092041015625, 10.6646728515625, 10.94842529296875, 11.232177734375, 11.51593017578125, 11.7996826171875, 12.08343505859375, 12.3671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 9.0, 12.0, 16.0, 28.0, 67.0, 112.0, 137.0, 195.0, 175.0, 112.0, 70.0, 37.0, 15.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.7614517211914, -110.64675903320312, -106.53205871582031, -102.41736602783203, -98.30267333984375, -94.18797302246094, -90.07328033447266, -85.95858764648438, -81.84388732910156, -77.72919464111328, -73.61449432373047, -69.49980163574219, -65.38510131835938, -61.270408630371094, -57.15571594238281, -53.041019439697266, -48.92632293701172, -44.81162643432617, -40.696929931640625, -36.582237243652344, -32.4675407409668, -28.35284423828125, -24.238149642944336, -20.123455047607422, -16.008758544921875, -11.894062995910645, -7.779367446899414, -3.6646718978881836, 0.4500236511230469, 4.564720153808594, 8.679414749145508, 12.794109344482422, 16.9088134765625, 21.023509979248047, 25.13820457458496, 29.252899169921875, 33.36759567260742, 37.48229217529297, 41.59698486328125, 45.7116813659668, 49.826377868652344, 53.94107437133789, 58.05577087402344, 62.17046356201172, 66.28515625, 70.39985656738281, 74.5145492553711, 78.62924194335938, 82.74394226074219, 86.85863494873047, 90.97333526611328, 95.08802795410156, 99.20272827148438, 103.31742095947266, 107.43211364746094, 111.54681396484375, 115.66150665283203, 119.77619934082031, 123.89089965820312, 128.00559997558594, 132.1202850341797, 136.2349853515625, 140.3496856689453, 144.46437072753906, 148.57907104492188]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 8.0, 16.0, 10.0, 22.0, 19.0, 29.0, 37.0, 33.0, 56.0, 49.0, 55.0, 62.0, 62.0, 56.0, 55.0, 56.0, 52.0, 57.0, 41.0, 34.0, 31.0, 37.0, 26.0, 15.0, 11.0, 17.0, 15.0, 12.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.51278686523438, -86.12169647216797, -82.7306137084961, -79.33952331542969, -75.94844055175781, -72.5573501586914, -69.166259765625, -65.77517700195312, -62.38408660888672, -58.99300003051758, -55.60191345214844, -52.21082305908203, -48.81973648071289, -45.42864990234375, -42.037559509277344, -38.6464729309082, -35.25538635253906, -31.864299774169922, -28.47321128845215, -25.082122802734375, -21.691036224365234, -18.299949645996094, -14.90886116027832, -11.517772674560547, -8.126686096191406, -4.735598564147949, -1.3445110321044922, 2.046576499938965, 5.437664031982422, 8.828750610351562, 12.219839096069336, 15.61092758178711, 19.00200653076172, 22.39309310913086, 25.784181594848633, 29.175270080566406, 32.56635665893555, 35.95744323730469, 39.348533630371094, 42.739620208740234, 46.130706787109375, 49.521793365478516, 52.912879943847656, 56.30397033691406, 59.6950569152832, 63.086143493652344, 66.47723388671875, 69.86831665039062, 73.25940704345703, 76.65049743652344, 80.04158020019531, 83.43267059326172, 86.82376098632812, 90.21484375, 93.6059341430664, 96.99702453613281, 100.38810729980469, 103.7791976928711, 107.17028045654297, 110.56137084960938, 113.95245361328125, 117.34354400634766, 120.73463439941406, 124.12571716308594, 127.51680755615234]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 6.0, 3.0, 5.0, 9.0, 17.0, 20.0, 25.0, 53.0, 66.0, 124.0, 190.0, 334.0, 609.0, 1093.0, 2477.0, 6517.0, 37752.0, 4086476.0, 45846.0, 7184.0, 2562.0, 1286.0, 659.0, 381.0, 239.0, 109.0, 75.0, 43.0, 38.0, 15.0, 17.0, 10.0, 5.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.015625, -16.49267578125, -15.9697265625, -15.44677734375, -14.923828125, -14.40087890625, -13.8779296875, -13.35498046875, -12.83203125, -12.30908203125, -11.7861328125, -11.26318359375, -10.740234375, -10.21728515625, -9.6943359375, -9.17138671875, -8.6484375, -8.12548828125, -7.6025390625, -7.07958984375, -6.556640625, -6.03369140625, -5.5107421875, -4.98779296875, -4.46484375, -3.94189453125, -3.4189453125, -2.89599609375, -2.373046875, -1.85009765625, -1.3271484375, -0.80419921875, -0.28125, 0.24169921875, 0.7646484375, 1.28759765625, 1.810546875, 2.33349609375, 2.8564453125, 3.37939453125, 3.90234375, 4.42529296875, 4.9482421875, 5.47119140625, 5.994140625, 6.51708984375, 7.0400390625, 7.56298828125, 8.0859375, 8.60888671875, 9.1318359375, 9.65478515625, 10.177734375, 10.70068359375, 11.2236328125, 11.74658203125, 12.26953125, 12.79248046875, 13.3154296875, 13.83837890625, 14.361328125, 14.88427734375, 15.4072265625, 15.93017578125, 16.453125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 10.0, 18.0, 20.0, 28.0, 37.0, 47.0, 71.0, 53.0, 77.0, 87.0, 91.0, 82.0, 85.0, 71.0, 51.0, 44.0, 27.0, 26.0, 19.0, 16.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.19921875, -5.98809814453125, -5.7769775390625, -5.56585693359375, -5.354736328125, -5.14361572265625, -4.9324951171875, -4.72137451171875, -4.51025390625, -4.29913330078125, -4.0880126953125, -3.87689208984375, -3.665771484375, -3.45465087890625, -3.2435302734375, -3.03240966796875, -2.8212890625, -2.61016845703125, -2.3990478515625, -2.18792724609375, -1.976806640625, -1.76568603515625, -1.5545654296875, -1.34344482421875, -1.13232421875, -0.92120361328125, -0.7100830078125, -0.49896240234375, -0.287841796875, -0.07672119140625, 0.1343994140625, 0.34552001953125, 0.556640625, 0.76776123046875, 0.9788818359375, 1.19000244140625, 1.401123046875, 1.61224365234375, 1.8233642578125, 2.03448486328125, 2.24560546875, 2.45672607421875, 2.6678466796875, 2.87896728515625, 3.090087890625, 3.30120849609375, 3.5123291015625, 3.72344970703125, 3.9345703125, 4.14569091796875, 4.3568115234375, 4.56793212890625, 4.779052734375, 4.99017333984375, 5.2012939453125, 5.41241455078125, 5.62353515625, 5.83465576171875, 6.0457763671875, 6.25689697265625, 6.468017578125, 6.67913818359375, 6.8902587890625, 7.10137939453125, 7.3125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 11.0, 14.0, 15.0, 16.0, 17.0, 34.0, 65.0, 70.0, 86.0, 103.0, 153.0, 227.0, 398.0, 659.0, 1306.0, 2731.0, 6864.0, 23453.0, 269150.0, 3837775.0, 35103.0, 9026.0, 3352.0, 1548.0, 765.0, 455.0, 281.0, 171.0, 86.0, 93.0, 45.0, 41.0, 31.0, 27.0, 14.0, 20.0, 17.0, 12.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -9.0074462890625, -8.718017578125, -8.4285888671875, -8.13916015625, -7.8497314453125, -7.560302734375, -7.2708740234375, -6.9814453125, -6.6920166015625, -6.402587890625, -6.1131591796875, -5.82373046875, -5.5343017578125, -5.244873046875, -4.9554443359375, -4.666015625, -4.3765869140625, -4.087158203125, -3.7977294921875, -3.50830078125, -3.2188720703125, -2.929443359375, -2.6400146484375, -2.3505859375, -2.0611572265625, -1.771728515625, -1.4822998046875, -1.19287109375, -0.9034423828125, -0.614013671875, -0.3245849609375, -0.03515625, 0.2542724609375, 0.543701171875, 0.8331298828125, 1.12255859375, 1.4119873046875, 1.701416015625, 1.9908447265625, 2.2802734375, 2.5697021484375, 2.859130859375, 3.1485595703125, 3.43798828125, 3.7274169921875, 4.016845703125, 4.3062744140625, 4.595703125, 4.8851318359375, 5.174560546875, 5.4639892578125, 5.75341796875, 6.0428466796875, 6.332275390625, 6.6217041015625, 6.9111328125, 7.2005615234375, 7.489990234375, 7.7794189453125, 8.06884765625, 8.3582763671875, 8.647705078125, 8.9371337890625, 9.2265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 35.0, 70.0, 315.0, 3401.0, 117.0, 39.0, 17.0, 11.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.25, -4.1538543701171875, -4.057708740234375, -3.9615631103515625, -3.86541748046875, -3.7692718505859375, -3.673126220703125, -3.5769805908203125, -3.4808349609375, -3.3846893310546875, -3.288543701171875, -3.1923980712890625, -3.09625244140625, -3.0001068115234375, -2.903961181640625, -2.8078155517578125, -2.711669921875, -2.6155242919921875, -2.519378662109375, -2.4232330322265625, -2.32708740234375, -2.2309417724609375, -2.134796142578125, -2.0386505126953125, -1.9425048828125, -1.8463592529296875, -1.750213623046875, -1.6540679931640625, -1.55792236328125, -1.4617767333984375, -1.365631103515625, -1.2694854736328125, -1.17333984375, -1.0771942138671875, -0.981048583984375, -0.8849029541015625, -0.78875732421875, -0.6926116943359375, -0.596466064453125, -0.5003204345703125, -0.4041748046875, -0.3080291748046875, -0.211883544921875, -0.1157379150390625, -0.01959228515625, 0.0765533447265625, 0.172698974609375, 0.2688446044921875, 0.364990234375, 0.4611358642578125, 0.557281494140625, 0.6534271240234375, 0.74957275390625, 0.8457183837890625, 0.941864013671875, 1.0380096435546875, 1.1341552734375, 1.2303009033203125, 1.326446533203125, 1.4225921630859375, 1.51873779296875, 1.6148834228515625, 1.711029052734375, 1.8071746826171875, 1.9033203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 10.0, 10.0, 33.0, 82.0, 223.0, 318.0, 219.0, 79.0, 24.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.883522033691406, -22.259910583496094, -21.636301040649414, -21.0126895904541, -20.389080047607422, -19.76546859741211, -19.141857147216797, -18.518245697021484, -17.894636154174805, -17.271024703979492, -16.647415161132812, -16.0238037109375, -15.400193214416504, -14.776582717895508, -14.152971267700195, -13.5293607711792, -12.905750274658203, -12.282139778137207, -11.658529281616211, -11.034917831420898, -10.411307334899902, -9.787696838378906, -9.164085388183594, -8.540474891662598, -7.916864395141602, -7.2932538986206055, -6.669642925262451, -6.046031951904297, -5.422421455383301, -4.798810958862305, -4.17519998550415, -3.551589012145996, -2.927980422973633, -2.3043696880340576, -1.6807589530944824, -1.0571482181549072, -0.43353748321533203, 0.19007325172424316, 0.8136839866638184, 1.4372949600219727, 2.0609054565429688, 2.684516191482544, 3.308126926422119, 3.9317376613616943, 4.5553483963012695, 5.178958892822266, 5.80256986618042, 6.426180839538574, 7.04979133605957, 7.673401832580566, 8.297012329101562, 8.920623779296875, 9.544234275817871, 10.167844772338867, 10.79145622253418, 11.415066719055176, 12.038677215576172, 12.662287712097168, 13.285898208618164, 13.909509658813477, 14.533120155334473, 15.156730651855469, 15.780342102050781, 16.403953552246094, 17.027563095092773]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 3.0, 3.0, 4.0, 13.0, 7.0, 18.0, 10.0, 25.0, 24.0, 24.0, 22.0, 36.0, 37.0, 34.0, 46.0, 36.0, 41.0, 36.0, 42.0, 52.0, 41.0, 62.0, 41.0, 37.0, 37.0, 38.0, 36.0, 30.0, 34.0, 17.0, 21.0, 18.0, 17.0, 16.0, 11.0, 7.0, 4.0, 8.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.021036624908447, -3.8739583492279053, -3.7268800735473633, -3.579801559448242, -3.4327232837677, -3.285645008087158, -3.138566493988037, -2.991488218307495, -2.844409942626953, -2.697331666946411, -2.550253391265869, -2.403174877166748, -2.256096601486206, -2.109018325805664, -1.9619399309158325, -1.814861536026001, -1.667783260345459, -1.520704984664917, -1.3736265897750854, -1.226548194885254, -1.079469919204712, -0.9323915839195251, -0.7853132486343384, -0.6382348537445068, -0.49115657806396484, -0.3440782427787781, -0.1969999074935913, -0.04992157220840454, 0.09715676307678223, 0.244235098361969, 0.39131343364715576, 0.5383918285369873, 0.6854705810546875, 0.8325489163398743, 0.979627251625061, 1.1267056465148926, 1.2737839221954346, 1.4208621978759766, 1.567940592765808, 1.7150189876556396, 1.8620972633361816, 2.0091755390167236, 2.1562538146972656, 2.3033323287963867, 2.4504106044769287, 2.5974888801574707, 2.744567394256592, 2.891645669937134, 3.038723945617676, 3.1858022212982178, 3.3328804969787598, 3.479959011077881, 3.627037286758423, 3.774115562438965, 3.921194076538086, 4.068272590637207, 4.21535062789917, 4.362429141998291, 4.509507179260254, 4.656585693359375, 4.803664207458496, 4.950742244720459, 5.09782075881958, 5.244898796081543, 5.391977310180664]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 16.0, 14.0, 28.0, 29.0, 54.0, 72.0, 92.0, 151.0, 250.0, 377.0, 597.0, 1142.0, 2220.0, 4626.0, 11217.0, 29046.0, 79691.0, 210233.0, 361957.0, 214159.0, 81480.0, 29635.0, 11487.0, 4947.0, 2162.0, 1171.0, 646.0, 408.0, 211.0, 139.0, 101.0, 54.0, 50.0, 30.0, 20.0, 17.0, 5.0, 7.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6328125, -8.38970947265625, -8.1466064453125, -7.90350341796875, -7.660400390625, -7.41729736328125, -7.1741943359375, -6.93109130859375, -6.68798828125, -6.44488525390625, -6.2017822265625, -5.95867919921875, -5.715576171875, -5.47247314453125, -5.2293701171875, -4.98626708984375, -4.7431640625, -4.50006103515625, -4.2569580078125, -4.01385498046875, -3.770751953125, -3.52764892578125, -3.2845458984375, -3.04144287109375, -2.79833984375, -2.55523681640625, -2.3121337890625, -2.06903076171875, -1.825927734375, -1.58282470703125, -1.3397216796875, -1.09661865234375, -0.853515625, -0.61041259765625, -0.3673095703125, -0.12420654296875, 0.118896484375, 0.36199951171875, 0.6051025390625, 0.84820556640625, 1.09130859375, 1.33441162109375, 1.5775146484375, 1.82061767578125, 2.063720703125, 2.30682373046875, 2.5499267578125, 2.79302978515625, 3.0361328125, 3.27923583984375, 3.5223388671875, 3.76544189453125, 4.008544921875, 4.25164794921875, 4.4947509765625, 4.73785400390625, 4.98095703125, 5.22406005859375, 5.4671630859375, 5.71026611328125, 5.953369140625, 6.19647216796875, 6.4395751953125, 6.68267822265625, 6.92578125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 22.0, 29.0, 35.0, 45.0, 58.0, 68.0, 74.0, 83.0, 78.0, 80.0, 83.0, 77.0, 55.0, 35.0, 40.0, 26.0, 22.0, 15.0, 12.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0703125, -5.865234375, -5.66015625, -5.455078125, -5.25, -5.044921875, -4.83984375, -4.634765625, -4.4296875, -4.224609375, -4.01953125, -3.814453125, -3.609375, -3.404296875, -3.19921875, -2.994140625, -2.7890625, -2.583984375, -2.37890625, -2.173828125, -1.96875, -1.763671875, -1.55859375, -1.353515625, -1.1484375, -0.943359375, -0.73828125, -0.533203125, -0.328125, -0.123046875, 0.08203125, 0.287109375, 0.4921875, 0.697265625, 0.90234375, 1.107421875, 1.3125, 1.517578125, 1.72265625, 1.927734375, 2.1328125, 2.337890625, 2.54296875, 2.748046875, 2.953125, 3.158203125, 3.36328125, 3.568359375, 3.7734375, 3.978515625, 4.18359375, 4.388671875, 4.59375, 4.798828125, 5.00390625, 5.208984375, 5.4140625, 5.619140625, 5.82421875, 6.029296875, 6.234375, 6.439453125, 6.64453125, 6.849609375, 7.0546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 8.0, 12.0, 22.0, 30.0, 38.0, 48.0, 67.0, 135.0, 218.0, 445.0, 912.0, 2221.0, 7376.0, 43567.0, 653606.0, 307906.0, 23694.0, 4955.0, 1741.0, 714.0, 378.0, 178.0, 101.0, 56.0, 32.0, 29.0, 15.0, 14.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.67578125, -16.9921875, -16.30859375, -15.625, -14.94140625, -14.2578125, -13.57421875, -12.890625, -12.20703125, -11.5234375, -10.83984375, -10.15625, -9.47265625, -8.7890625, -8.10546875, -7.421875, -6.73828125, -6.0546875, -5.37109375, -4.6875, -4.00390625, -3.3203125, -2.63671875, -1.953125, -1.26953125, -0.5859375, 0.09765625, 0.78125, 1.46484375, 2.1484375, 2.83203125, 3.515625, 4.19921875, 4.8828125, 5.56640625, 6.25, 6.93359375, 7.6171875, 8.30078125, 8.984375, 9.66796875, 10.3515625, 11.03515625, 11.71875, 12.40234375, 13.0859375, 13.76953125, 14.453125, 15.13671875, 15.8203125, 16.50390625, 17.1875, 17.87109375, 18.5546875, 19.23828125, 19.921875, 20.60546875, 21.2890625, 21.97265625, 22.65625, 23.33984375, 24.0234375, 24.70703125, 25.390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 8.0, 12.0, 23.0, 28.0, 28.0, 49.0, 74.0, 68.0, 100.0, 98.0, 108.0, 81.0, 79.0, 65.0, 48.0, 34.0, 26.0, 20.0, 10.0, 8.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-51.96875, -50.675537109375, -49.38232421875, -48.089111328125, -46.7958984375, -45.502685546875, -44.20947265625, -42.916259765625, -41.623046875, -40.329833984375, -39.03662109375, -37.743408203125, -36.4501953125, -35.156982421875, -33.86376953125, -32.570556640625, -31.27734375, -29.984130859375, -28.69091796875, -27.397705078125, -26.1044921875, -24.811279296875, -23.51806640625, -22.224853515625, -20.931640625, -19.638427734375, -18.34521484375, -17.052001953125, -15.7587890625, -14.465576171875, -13.17236328125, -11.879150390625, -10.5859375, -9.292724609375, -7.99951171875, -6.706298828125, -5.4130859375, -4.119873046875, -2.82666015625, -1.533447265625, -0.240234375, 1.052978515625, 2.34619140625, 3.639404296875, 4.9326171875, 6.225830078125, 7.51904296875, 8.812255859375, 10.10546875, 11.398681640625, 12.69189453125, 13.985107421875, 15.2783203125, 16.571533203125, 17.86474609375, 19.157958984375, 20.451171875, 21.744384765625, 23.03759765625, 24.330810546875, 25.6240234375, 26.917236328125, 28.21044921875, 29.503662109375, 30.796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 9.0, 2.0, 9.0, 11.0, 22.0, 15.0, 38.0, 55.0, 76.0, 130.0, 228.0, 432.0, 1830.0, 24702.0, 974281.0, 43260.0, 2230.0, 558.0, 265.0, 126.0, 77.0, 55.0, 42.0, 29.0, 19.0, 14.0, 8.0, 6.0, 5.0, 5.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.953125, -16.338134765625, -15.72314453125, -15.108154296875, -14.4931640625, -13.878173828125, -13.26318359375, -12.648193359375, -12.033203125, -11.418212890625, -10.80322265625, -10.188232421875, -9.5732421875, -8.958251953125, -8.34326171875, -7.728271484375, -7.11328125, -6.498291015625, -5.88330078125, -5.268310546875, -4.6533203125, -4.038330078125, -3.42333984375, -2.808349609375, -2.193359375, -1.578369140625, -0.96337890625, -0.348388671875, 0.2666015625, 0.881591796875, 1.49658203125, 2.111572265625, 2.7265625, 3.341552734375, 3.95654296875, 4.571533203125, 5.1865234375, 5.801513671875, 6.41650390625, 7.031494140625, 7.646484375, 8.261474609375, 8.87646484375, 9.491455078125, 10.1064453125, 10.721435546875, 11.33642578125, 11.951416015625, 12.56640625, 13.181396484375, 13.79638671875, 14.411376953125, 15.0263671875, 15.641357421875, 16.25634765625, 16.871337890625, 17.486328125, 18.101318359375, 18.71630859375, 19.331298828125, 19.9462890625, 20.561279296875, 21.17626953125, 21.791259765625, 22.40625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 7.0, 11.0, 14.0, 12.0, 21.0, 17.0, 19.0, 28.0, 33.0, 52.0, 67.0, 86.0, 82.0, 113.0, 82.0, 77.0, 53.0, 48.0, 37.0, 23.0, 26.0, 16.0, 12.0, 12.0, 9.0, 9.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005483627319335938, -0.0005267709493637085, -0.0005051791667938232, -0.000483587384223938, -0.00046199560165405273, -0.0004404038190841675, -0.0004188120365142822, -0.00039722025394439697, -0.0003756284713745117, -0.00035403668880462646, -0.0003324449062347412, -0.00031085312366485596, -0.0002892613410949707, -0.00026766955852508545, -0.0002460777759552002, -0.00022448599338531494, -0.0002028942108154297, -0.00018130242824554443, -0.00015971064567565918, -0.00013811886310577393, -0.00011652708053588867, -9.493529796600342e-05, -7.334351539611816e-05, -5.175173282623291e-05, -3.0159950256347656e-05, -8.568167686462402e-06, 1.3023614883422852e-05, 3.4615397453308105e-05, 5.620718002319336e-05, 7.779896259307861e-05, 9.939074516296387e-05, 0.00012098252773284912, 0.00014257431030273438, 0.00016416609287261963, 0.00018575787544250488, 0.00020734965801239014, 0.0002289414405822754, 0.00025053322315216064, 0.0002721250057220459, 0.00029371678829193115, 0.0003153085708618164, 0.00033690035343170166, 0.0003584921360015869, 0.00038008391857147217, 0.0004016757011413574, 0.0004232674837112427, 0.00044485926628112793, 0.0004664510488510132, 0.00048804283142089844, 0.0005096346139907837, 0.0005312263965606689, 0.0005528181791305542, 0.0005744099617004395, 0.0005960017442703247, 0.00061759352684021, 0.0006391853094100952, 0.0006607770919799805, 0.0006823688745498657, 0.000703960657119751, 0.0007255524396896362, 0.0007471442222595215, 0.0007687360048294067, 0.000790327787399292, 0.0008119195699691772, 0.0008335113525390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 7.0, 5.0, 4.0, 9.0, 19.0, 14.0, 27.0, 18.0, 44.0, 87.0, 86.0, 173.0, 294.0, 523.0, 1257.0, 3528.0, 14757.0, 173007.0, 795289.0, 48246.0, 7185.0, 2128.0, 847.0, 384.0, 220.0, 129.0, 79.0, 60.0, 37.0, 27.0, 22.0, 11.0, 4.0, 11.0, 5.0, 0.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7303466796875, -11.366943359375, -11.0035400390625, -10.64013671875, -10.2767333984375, -9.913330078125, -9.5499267578125, -9.1865234375, -8.8231201171875, -8.459716796875, -8.0963134765625, -7.73291015625, -7.3695068359375, -7.006103515625, -6.6427001953125, -6.279296875, -5.9158935546875, -5.552490234375, -5.1890869140625, -4.82568359375, -4.4622802734375, -4.098876953125, -3.7354736328125, -3.3720703125, -3.0086669921875, -2.645263671875, -2.2818603515625, -1.91845703125, -1.5550537109375, -1.191650390625, -0.8282470703125, -0.46484375, -0.1014404296875, 0.261962890625, 0.6253662109375, 0.98876953125, 1.3521728515625, 1.715576171875, 2.0789794921875, 2.4423828125, 2.8057861328125, 3.169189453125, 3.5325927734375, 3.89599609375, 4.2593994140625, 4.622802734375, 4.9862060546875, 5.349609375, 5.7130126953125, 6.076416015625, 6.4398193359375, 6.80322265625, 7.1666259765625, 7.530029296875, 7.8934326171875, 8.2568359375, 8.6202392578125, 8.983642578125, 9.3470458984375, 9.71044921875, 10.0738525390625, 10.437255859375, 10.8006591796875, 11.1640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 18.0, 27.0, 51.0, 66.0, 113.0, 157.0, 163.0, 137.0, 74.0, 65.0, 33.0, 21.0, 11.0, 10.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.4342041015625, -13.016845703125, -12.5994873046875, -12.18212890625, -11.7647705078125, -11.347412109375, -10.9300537109375, -10.5126953125, -10.0953369140625, -9.677978515625, -9.2606201171875, -8.84326171875, -8.4259033203125, -8.008544921875, -7.5911865234375, -7.173828125, -6.7564697265625, -6.339111328125, -5.9217529296875, -5.50439453125, -5.0870361328125, -4.669677734375, -4.2523193359375, -3.8349609375, -3.4176025390625, -3.000244140625, -2.5828857421875, -2.16552734375, -1.7481689453125, -1.330810546875, -0.9134521484375, -0.49609375, -0.0787353515625, 0.338623046875, 0.7559814453125, 1.17333984375, 1.5906982421875, 2.008056640625, 2.4254150390625, 2.8427734375, 3.2601318359375, 3.677490234375, 4.0948486328125, 4.51220703125, 4.9295654296875, 5.346923828125, 5.7642822265625, 6.181640625, 6.5989990234375, 7.016357421875, 7.4337158203125, 7.85107421875, 8.2684326171875, 8.685791015625, 9.1031494140625, 9.5205078125, 9.9378662109375, 10.355224609375, 10.7725830078125, 11.18994140625, 11.6072998046875, 12.024658203125, 12.4420166015625, 12.859375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 19.0, 59.0, 191.0, 328.0, 256.0, 100.0, 27.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.9911651611328, -237.0405731201172, -229.08998107910156, -221.13938903808594, -213.18881225585938, -205.23822021484375, -197.28762817382812, -189.3370361328125, -181.38644409179688, -173.43585205078125, -165.48526000976562, -157.53466796875, -149.58407592773438, -141.63348388671875, -133.6829071044922, -125.73231506347656, -117.78172302246094, -109.83113098144531, -101.88053894042969, -93.9299545288086, -85.97936248779297, -78.02877044677734, -70.07818603515625, -62.127593994140625, -54.177001953125, -46.226409912109375, -38.275821685791016, -30.325231552124023, -22.37464141845703, -14.424049377441406, -6.473461151123047, 1.4771270751953125, 9.427734375, 17.378324508666992, 25.328914642333984, 33.279502868652344, 41.23009490966797, 49.180686950683594, 57.13127517700195, 65.08186340332031, 73.03245544433594, 80.98304748535156, 88.93363952636719, 96.88422393798828, 104.8348159790039, 112.78540802001953, 120.73599243164062, 128.68658447265625, 136.63717651367188, 144.5877685546875, 152.53836059570312, 160.48895263671875, 168.43954467773438, 176.39013671875, 184.34071350097656, 192.2913055419922, 200.2418975830078, 208.19248962402344, 216.14308166503906, 224.0936737060547, 232.04425048828125, 239.99484252929688, 247.9454345703125, 255.89602661132812, 263.84661865234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 7.0, 17.0, 13.0, 24.0, 17.0, 19.0, 29.0, 37.0, 41.0, 45.0, 37.0, 47.0, 52.0, 49.0, 50.0, 47.0, 56.0, 61.0, 34.0, 46.0, 37.0, 34.0, 37.0, 23.0, 20.0, 14.0, 16.0, 15.0, 11.0, 6.0, 10.0, 7.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-94.42808532714844, -91.4889907836914, -88.54989624023438, -85.61080169677734, -82.67170715332031, -79.73260498046875, -76.79351043701172, -73.85441589355469, -70.91532135009766, -67.97622680664062, -65.0371322631836, -62.0980339050293, -59.158939361572266, -56.219844818115234, -53.28074645996094, -50.341651916503906, -47.402557373046875, -44.463462829589844, -41.52436828613281, -38.585269927978516, -35.646175384521484, -32.70708084106445, -29.76798439025879, -26.828887939453125, -23.889793395996094, -20.950698852539062, -18.0116024017334, -15.07250690460205, -12.133411407470703, -9.194315910339355, -6.255220413208008, -3.3161239624023438, -0.3770294189453125, 2.562066078186035, 5.501161575317383, 8.44025707244873, 11.379352569580078, 14.318448066711426, 17.257543563842773, 20.196640014648438, 23.13573455810547, 26.0748291015625, 29.013925552368164, 31.953022003173828, 34.89211654663086, 37.83121109008789, 40.77030944824219, 43.70940399169922, 46.64849853515625, 49.58759307861328, 52.52668762207031, 55.46578598022461, 58.40488052368164, 61.34397506713867, 64.28307342529297, 67.22216796875, 70.16126251220703, 73.10035705566406, 76.0394515991211, 78.97854614257812, 81.91764831542969, 84.85674285888672, 87.79583740234375, 90.73493194580078, 93.67402648925781]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 1.0, 3.0, 7.0, 6.0, 15.0, 13.0, 15.0, 26.0, 36.0, 67.0, 98.0, 175.0, 292.0, 593.0, 1375.0, 3573.0, 11886.0, 79870.0, 4018553.0, 61583.0, 10422.0, 3129.0, 1254.0, 547.0, 292.0, 160.0, 108.0, 60.0, 33.0, 34.0, 14.0, 14.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.2109375, -14.7694091796875, -14.327880859375, -13.8863525390625, -13.44482421875, -13.0032958984375, -12.561767578125, -12.1202392578125, -11.6787109375, -11.2371826171875, -10.795654296875, -10.3541259765625, -9.91259765625, -9.4710693359375, -9.029541015625, -8.5880126953125, -8.146484375, -7.7049560546875, -7.263427734375, -6.8218994140625, -6.38037109375, -5.9388427734375, -5.497314453125, -5.0557861328125, -4.6142578125, -4.1727294921875, -3.731201171875, -3.2896728515625, -2.84814453125, -2.4066162109375, -1.965087890625, -1.5235595703125, -1.08203125, -0.6405029296875, -0.198974609375, 0.2425537109375, 0.68408203125, 1.1256103515625, 1.567138671875, 2.0086669921875, 2.4501953125, 2.8917236328125, 3.333251953125, 3.7747802734375, 4.21630859375, 4.6578369140625, 5.099365234375, 5.5408935546875, 5.982421875, 6.4239501953125, 6.865478515625, 7.3070068359375, 7.74853515625, 8.1900634765625, 8.631591796875, 9.0731201171875, 9.5146484375, 9.9561767578125, 10.397705078125, 10.8392333984375, 11.28076171875, 11.7222900390625, 12.163818359375, 12.6053466796875, 13.046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 5.0, 2.0, 9.0, 8.0, 16.0, 21.0, 18.0, 26.0, 35.0, 36.0, 50.0, 49.0, 63.0, 54.0, 55.0, 77.0, 71.0, 55.0, 53.0, 58.0, 39.0, 32.0, 27.0, 28.0, 20.0, 17.0, 18.0, 12.0, 14.0, 4.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.8125, -5.65374755859375, -5.4949951171875, -5.33624267578125, -5.177490234375, -5.01873779296875, -4.8599853515625, -4.70123291015625, -4.54248046875, -4.38372802734375, -4.2249755859375, -4.06622314453125, -3.907470703125, -3.74871826171875, -3.5899658203125, -3.43121337890625, -3.2724609375, -3.11370849609375, -2.9549560546875, -2.79620361328125, -2.637451171875, -2.47869873046875, -2.3199462890625, -2.16119384765625, -2.00244140625, -1.84368896484375, -1.6849365234375, -1.52618408203125, -1.367431640625, -1.20867919921875, -1.0499267578125, -0.89117431640625, -0.732421875, -0.57366943359375, -0.4149169921875, -0.25616455078125, -0.097412109375, 0.06134033203125, 0.2200927734375, 0.37884521484375, 0.53759765625, 0.69635009765625, 0.8551025390625, 1.01385498046875, 1.172607421875, 1.33135986328125, 1.4901123046875, 1.64886474609375, 1.8076171875, 1.96636962890625, 2.1251220703125, 2.28387451171875, 2.442626953125, 2.60137939453125, 2.7601318359375, 2.91888427734375, 3.07763671875, 3.23638916015625, 3.3951416015625, 3.55389404296875, 3.712646484375, 3.87139892578125, 4.0301513671875, 4.18890380859375, 4.34765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 10.0, 12.0, 17.0, 20.0, 33.0, 33.0, 60.0, 62.0, 93.0, 202.0, 367.0, 783.0, 2229.0, 8827.0, 67194.0, 4027341.0, 73662.0, 9338.0, 2286.0, 755.0, 365.0, 199.0, 121.0, 73.0, 54.0, 38.0, 34.0, 24.0, 9.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75, -15.265625, -14.78125, -14.296875, -13.8125, -13.328125, -12.84375, -12.359375, -11.875, -11.390625, -10.90625, -10.421875, -9.9375, -9.453125, -8.96875, -8.484375, -8.0, -7.515625, -7.03125, -6.546875, -6.0625, -5.578125, -5.09375, -4.609375, -4.125, -3.640625, -3.15625, -2.671875, -2.1875, -1.703125, -1.21875, -0.734375, -0.25, 0.234375, 0.71875, 1.203125, 1.6875, 2.171875, 2.65625, 3.140625, 3.625, 4.109375, 4.59375, 5.078125, 5.5625, 6.046875, 6.53125, 7.015625, 7.5, 7.984375, 8.46875, 8.953125, 9.4375, 9.921875, 10.40625, 10.890625, 11.375, 11.859375, 12.34375, 12.828125, 13.3125, 13.796875, 14.28125, 14.765625, 15.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 9.0, 2.0, 6.0, 4.0, 24.0, 22.0, 32.0, 53.0, 88.0, 267.0, 3013.0, 322.0, 97.0, 49.0, 29.0, 16.0, 10.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.48455810546875, -3.3363037109375, -3.18804931640625, -3.039794921875, -2.89154052734375, -2.7432861328125, -2.59503173828125, -2.44677734375, -2.29852294921875, -2.1502685546875, -2.00201416015625, -1.853759765625, -1.70550537109375, -1.5572509765625, -1.40899658203125, -1.2607421875, -1.11248779296875, -0.9642333984375, -0.81597900390625, -0.667724609375, -0.51947021484375, -0.3712158203125, -0.22296142578125, -0.07470703125, 0.07354736328125, 0.2218017578125, 0.37005615234375, 0.518310546875, 0.66656494140625, 0.8148193359375, 0.96307373046875, 1.111328125, 1.25958251953125, 1.4078369140625, 1.55609130859375, 1.704345703125, 1.85260009765625, 2.0008544921875, 2.14910888671875, 2.29736328125, 2.44561767578125, 2.5938720703125, 2.74212646484375, 2.890380859375, 3.03863525390625, 3.1868896484375, 3.33514404296875, 3.4833984375, 3.63165283203125, 3.7799072265625, 3.92816162109375, 4.076416015625, 4.22467041015625, 4.3729248046875, 4.52117919921875, 4.66943359375, 4.81768798828125, 4.9659423828125, 5.11419677734375, 5.262451171875, 5.41070556640625, 5.5589599609375, 5.70721435546875, 5.85546875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 0.0, 4.0, 5.0, 4.0, 16.0, 27.0, 54.0, 107.0, 154.0, 228.0, 217.0, 101.0, 37.0, 25.0, 7.0, 7.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.6118049621582, -45.63412857055664, -44.65645217895508, -43.67877197265625, -42.70109558105469, -41.723419189453125, -40.74574279785156, -39.76806640625, -38.79039001464844, -37.812713623046875, -36.83503723144531, -35.857357025146484, -34.87968063354492, -33.90200424194336, -32.9243278503418, -31.946651458740234, -30.968971252441406, -29.991294860839844, -29.01361656188965, -28.035940170288086, -27.05826187133789, -26.080585479736328, -25.102909088134766, -24.125232696533203, -23.147554397583008, -22.169878005981445, -21.19219970703125, -20.214523315429688, -19.236846923828125, -18.25916862487793, -17.281492233276367, -16.303813934326172, -15.326135635375977, -14.348458290100098, -13.370780944824219, -12.393104553222656, -11.415427207946777, -10.437749862670898, -9.460073471069336, -8.482396125793457, -7.504718780517578, -6.527041435241699, -5.5493645668029785, -4.571687698364258, -3.594010353088379, -2.6163330078125, -1.6386561393737793, -0.6609792709350586, 0.3166980743408203, 1.2943751811981201, 2.27205228805542, 3.2497293949127197, 4.2274065017700195, 5.205083847045898, 6.182760715484619, 7.16043758392334, 8.138114929199219, 9.115792274475098, 10.093469619750977, 11.071146011352539, 12.048823356628418, 13.026500701904297, 14.00417709350586, 14.981854438781738, 15.959531784057617]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 2.0, 6.0, 7.0, 9.0, 17.0, 16.0, 16.0, 33.0, 34.0, 36.0, 32.0, 44.0, 46.0, 40.0, 56.0, 59.0, 52.0, 55.0, 70.0, 50.0, 52.0, 39.0, 36.0, 24.0, 20.0, 21.0, 30.0, 19.0, 19.0, 14.0, 12.0, 15.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.946131706237793, -11.558565139770508, -11.170998573303223, -10.783432006835938, -10.395864486694336, -10.00829792022705, -9.620731353759766, -9.23316478729248, -8.845598220825195, -8.45803165435791, -8.070465087890625, -7.682898044586182, -7.2953314781188965, -6.907764911651611, -6.520197868347168, -6.132631301879883, -5.745064735412598, -5.3574981689453125, -4.969931602478027, -4.582364559173584, -4.194797992706299, -3.8072314262390137, -3.4196646213531494, -3.032097816467285, -2.64453125, -2.256964683532715, -1.8693978786468506, -1.4818311929702759, -1.0942645072937012, -0.7066978216171265, -0.31913113594055176, 0.0684356689453125, 0.45600318908691406, 0.8435698747634888, 1.2311365604400635, 1.6187032461166382, 2.006269931793213, 2.393836498260498, 2.7814033031463623, 3.1689701080322266, 3.5565366744995117, 3.944103240966797, 4.331669807434082, 4.719236850738525, 5.1068034172058105, 5.494369983673096, 5.881937026977539, 6.269503593444824, 6.657070159912109, 7.0446367263793945, 7.43220329284668, 7.819770336151123, 8.20733642578125, 8.594903945922852, 8.982470512390137, 9.370037078857422, 9.757603645324707, 10.145170211791992, 10.532736778259277, 10.920303344726562, 11.307870864868164, 11.69543743133545, 12.083003997802734, 12.47057056427002, 12.858137130737305]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 10.0, 11.0, 21.0, 23.0, 37.0, 57.0, 86.0, 143.0, 225.0, 361.0, 678.0, 1168.0, 2266.0, 4855.0, 12021.0, 34268.0, 117668.0, 382264.0, 343505.0, 99752.0, 29467.0, 10554.0, 4397.0, 2107.0, 1050.0, 572.0, 336.0, 205.0, 135.0, 85.0, 59.0, 35.0, 33.0, 23.0, 17.0, 12.0, 11.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.863037109375, -9.55419921875, -9.245361328125, -8.9365234375, -8.627685546875, -8.31884765625, -8.010009765625, -7.701171875, -7.392333984375, -7.08349609375, -6.774658203125, -6.4658203125, -6.156982421875, -5.84814453125, -5.539306640625, -5.23046875, -4.921630859375, -4.61279296875, -4.303955078125, -3.9951171875, -3.686279296875, -3.37744140625, -3.068603515625, -2.759765625, -2.450927734375, -2.14208984375, -1.833251953125, -1.5244140625, -1.215576171875, -0.90673828125, -0.597900390625, -0.2890625, 0.019775390625, 0.32861328125, 0.637451171875, 0.9462890625, 1.255126953125, 1.56396484375, 1.872802734375, 2.181640625, 2.490478515625, 2.79931640625, 3.108154296875, 3.4169921875, 3.725830078125, 4.03466796875, 4.343505859375, 4.65234375, 4.961181640625, 5.27001953125, 5.578857421875, 5.8876953125, 6.196533203125, 6.50537109375, 6.814208984375, 7.123046875, 7.431884765625, 7.74072265625, 8.049560546875, 8.3583984375, 8.667236328125, 8.97607421875, 9.284912109375, 9.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 7.0, 14.0, 22.0, 17.0, 20.0, 33.0, 34.0, 46.0, 44.0, 55.0, 45.0, 74.0, 72.0, 68.0, 58.0, 57.0, 44.0, 34.0, 39.0, 41.0, 28.0, 23.0, 24.0, 20.0, 17.0, 9.0, 11.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.12188720703125, -4.9625244140625, -4.80316162109375, -4.643798828125, -4.48443603515625, -4.3250732421875, -4.16571044921875, -4.00634765625, -3.84698486328125, -3.6876220703125, -3.52825927734375, -3.368896484375, -3.20953369140625, -3.0501708984375, -2.89080810546875, -2.7314453125, -2.57208251953125, -2.4127197265625, -2.25335693359375, -2.093994140625, -1.93463134765625, -1.7752685546875, -1.61590576171875, -1.45654296875, -1.29718017578125, -1.1378173828125, -0.97845458984375, -0.819091796875, -0.65972900390625, -0.5003662109375, -0.34100341796875, -0.181640625, -0.02227783203125, 0.1370849609375, 0.29644775390625, 0.455810546875, 0.61517333984375, 0.7745361328125, 0.93389892578125, 1.09326171875, 1.25262451171875, 1.4119873046875, 1.57135009765625, 1.730712890625, 1.89007568359375, 2.0494384765625, 2.20880126953125, 2.3681640625, 2.52752685546875, 2.6868896484375, 2.84625244140625, 3.005615234375, 3.16497802734375, 3.3243408203125, 3.48370361328125, 3.64306640625, 3.80242919921875, 3.9617919921875, 4.12115478515625, 4.280517578125, 4.43988037109375, 4.5992431640625, 4.75860595703125, 4.91796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 7.0, 8.0, 6.0, 17.0, 19.0, 34.0, 44.0, 46.0, 98.0, 210.0, 402.0, 1135.0, 4371.0, 31711.0, 792664.0, 202403.0, 11699.0, 2268.0, 679.0, 312.0, 156.0, 94.0, 54.0, 40.0, 25.0, 15.0, 6.0, 9.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.90625, -24.009765625, -23.11328125, -22.216796875, -21.3203125, -20.423828125, -19.52734375, -18.630859375, -17.734375, -16.837890625, -15.94140625, -15.044921875, -14.1484375, -13.251953125, -12.35546875, -11.458984375, -10.5625, -9.666015625, -8.76953125, -7.873046875, -6.9765625, -6.080078125, -5.18359375, -4.287109375, -3.390625, -2.494140625, -1.59765625, -0.701171875, 0.1953125, 1.091796875, 1.98828125, 2.884765625, 3.78125, 4.677734375, 5.57421875, 6.470703125, 7.3671875, 8.263671875, 9.16015625, 10.056640625, 10.953125, 11.849609375, 12.74609375, 13.642578125, 14.5390625, 15.435546875, 16.33203125, 17.228515625, 18.125, 19.021484375, 19.91796875, 20.814453125, 21.7109375, 22.607421875, 23.50390625, 24.400390625, 25.296875, 26.193359375, 27.08984375, 27.986328125, 28.8828125, 29.779296875, 30.67578125, 31.572265625, 32.46875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 6.0, 13.0, 7.0, 11.0, 9.0, 35.0, 24.0, 32.0, 37.0, 31.0, 46.0, 56.0, 54.0, 52.0, 56.0, 71.0, 61.0, 54.0, 55.0, 43.0, 42.0, 42.0, 30.0, 16.0, 22.0, 16.0, 16.0, 13.0, 9.0, 6.0, 4.0, 4.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.1875, -19.442626953125, -18.69775390625, -17.952880859375, -17.2080078125, -16.463134765625, -15.71826171875, -14.973388671875, -14.228515625, -13.483642578125, -12.73876953125, -11.993896484375, -11.2490234375, -10.504150390625, -9.75927734375, -9.014404296875, -8.26953125, -7.524658203125, -6.77978515625, -6.034912109375, -5.2900390625, -4.545166015625, -3.80029296875, -3.055419921875, -2.310546875, -1.565673828125, -0.82080078125, -0.075927734375, 0.6689453125, 1.413818359375, 2.15869140625, 2.903564453125, 3.6484375, 4.393310546875, 5.13818359375, 5.883056640625, 6.6279296875, 7.372802734375, 8.11767578125, 8.862548828125, 9.607421875, 10.352294921875, 11.09716796875, 11.842041015625, 12.5869140625, 13.331787109375, 14.07666015625, 14.821533203125, 15.56640625, 16.311279296875, 17.05615234375, 17.801025390625, 18.5458984375, 19.290771484375, 20.03564453125, 20.780517578125, 21.525390625, 22.270263671875, 23.01513671875, 23.760009765625, 24.5048828125, 25.249755859375, 25.99462890625, 26.739501953125, 27.484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 8.0, 17.0, 13.0, 17.0, 41.0, 39.0, 68.0, 92.0, 128.0, 241.0, 538.0, 1512.0, 7600.0, 130442.0, 864743.0, 37077.0, 3949.0, 1011.0, 425.0, 200.0, 124.0, 77.0, 44.0, 42.0, 30.0, 15.0, 13.0, 13.0, 4.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-11.796875, -11.489013671875, -11.18115234375, -10.873291015625, -10.5654296875, -10.257568359375, -9.94970703125, -9.641845703125, -9.333984375, -9.026123046875, -8.71826171875, -8.410400390625, -8.1025390625, -7.794677734375, -7.48681640625, -7.178955078125, -6.87109375, -6.563232421875, -6.25537109375, -5.947509765625, -5.6396484375, -5.331787109375, -5.02392578125, -4.716064453125, -4.408203125, -4.100341796875, -3.79248046875, -3.484619140625, -3.1767578125, -2.868896484375, -2.56103515625, -2.253173828125, -1.9453125, -1.637451171875, -1.32958984375, -1.021728515625, -0.7138671875, -0.406005859375, -0.09814453125, 0.209716796875, 0.517578125, 0.825439453125, 1.13330078125, 1.441162109375, 1.7490234375, 2.056884765625, 2.36474609375, 2.672607421875, 2.98046875, 3.288330078125, 3.59619140625, 3.904052734375, 4.2119140625, 4.519775390625, 4.82763671875, 5.135498046875, 5.443359375, 5.751220703125, 6.05908203125, 6.366943359375, 6.6748046875, 6.982666015625, 7.29052734375, 7.598388671875, 7.90625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 3.0, 8.0, 8.0, 11.0, 14.0, 32.0, 21.0, 29.0, 39.0, 32.0, 59.0, 83.0, 110.0, 130.0, 100.0, 72.0, 56.0, 49.0, 25.0, 27.0, 25.0, 8.0, 22.0, 8.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007305145263671875, -0.0007054731249809265, -0.0006804317235946655, -0.0006553903222084045, -0.0006303489208221436, -0.0006053075194358826, -0.0005802661180496216, -0.0005552247166633606, -0.0005301833152770996, -0.0005051419138908386, -0.00048010051250457764, -0.00045505911111831665, -0.00043001770973205566, -0.0004049763083457947, -0.0003799349069595337, -0.0003548935055732727, -0.0003298521041870117, -0.00030481070280075073, -0.00027976930141448975, -0.00025472790002822876, -0.00022968649864196777, -0.0002046450972557068, -0.0001796036958694458, -0.00015456229448318481, -0.00012952089309692383, -0.00010447949171066284, -7.943809032440186e-05, -5.439668893814087e-05, -2.9355287551879883e-05, -4.3138861656188965e-06, 2.072751522064209e-05, 4.5768916606903076e-05, 7.081031799316406e-05, 9.585171937942505e-05, 0.00012089312076568604, 0.00014593452215194702, 0.000170975923538208, 0.000196017324924469, 0.00022105872631072998, 0.00024610012769699097, 0.00027114152908325195, 0.00029618293046951294, 0.0003212243318557739, 0.0003462657332420349, 0.0003713071346282959, 0.0003963485360145569, 0.00042138993740081787, 0.00044643133878707886, 0.00047147274017333984, 0.0004965141415596008, 0.0005215555429458618, 0.0005465969443321228, 0.0005716383457183838, 0.0005966797471046448, 0.0006217211484909058, 0.0006467625498771667, 0.0006718039512634277, 0.0006968453526496887, 0.0007218867540359497, 0.0007469281554222107, 0.0007719695568084717, 0.0007970109581947327, 0.0008220523595809937, 0.0008470937609672546, 0.0008721351623535156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 0.0, 3.0, 7.0, 6.0, 6.0, 9.0, 15.0, 11.0, 31.0, 64.0, 105.0, 144.0, 243.0, 487.0, 1035.0, 2914.0, 12206.0, 115715.0, 804547.0, 95345.0, 10891.0, 2682.0, 984.0, 469.0, 242.0, 140.0, 87.0, 53.0, 30.0, 21.0, 13.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.2734375, -8.03338623046875, -7.7933349609375, -7.55328369140625, -7.313232421875, -7.07318115234375, -6.8331298828125, -6.59307861328125, -6.35302734375, -6.11297607421875, -5.8729248046875, -5.63287353515625, -5.392822265625, -5.15277099609375, -4.9127197265625, -4.67266845703125, -4.4326171875, -4.19256591796875, -3.9525146484375, -3.71246337890625, -3.472412109375, -3.23236083984375, -2.9923095703125, -2.75225830078125, -2.51220703125, -2.27215576171875, -2.0321044921875, -1.79205322265625, -1.552001953125, -1.31195068359375, -1.0718994140625, -0.83184814453125, -0.591796875, -0.35174560546875, -0.1116943359375, 0.12835693359375, 0.368408203125, 0.60845947265625, 0.8485107421875, 1.08856201171875, 1.32861328125, 1.56866455078125, 1.8087158203125, 2.04876708984375, 2.288818359375, 2.52886962890625, 2.7689208984375, 3.00897216796875, 3.2490234375, 3.48907470703125, 3.7291259765625, 3.96917724609375, 4.209228515625, 4.44927978515625, 4.6893310546875, 4.92938232421875, 5.16943359375, 5.40948486328125, 5.6495361328125, 5.88958740234375, 6.129638671875, 6.36968994140625, 6.6097412109375, 6.84979248046875, 7.08984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 10.0, 14.0, 20.0, 31.0, 39.0, 56.0, 76.0, 82.0, 116.0, 113.0, 108.0, 91.0, 64.0, 45.0, 22.0, 22.0, 21.0, 23.0, 7.0, 11.0, 5.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.69866943359375, -8.4598388671875, -8.22100830078125, -7.982177734375, -7.74334716796875, -7.5045166015625, -7.26568603515625, -7.02685546875, -6.78802490234375, -6.5491943359375, -6.31036376953125, -6.071533203125, -5.83270263671875, -5.5938720703125, -5.35504150390625, -5.1162109375, -4.87738037109375, -4.6385498046875, -4.39971923828125, -4.160888671875, -3.92205810546875, -3.6832275390625, -3.44439697265625, -3.20556640625, -2.96673583984375, -2.7279052734375, -2.48907470703125, -2.250244140625, -2.01141357421875, -1.7725830078125, -1.53375244140625, -1.294921875, -1.05609130859375, -0.8172607421875, -0.57843017578125, -0.339599609375, -0.10076904296875, 0.1380615234375, 0.37689208984375, 0.61572265625, 0.85455322265625, 1.0933837890625, 1.33221435546875, 1.571044921875, 1.80987548828125, 2.0487060546875, 2.28753662109375, 2.5263671875, 2.76519775390625, 3.0040283203125, 3.24285888671875, 3.481689453125, 3.72052001953125, 3.9593505859375, 4.19818115234375, 4.43701171875, 4.67584228515625, 4.9146728515625, 5.15350341796875, 5.392333984375, 5.63116455078125, 5.8699951171875, 6.10882568359375, 6.34765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 19.0, 63.0, 196.0, 372.0, 247.0, 78.0, 16.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-287.728759765625, -278.8977355957031, -270.06671142578125, -261.2356872558594, -252.4046630859375, -243.57363891601562, -234.74261474609375, -225.91159057617188, -217.08056640625, -208.24954223632812, -199.41851806640625, -190.58749389648438, -181.7564697265625, -172.92544555664062, -164.09442138671875, -155.26339721679688, -146.43238830566406, -137.6013641357422, -128.7703399658203, -119.93931579589844, -111.10829162597656, -102.27726745605469, -93.44625091552734, -84.61522674560547, -75.7842025756836, -66.95317840576172, -58.122154235839844, -49.291133880615234, -40.46010971069336, -31.629085540771484, -22.798065185546875, -13.967041015625, -5.136016845703125, 3.6950063705444336, 12.526029586791992, 21.357051849365234, 30.18807601928711, 39.019100189208984, 47.850120544433594, 56.68114471435547, 65.51216888427734, 74.34319305419922, 83.1742172241211, 92.00523376464844, 100.83625793457031, 109.66728210449219, 118.49830627441406, 127.32933044433594, 136.1603546142578, 144.9913787841797, 153.82240295410156, 162.65342712402344, 171.4844512939453, 180.3154754638672, 189.146484375, 197.97750854492188, 206.80853271484375, 215.63955688476562, 224.4705810546875, 233.30160522460938, 242.13262939453125, 250.96365356445312, 259.794677734375, 268.6257019042969, 277.45672607421875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 9.0, 16.0, 14.0, 13.0, 15.0, 25.0, 25.0, 24.0, 39.0, 32.0, 32.0, 40.0, 43.0, 44.0, 41.0, 60.0, 52.0, 43.0, 52.0, 41.0, 42.0, 47.0, 33.0, 28.0, 29.0, 23.0, 24.0, 21.0, 16.0, 9.0, 14.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.92045593261719, -88.2249526977539, -85.52945709228516, -82.83395385742188, -80.1384506225586, -77.44294738769531, -74.74745178222656, -72.05194854736328, -69.3564453125, -66.66094207763672, -63.9654426574707, -61.26994323730469, -58.574440002441406, -55.87894058227539, -53.183441162109375, -50.487937927246094, -47.792442321777344, -45.09694290161133, -42.40143966674805, -39.70594024658203, -37.01043701171875, -34.314937591552734, -31.61943817138672, -28.92393684387207, -26.228435516357422, -23.532934188842773, -20.837432861328125, -18.14193344116211, -15.446432113647461, -12.750930786132812, -10.055431365966797, -7.359930038452148, -4.664421081542969, -1.9689202308654785, 0.7265806198120117, 3.4220809936523438, 6.117582321166992, 8.81308364868164, 11.508583068847656, 14.204084396362305, 16.899585723876953, 19.5950870513916, 22.29058837890625, 24.986087799072266, 27.681589126586914, 30.377090454101562, 33.07258987426758, 35.768089294433594, 38.463592529296875, 41.15909194946289, 43.85459518432617, 46.55009460449219, 49.24559783935547, 51.941097259521484, 54.6365966796875, 57.33209991455078, 60.0275993347168, 62.72309875488281, 65.4186019897461, 68.11410522460938, 70.80960083007812, 73.5051040649414, 76.20060729980469, 78.89610290527344, 81.59160614013672]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 9.0, 12.0, 15.0, 19.0, 27.0, 56.0, 80.0, 129.0, 202.0, 327.0, 696.0, 1482.0, 3933.0, 15415.0, 142849.0, 3916357.0, 93683.0, 12759.0, 3470.0, 1325.0, 603.0, 295.0, 188.0, 103.0, 90.0, 46.0, 30.0, 23.0, 14.0, 6.0, 10.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.8125, -18.296142578125, -17.77978515625, -17.263427734375, -16.7470703125, -16.230712890625, -15.71435546875, -15.197998046875, -14.681640625, -14.165283203125, -13.64892578125, -13.132568359375, -12.6162109375, -12.099853515625, -11.58349609375, -11.067138671875, -10.55078125, -10.034423828125, -9.51806640625, -9.001708984375, -8.4853515625, -7.968994140625, -7.45263671875, -6.936279296875, -6.419921875, -5.903564453125, -5.38720703125, -4.870849609375, -4.3544921875, -3.838134765625, -3.32177734375, -2.805419921875, -2.2890625, -1.772705078125, -1.25634765625, -0.739990234375, -0.2236328125, 0.292724609375, 0.80908203125, 1.325439453125, 1.841796875, 2.358154296875, 2.87451171875, 3.390869140625, 3.9072265625, 4.423583984375, 4.93994140625, 5.456298828125, 5.97265625, 6.489013671875, 7.00537109375, 7.521728515625, 8.0380859375, 8.554443359375, 9.07080078125, 9.587158203125, 10.103515625, 10.619873046875, 11.13623046875, 11.652587890625, 12.1689453125, 12.685302734375, 13.20166015625, 13.718017578125, 14.234375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 9.0, 16.0, 18.0, 34.0, 32.0, 50.0, 54.0, 68.0, 89.0, 83.0, 93.0, 81.0, 75.0, 55.0, 49.0, 48.0, 29.0, 30.0, 25.0, 21.0, 11.0, 5.0, 7.0, 4.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.75775146484375, -6.5623779296875, -6.36700439453125, -6.171630859375, -5.97625732421875, -5.7808837890625, -5.58551025390625, -5.39013671875, -5.19476318359375, -4.9993896484375, -4.80401611328125, -4.608642578125, -4.41326904296875, -4.2178955078125, -4.02252197265625, -3.8271484375, -3.63177490234375, -3.4364013671875, -3.24102783203125, -3.045654296875, -2.85028076171875, -2.6549072265625, -2.45953369140625, -2.26416015625, -2.06878662109375, -1.8734130859375, -1.67803955078125, -1.482666015625, -1.28729248046875, -1.0919189453125, -0.89654541015625, -0.701171875, -0.50579833984375, -0.3104248046875, -0.11505126953125, 0.080322265625, 0.27569580078125, 0.4710693359375, 0.66644287109375, 0.86181640625, 1.05718994140625, 1.2525634765625, 1.44793701171875, 1.643310546875, 1.83868408203125, 2.0340576171875, 2.22943115234375, 2.4248046875, 2.62017822265625, 2.8155517578125, 3.01092529296875, 3.206298828125, 3.40167236328125, 3.5970458984375, 3.79241943359375, 3.98779296875, 4.18316650390625, 4.3785400390625, 4.57391357421875, 4.769287109375, 4.96466064453125, 5.1600341796875, 5.35540771484375, 5.55078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 10.0, 12.0, 18.0, 24.0, 28.0, 40.0, 83.0, 109.0, 271.0, 654.0, 1906.0, 6923.0, 36964.0, 683968.0, 3384165.0, 64086.0, 10875.0, 2548.0, 866.0, 313.0, 146.0, 93.0, 48.0, 20.0, 27.0, 16.0, 10.0, 15.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.6217041015625, -12.173095703125, -11.7244873046875, -11.27587890625, -10.8272705078125, -10.378662109375, -9.9300537109375, -9.4814453125, -9.0328369140625, -8.584228515625, -8.1356201171875, -7.68701171875, -7.2384033203125, -6.789794921875, -6.3411865234375, -5.892578125, -5.4439697265625, -4.995361328125, -4.5467529296875, -4.09814453125, -3.6495361328125, -3.200927734375, -2.7523193359375, -2.3037109375, -1.8551025390625, -1.406494140625, -0.9578857421875, -0.50927734375, -0.0606689453125, 0.387939453125, 0.8365478515625, 1.28515625, 1.7337646484375, 2.182373046875, 2.6309814453125, 3.07958984375, 3.5281982421875, 3.976806640625, 4.4254150390625, 4.8740234375, 5.3226318359375, 5.771240234375, 6.2198486328125, 6.66845703125, 7.1170654296875, 7.565673828125, 8.0142822265625, 8.462890625, 8.9114990234375, 9.360107421875, 9.8087158203125, 10.25732421875, 10.7059326171875, 11.154541015625, 11.6031494140625, 12.0517578125, 12.5003662109375, 12.948974609375, 13.3975830078125, 13.84619140625, 14.2947998046875, 14.743408203125, 15.1920166015625, 15.640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 14.0, 11.0, 14.0, 22.0, 26.0, 50.0, 86.0, 164.0, 418.0, 1365.0, 1112.0, 350.0, 165.0, 73.0, 46.0, 31.0, 24.0, 27.0, 7.0, 10.0, 8.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.546875, -13.1697998046875, -12.792724609375, -12.4156494140625, -12.03857421875, -11.6614990234375, -11.284423828125, -10.9073486328125, -10.5302734375, -10.1531982421875, -9.776123046875, -9.3990478515625, -9.02197265625, -8.6448974609375, -8.267822265625, -7.8907470703125, -7.513671875, -7.1365966796875, -6.759521484375, -6.3824462890625, -6.00537109375, -5.6282958984375, -5.251220703125, -4.8741455078125, -4.4970703125, -4.1199951171875, -3.742919921875, -3.3658447265625, -2.98876953125, -2.6116943359375, -2.234619140625, -1.8575439453125, -1.48046875, -1.1033935546875, -0.726318359375, -0.3492431640625, 0.02783203125, 0.4049072265625, 0.781982421875, 1.1590576171875, 1.5361328125, 1.9132080078125, 2.290283203125, 2.6673583984375, 3.04443359375, 3.4215087890625, 3.798583984375, 4.1756591796875, 4.552734375, 4.9298095703125, 5.306884765625, 5.6839599609375, 6.06103515625, 6.4381103515625, 6.815185546875, 7.1922607421875, 7.5693359375, 7.9464111328125, 8.323486328125, 8.7005615234375, 9.07763671875, 9.4547119140625, 9.831787109375, 10.2088623046875, 10.5859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 19.0, 31.0, 75.0, 136.0, 178.0, 200.0, 149.0, 94.0, 44.0, 28.0, 15.0, 9.0, 9.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.3817138671875, -56.42219924926758, -53.46268844604492, -50.503173828125, -47.54365921020508, -44.584144592285156, -41.6246337890625, -38.66511917114258, -35.705604553222656, -32.746089935302734, -29.786577224731445, -26.827064514160156, -23.867549896240234, -20.908037185668945, -17.948524475097656, -14.989009857177734, -12.029499053955078, -9.069985389709473, -6.110472202301025, -3.150959014892578, -0.19144535064697266, 2.768068313598633, 5.727581024169922, 8.687095642089844, 11.646608352661133, 14.606122016906738, 17.565635681152344, 20.525148391723633, 23.484661102294922, 26.444175720214844, 29.403688430786133, 32.36320495605469, 35.322715759277344, 38.282230377197266, 41.24174118041992, 44.201255798339844, 47.160770416259766, 50.12028503417969, 53.079795837402344, 56.039310455322266, 58.99882507324219, 61.95833969116211, 64.91785430908203, 67.87736511230469, 70.83687591552734, 73.79639434814453, 76.75590515136719, 79.71542358398438, 82.6749267578125, 85.63443756103516, 88.59395599365234, 91.553466796875, 94.51297760009766, 97.47249603271484, 100.4320068359375, 103.39152526855469, 106.35103607177734, 109.310546875, 112.27006530761719, 115.22957611083984, 118.1890869140625, 121.14860534667969, 124.10811614990234, 127.067626953125, 130.0271453857422]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 12.0, 21.0, 15.0, 23.0, 38.0, 34.0, 32.0, 46.0, 55.0, 43.0, 60.0, 58.0, 61.0, 52.0, 49.0, 52.0, 58.0, 38.0, 43.0, 36.0, 22.0, 29.0, 25.0, 20.0, 10.0, 10.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.08420944213867, -44.55585479736328, -43.027503967285156, -41.499149322509766, -39.970794677734375, -38.442440032958984, -36.914085388183594, -35.38573455810547, -33.85737991333008, -32.32902526855469, -30.80067253112793, -29.272319793701172, -27.74396514892578, -26.21561050415039, -24.687257766723633, -23.158905029296875, -21.630550384521484, -20.102195739746094, -18.573843002319336, -17.045490264892578, -15.517135620117188, -13.988781929016113, -12.460428237915039, -10.932074546813965, -9.40372085571289, -7.875367164611816, -6.347013473510742, -4.818659782409668, -3.2903060913085938, -1.7619524002075195, -0.2335987091064453, 1.294754981994629, 2.8231124877929688, 4.351466178894043, 5.879819869995117, 7.408173561096191, 8.936527252197266, 10.46488094329834, 11.993234634399414, 13.521588325500488, 15.049942016601562, 16.578296661376953, 18.10664939880371, 19.63500213623047, 21.16335678100586, 22.69171142578125, 24.220064163208008, 25.748416900634766, 27.276771545410156, 28.805126190185547, 30.333478927612305, 31.861831665039062, 33.39018630981445, 34.918540954589844, 36.44689178466797, 37.97524642944336, 39.50360107421875, 41.03195571899414, 42.56031036376953, 44.088661193847656, 45.61701583862305, 47.14537048339844, 48.67372131347656, 50.20207595825195, 51.730430603027344]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 7.0, 20.0, 14.0, 43.0, 60.0, 84.0, 136.0, 238.0, 412.0, 793.0, 1655.0, 3627.0, 8752.0, 24135.0, 74243.0, 256166.0, 445173.0, 157833.0, 47979.0, 15876.0, 6067.0, 2611.0, 1186.0, 594.0, 315.0, 174.0, 120.0, 71.0, 55.0, 29.0, 20.0, 17.0, 13.0, 10.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.4202880859375, -9.137451171875, -8.8546142578125, -8.57177734375, -8.2889404296875, -8.006103515625, -7.7232666015625, -7.4404296875, -7.1575927734375, -6.874755859375, -6.5919189453125, -6.30908203125, -6.0262451171875, -5.743408203125, -5.4605712890625, -5.177734375, -4.8948974609375, -4.612060546875, -4.3292236328125, -4.04638671875, -3.7635498046875, -3.480712890625, -3.1978759765625, -2.9150390625, -2.6322021484375, -2.349365234375, -2.0665283203125, -1.78369140625, -1.5008544921875, -1.218017578125, -0.9351806640625, -0.65234375, -0.3695068359375, -0.086669921875, 0.1961669921875, 0.47900390625, 0.7618408203125, 1.044677734375, 1.3275146484375, 1.6103515625, 1.8931884765625, 2.176025390625, 2.4588623046875, 2.74169921875, 3.0245361328125, 3.307373046875, 3.5902099609375, 3.873046875, 4.1558837890625, 4.438720703125, 4.7215576171875, 5.00439453125, 5.2872314453125, 5.570068359375, 5.8529052734375, 6.1357421875, 6.4185791015625, 6.701416015625, 6.9842529296875, 7.26708984375, 7.5499267578125, 7.832763671875, 8.1156005859375, 8.3984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 7.0, 15.0, 30.0, 25.0, 43.0, 56.0, 58.0, 51.0, 74.0, 67.0, 90.0, 67.0, 70.0, 51.0, 66.0, 43.0, 37.0, 27.0, 26.0, 27.0, 15.0, 13.0, 7.0, 5.0, 9.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.58197021484375, -5.4061279296875, -5.23028564453125, -5.054443359375, -4.87860107421875, -4.7027587890625, -4.52691650390625, -4.35107421875, -4.17523193359375, -3.9993896484375, -3.82354736328125, -3.647705078125, -3.47186279296875, -3.2960205078125, -3.12017822265625, -2.9443359375, -2.76849365234375, -2.5926513671875, -2.41680908203125, -2.240966796875, -2.06512451171875, -1.8892822265625, -1.71343994140625, -1.53759765625, -1.36175537109375, -1.1859130859375, -1.01007080078125, -0.834228515625, -0.65838623046875, -0.4825439453125, -0.30670166015625, -0.130859375, 0.04498291015625, 0.2208251953125, 0.39666748046875, 0.572509765625, 0.74835205078125, 0.9241943359375, 1.10003662109375, 1.27587890625, 1.45172119140625, 1.6275634765625, 1.80340576171875, 1.979248046875, 2.15509033203125, 2.3309326171875, 2.50677490234375, 2.6826171875, 2.85845947265625, 3.0343017578125, 3.21014404296875, 3.385986328125, 3.56182861328125, 3.7376708984375, 3.91351318359375, 4.08935546875, 4.26519775390625, 4.4410400390625, 4.61688232421875, 4.792724609375, 4.96856689453125, 5.1444091796875, 5.32025146484375, 5.49609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 19.0, 22.0, 21.0, 40.0, 80.0, 126.0, 260.0, 506.0, 1302.0, 4814.0, 50719.0, 911249.0, 70832.0, 5914.0, 1393.0, 568.0, 260.0, 153.0, 94.0, 48.0, 27.0, 17.0, 19.0, 16.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-29.75, -28.888916015625, -28.02783203125, -27.166748046875, -26.3056640625, -25.444580078125, -24.58349609375, -23.722412109375, -22.861328125, -22.000244140625, -21.13916015625, -20.278076171875, -19.4169921875, -18.555908203125, -17.69482421875, -16.833740234375, -15.97265625, -15.111572265625, -14.25048828125, -13.389404296875, -12.5283203125, -11.667236328125, -10.80615234375, -9.945068359375, -9.083984375, -8.222900390625, -7.36181640625, -6.500732421875, -5.6396484375, -4.778564453125, -3.91748046875, -3.056396484375, -2.1953125, -1.334228515625, -0.47314453125, 0.387939453125, 1.2490234375, 2.110107421875, 2.97119140625, 3.832275390625, 4.693359375, 5.554443359375, 6.41552734375, 7.276611328125, 8.1376953125, 8.998779296875, 9.85986328125, 10.720947265625, 11.58203125, 12.443115234375, 13.30419921875, 14.165283203125, 15.0263671875, 15.887451171875, 16.74853515625, 17.609619140625, 18.470703125, 19.331787109375, 20.19287109375, 21.053955078125, 21.9150390625, 22.776123046875, 23.63720703125, 24.498291015625, 25.359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 12.0, 13.0, 21.0, 16.0, 26.0, 45.0, 40.0, 58.0, 55.0, 74.0, 92.0, 70.0, 74.0, 84.0, 70.0, 60.0, 50.0, 33.0, 22.0, 13.0, 14.0, 11.0, 9.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.453125, -26.606689453125, -25.76025390625, -24.913818359375, -24.0673828125, -23.220947265625, -22.37451171875, -21.528076171875, -20.681640625, -19.835205078125, -18.98876953125, -18.142333984375, -17.2958984375, -16.449462890625, -15.60302734375, -14.756591796875, -13.91015625, -13.063720703125, -12.21728515625, -11.370849609375, -10.5244140625, -9.677978515625, -8.83154296875, -7.985107421875, -7.138671875, -6.292236328125, -5.44580078125, -4.599365234375, -3.7529296875, -2.906494140625, -2.06005859375, -1.213623046875, -0.3671875, 0.479248046875, 1.32568359375, 2.172119140625, 3.0185546875, 3.864990234375, 4.71142578125, 5.557861328125, 6.404296875, 7.250732421875, 8.09716796875, 8.943603515625, 9.7900390625, 10.636474609375, 11.48291015625, 12.329345703125, 13.17578125, 14.022216796875, 14.86865234375, 15.715087890625, 16.5615234375, 17.407958984375, 18.25439453125, 19.100830078125, 19.947265625, 20.793701171875, 21.64013671875, 22.486572265625, 23.3330078125, 24.179443359375, 25.02587890625, 25.872314453125, 26.71875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 11.0, 19.0, 13.0, 26.0, 43.0, 57.0, 120.0, 234.0, 548.0, 1867.0, 12760.0, 652423.0, 367472.0, 10171.0, 1705.0, 523.0, 231.0, 93.0, 53.0, 50.0, 39.0, 18.0, 15.0, 13.0, 5.0, 6.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.4375, -13.0531005859375, -12.668701171875, -12.2843017578125, -11.89990234375, -11.5155029296875, -11.131103515625, -10.7467041015625, -10.3623046875, -9.9779052734375, -9.593505859375, -9.2091064453125, -8.82470703125, -8.4403076171875, -8.055908203125, -7.6715087890625, -7.287109375, -6.9027099609375, -6.518310546875, -6.1339111328125, -5.74951171875, -5.3651123046875, -4.980712890625, -4.5963134765625, -4.2119140625, -3.8275146484375, -3.443115234375, -3.0587158203125, -2.67431640625, -2.2899169921875, -1.905517578125, -1.5211181640625, -1.13671875, -0.7523193359375, -0.367919921875, 0.0164794921875, 0.40087890625, 0.7852783203125, 1.169677734375, 1.5540771484375, 1.9384765625, 2.3228759765625, 2.707275390625, 3.0916748046875, 3.47607421875, 3.8604736328125, 4.244873046875, 4.6292724609375, 5.013671875, 5.3980712890625, 5.782470703125, 6.1668701171875, 6.55126953125, 6.9356689453125, 7.320068359375, 7.7044677734375, 8.0888671875, 8.4732666015625, 8.857666015625, 9.2420654296875, 9.62646484375, 10.0108642578125, 10.395263671875, 10.7796630859375, 11.1640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 13.0, 12.0, 23.0, 37.0, 22.0, 39.0, 46.0, 88.0, 134.0, 145.0, 125.0, 76.0, 52.0, 35.0, 28.0, 26.0, 14.0, 10.0, 13.0, 5.0, 8.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000988006591796875, -0.0009590983390808105, -0.0009301900863647461, -0.0009012818336486816, -0.0008723735809326172, -0.0008434653282165527, -0.0008145570755004883, -0.0007856488227844238, -0.0007567405700683594, -0.0007278323173522949, -0.0006989240646362305, -0.000670015811920166, -0.0006411075592041016, -0.0006121993064880371, -0.0005832910537719727, -0.0005543828010559082, -0.0005254745483398438, -0.0004965662956237793, -0.00046765804290771484, -0.0004387497901916504, -0.00040984153747558594, -0.0003809332847595215, -0.00035202503204345703, -0.0003231167793273926, -0.0002942085266113281, -0.00026530027389526367, -0.00023639202117919922, -0.00020748376846313477, -0.0001785755157470703, -0.00014966726303100586, -0.0001207590103149414, -9.185075759887695e-05, -6.29425048828125e-05, -3.403425216674805e-05, -5.125999450683594e-06, 2.378225326538086e-05, 5.269050598144531e-05, 8.159875869750977e-05, 0.00011050701141357422, 0.00013941526412963867, 0.00016832351684570312, 0.00019723176956176758, 0.00022614002227783203, 0.0002550482749938965, 0.00028395652770996094, 0.0003128647804260254, 0.00034177303314208984, 0.0003706812858581543, 0.00039958953857421875, 0.0004284977912902832, 0.00045740604400634766, 0.0004863142967224121, 0.0005152225494384766, 0.000544130802154541, 0.0005730390548706055, 0.0006019473075866699, 0.0006308555603027344, 0.0006597638130187988, 0.0006886720657348633, 0.0007175803184509277, 0.0007464885711669922, 0.0007753968238830566, 0.0008043050765991211, 0.0008332133293151855, 0.00086212158203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 3.0, 8.0, 6.0, 9.0, 13.0, 21.0, 45.0, 48.0, 83.0, 124.0, 259.0, 478.0, 1069.0, 3050.0, 13654.0, 177487.0, 803598.0, 39514.0, 5740.0, 1755.0, 738.0, 352.0, 181.0, 101.0, 60.0, 49.0, 30.0, 25.0, 20.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.3046875, -10.0203857421875, -9.736083984375, -9.4517822265625, -9.16748046875, -8.8831787109375, -8.598876953125, -8.3145751953125, -8.0302734375, -7.7459716796875, -7.461669921875, -7.1773681640625, -6.89306640625, -6.6087646484375, -6.324462890625, -6.0401611328125, -5.755859375, -5.4715576171875, -5.187255859375, -4.9029541015625, -4.61865234375, -4.3343505859375, -4.050048828125, -3.7657470703125, -3.4814453125, -3.1971435546875, -2.912841796875, -2.6285400390625, -2.34423828125, -2.0599365234375, -1.775634765625, -1.4913330078125, -1.20703125, -0.9227294921875, -0.638427734375, -0.3541259765625, -0.06982421875, 0.2144775390625, 0.498779296875, 0.7830810546875, 1.0673828125, 1.3516845703125, 1.635986328125, 1.9202880859375, 2.20458984375, 2.4888916015625, 2.773193359375, 3.0574951171875, 3.341796875, 3.6260986328125, 3.910400390625, 4.1947021484375, 4.47900390625, 4.7633056640625, 5.047607421875, 5.3319091796875, 5.6162109375, 5.9005126953125, 6.184814453125, 6.4691162109375, 6.75341796875, 7.0377197265625, 7.322021484375, 7.6063232421875, 7.890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 3.0, 7.0, 10.0, 7.0, 16.0, 15.0, 22.0, 22.0, 32.0, 29.0, 46.0, 56.0, 79.0, 95.0, 79.0, 87.0, 85.0, 64.0, 38.0, 36.0, 28.0, 30.0, 24.0, 13.0, 19.0, 14.0, 6.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6953125, -4.537109375, -4.37890625, -4.220703125, -4.0625, -3.904296875, -3.74609375, -3.587890625, -3.4296875, -3.271484375, -3.11328125, -2.955078125, -2.796875, -2.638671875, -2.48046875, -2.322265625, -2.1640625, -2.005859375, -1.84765625, -1.689453125, -1.53125, -1.373046875, -1.21484375, -1.056640625, -0.8984375, -0.740234375, -0.58203125, -0.423828125, -0.265625, -0.107421875, 0.05078125, 0.208984375, 0.3671875, 0.525390625, 0.68359375, 0.841796875, 1.0, 1.158203125, 1.31640625, 1.474609375, 1.6328125, 1.791015625, 1.94921875, 2.107421875, 2.265625, 2.423828125, 2.58203125, 2.740234375, 2.8984375, 3.056640625, 3.21484375, 3.373046875, 3.53125, 3.689453125, 3.84765625, 4.005859375, 4.1640625, 4.322265625, 4.48046875, 4.638671875, 4.796875, 4.955078125, 5.11328125, 5.271484375, 5.4296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 10.0, 15.0, 89.0, 247.0, 401.0, 170.0, 46.0, 12.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.50225830078125, -296.6404724121094, -289.7786865234375, -282.91693115234375, -276.0551452636719, -269.193359375, -262.3315734863281, -255.46978759765625, -248.60801696777344, -241.74623107910156, -234.88446044921875, -228.02267456054688, -221.160888671875, -214.2991180419922, -207.4373321533203, -200.5755615234375, -193.71377563476562, -186.85198974609375, -179.99021911621094, -173.12843322753906, -166.26666259765625, -159.40487670898438, -152.5430908203125, -145.68130493164062, -138.8195343017578, -131.95774841308594, -125.09597778320312, -118.23419189453125, -111.3724136352539, -104.51063537597656, -97.64884948730469, -90.78707122802734, -83.92529296875, -77.06351470947266, -70.20173645019531, -63.33995056152344, -56.478172302246094, -49.61639404296875, -42.75461196899414, -35.89282989501953, -29.031051635742188, -22.16927146911621, -15.307491302490234, -8.445711135864258, -1.5839309692382812, 5.2778472900390625, 12.139629364013672, 19.00141143798828, 25.863189697265625, 32.72496795654297, 39.58675003051758, 46.44853210449219, 53.31031036376953, 60.172088623046875, 67.03387451171875, 73.8956527709961, 80.75743103027344, 87.61920928955078, 94.48098754882812, 101.3427734375, 108.20455169677734, 115.06632995605469, 121.92811584472656, 128.78988647460938, 135.65167236328125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 20.0, 9.0, 15.0, 20.0, 11.0, 8.0, 20.0, 22.0, 23.0, 30.0, 32.0, 50.0, 49.0, 51.0, 58.0, 65.0, 64.0, 68.0, 44.0, 43.0, 40.0, 33.0, 41.0, 23.0, 26.0, 31.0, 19.0, 14.0, 12.0, 8.0, 9.0, 8.0, 11.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.936309814453125, -61.731563568115234, -59.526817321777344, -57.32207489013672, -55.11732864379883, -52.91258239746094, -50.70783996582031, -48.50309371948242, -46.29834747314453, -44.09360122680664, -41.88885498046875, -39.684112548828125, -37.479366302490234, -35.274620056152344, -33.06987762451172, -30.865131378173828, -28.660385131835938, -26.455638885498047, -24.25089454650879, -22.04615020751953, -19.84140396118164, -17.63665771484375, -15.431913375854492, -13.227168083190918, -11.022422790527344, -8.81767749786377, -6.612932205200195, -4.408186912536621, -2.203441619873047, 0.0013036727905273438, 2.2060489654541016, 4.410794258117676, 6.615531921386719, 8.820277214050293, 11.025022506713867, 13.229767799377441, 15.434513092041016, 17.639259338378906, 19.844003677368164, 22.048748016357422, 24.253494262695312, 26.458240509033203, 28.66298484802246, 30.86772918701172, 33.07247543334961, 35.2772216796875, 37.481964111328125, 39.686710357666016, 41.891456604003906, 44.0962028503418, 46.30094909667969, 48.50569152832031, 50.7104377746582, 52.915184020996094, 55.11992645263672, 57.32467269897461, 59.5294189453125, 61.73416519165039, 63.93891143798828, 66.1436538696289, 68.34840393066406, 70.55314636230469, 72.75788879394531, 74.96263885498047, 77.1673812866211]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 0.0, 18.0, 22.0, 27.0, 60.0, 110.0, 229.0, 754.0, 18121.0, 4147659.0, 25745.0, 1030.0, 227.0, 118.0, 65.0, 43.0, 19.0, 14.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.625, -38.54052734375, -37.4560546875, -36.37158203125, -35.287109375, -34.20263671875, -33.1181640625, -32.03369140625, -30.94921875, -29.86474609375, -28.7802734375, -27.69580078125, -26.611328125, -25.52685546875, -24.4423828125, -23.35791015625, -22.2734375, -21.18896484375, -20.1044921875, -19.02001953125, -17.935546875, -16.85107421875, -15.7666015625, -14.68212890625, -13.59765625, -12.51318359375, -11.4287109375, -10.34423828125, -9.259765625, -8.17529296875, -7.0908203125, -6.00634765625, -4.921875, -3.83740234375, -2.7529296875, -1.66845703125, -0.583984375, 0.50048828125, 1.5849609375, 2.66943359375, 3.75390625, 4.83837890625, 5.9228515625, 7.00732421875, 8.091796875, 9.17626953125, 10.2607421875, 11.34521484375, 12.4296875, 13.51416015625, 14.5986328125, 15.68310546875, 16.767578125, 17.85205078125, 18.9365234375, 20.02099609375, 21.10546875, 22.18994140625, 23.2744140625, 24.35888671875, 25.443359375, 26.52783203125, 27.6123046875, 28.69677734375, 29.78125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 0.0, 8.0, 20.0, 29.0, 29.0, 46.0, 62.0, 63.0, 64.0, 94.0, 83.0, 75.0, 84.0, 70.0, 67.0, 65.0, 34.0, 25.0, 29.0, 19.0, 12.0, 6.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.105682373046875, -2.91253662109375, -2.719390869140625, -2.5262451171875, -2.333099365234375, -2.13995361328125, -1.946807861328125, -1.753662109375, -1.560516357421875, -1.36737060546875, -1.174224853515625, -0.9810791015625, -0.787933349609375, -0.59478759765625, -0.401641845703125, -0.20849609375, -0.015350341796875, 0.17779541015625, 0.370941162109375, 0.5640869140625, 0.757232666015625, 0.95037841796875, 1.143524169921875, 1.336669921875, 1.529815673828125, 1.72296142578125, 1.916107177734375, 2.1092529296875, 2.302398681640625, 2.49554443359375, 2.688690185546875, 2.8818359375, 3.074981689453125, 3.26812744140625, 3.461273193359375, 3.6544189453125, 3.847564697265625, 4.04071044921875, 4.233856201171875, 4.427001953125, 4.620147705078125, 4.81329345703125, 5.006439208984375, 5.1995849609375, 5.392730712890625, 5.58587646484375, 5.779022216796875, 5.97216796875, 6.165313720703125, 6.35845947265625, 6.551605224609375, 6.7447509765625, 6.937896728515625, 7.13104248046875, 7.324188232421875, 7.517333984375, 7.710479736328125, 7.90362548828125, 8.096771240234375, 8.2899169921875, 8.483062744140625, 8.67620849609375, 8.869354248046875, 9.0625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 11.0, 6.0, 7.0, 12.0, 29.0, 54.0, 82.0, 183.0, 386.0, 850.0, 1939.0, 4316.0, 11273.0, 40371.0, 311231.0, 3461863.0, 305432.0, 39109.0, 10580.0, 3797.0, 1586.0, 629.0, 284.0, 119.0, 57.0, 35.0, 9.0, 18.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.18878173828125, -5.9361572265625, -5.68353271484375, -5.430908203125, -5.17828369140625, -4.9256591796875, -4.67303466796875, -4.42041015625, -4.16778564453125, -3.9151611328125, -3.66253662109375, -3.409912109375, -3.15728759765625, -2.9046630859375, -2.65203857421875, -2.3994140625, -2.14678955078125, -1.8941650390625, -1.64154052734375, -1.388916015625, -1.13629150390625, -0.8836669921875, -0.63104248046875, -0.37841796875, -0.12579345703125, 0.1268310546875, 0.37945556640625, 0.632080078125, 0.88470458984375, 1.1373291015625, 1.38995361328125, 1.642578125, 1.89520263671875, 2.1478271484375, 2.40045166015625, 2.653076171875, 2.90570068359375, 3.1583251953125, 3.41094970703125, 3.66357421875, 3.91619873046875, 4.1688232421875, 4.42144775390625, 4.674072265625, 4.92669677734375, 5.1793212890625, 5.43194580078125, 5.6845703125, 5.93719482421875, 6.1898193359375, 6.44244384765625, 6.695068359375, 6.94769287109375, 7.2003173828125, 7.45294189453125, 7.70556640625, 7.95819091796875, 8.2108154296875, 8.46343994140625, 8.716064453125, 8.96868896484375, 9.2213134765625, 9.47393798828125, 9.7265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 9.0, 19.0, 20.0, 31.0, 45.0, 78.0, 142.0, 231.0, 530.0, 881.0, 943.0, 523.0, 248.0, 134.0, 70.0, 43.0, 27.0, 24.0, 14.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.2734375, -9.01593017578125, -8.7584228515625, -8.50091552734375, -8.243408203125, -7.98590087890625, -7.7283935546875, -7.47088623046875, -7.21337890625, -6.95587158203125, -6.6983642578125, -6.44085693359375, -6.183349609375, -5.92584228515625, -5.6683349609375, -5.41082763671875, -5.1533203125, -4.89581298828125, -4.6383056640625, -4.38079833984375, -4.123291015625, -3.86578369140625, -3.6082763671875, -3.35076904296875, -3.09326171875, -2.83575439453125, -2.5782470703125, -2.32073974609375, -2.063232421875, -1.80572509765625, -1.5482177734375, -1.29071044921875, -1.033203125, -0.77569580078125, -0.5181884765625, -0.26068115234375, -0.003173828125, 0.25433349609375, 0.5118408203125, 0.76934814453125, 1.02685546875, 1.28436279296875, 1.5418701171875, 1.79937744140625, 2.056884765625, 2.31439208984375, 2.5718994140625, 2.82940673828125, 3.0869140625, 3.34442138671875, 3.6019287109375, 3.85943603515625, 4.116943359375, 4.37445068359375, 4.6319580078125, 4.88946533203125, 5.14697265625, 5.40447998046875, 5.6619873046875, 5.91949462890625, 6.177001953125, 6.43450927734375, 6.6920166015625, 6.94952392578125, 7.20703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 17.0, 32.0, 83.0, 233.0, 306.0, 190.0, 78.0, 28.0, 11.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.44131469726562, -107.99988555908203, -104.55845642089844, -101.11701965332031, -97.67559051513672, -94.23416137695312, -90.79273223876953, -87.35130310058594, -83.90987396240234, -80.46844482421875, -77.02701568603516, -73.58558654785156, -70.14414978027344, -66.70272064208984, -63.26129150390625, -59.819862365722656, -56.3784294128418, -52.9370002746582, -49.495567321777344, -46.05413818359375, -42.612709045410156, -39.17127990722656, -35.7298469543457, -32.28841781616211, -28.846986770629883, -25.405555725097656, -21.964126586914062, -18.522695541381836, -15.081265449523926, -11.639835357666016, -8.198404312133789, -4.756975173950195, -1.3155441284179688, 2.1258862018585205, 5.56731653213501, 9.008747100830078, 12.450177192687988, 15.891607284545898, 19.333038330078125, 22.77446746826172, 26.215898513793945, 29.657329559326172, 33.098758697509766, 36.540191650390625, 39.98162078857422, 43.42304992675781, 46.864479064941406, 50.305908203125, 53.74734115600586, 57.18877029418945, 60.63020324707031, 64.0716323852539, 67.5130615234375, 70.9544906616211, 74.39591979980469, 77.83735656738281, 81.2787857055664, 84.72021484375, 88.1616439819336, 91.60307312011719, 95.04450988769531, 98.4859390258789, 101.9273681640625, 105.3687973022461, 108.81022644042969]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 9.0, 5.0, 5.0, 8.0, 16.0, 21.0, 22.0, 31.0, 22.0, 32.0, 36.0, 45.0, 49.0, 33.0, 41.0, 56.0, 52.0, 51.0, 51.0, 58.0, 40.0, 41.0, 36.0, 50.0, 33.0, 30.0, 25.0, 15.0, 25.0, 12.0, 10.0, 10.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-45.58937454223633, -44.4271240234375, -43.26487350463867, -42.102622985839844, -40.940372467041016, -39.77812194824219, -38.61587142944336, -37.45362091064453, -36.29137420654297, -35.12912368774414, -33.96687316894531, -32.804622650146484, -31.642372131347656, -30.480121612548828, -29.317873001098633, -28.155622482299805, -26.993370056152344, -25.831119537353516, -24.668869018554688, -23.50661849975586, -22.34436798095703, -21.182117462158203, -20.019868850708008, -18.85761833190918, -17.69536781311035, -16.533117294311523, -15.370866775512695, -14.208617210388184, -13.046366691589355, -11.884116172790527, -10.721866607666016, -9.559616088867188, -8.39736557006836, -7.235115051269531, -6.072865009307861, -4.910614967346191, -3.7483644485473633, -2.586113929748535, -1.4238638877868652, -0.2616138458251953, 0.9006366729736328, 2.062886953353882, 3.225137233734131, 4.387387275695801, 5.549637794494629, 6.711888313293457, 7.874138355255127, 9.036388397216797, 10.198638916015625, 11.360889434814453, 12.523139953613281, 13.685389518737793, 14.847640037536621, 16.009891510009766, 17.17214012145996, 18.33439064025879, 19.496641159057617, 20.658891677856445, 21.821142196655273, 22.9833927154541, 24.145641326904297, 25.307891845703125, 26.470142364501953, 27.63239288330078, 28.79464340209961]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 4.0, 9.0, 6.0, 7.0, 12.0, 18.0, 14.0, 30.0, 57.0, 73.0, 83.0, 176.0, 250.0, 423.0, 876.0, 1721.0, 3522.0, 7964.0, 18418.0, 46118.0, 129153.0, 360311.0, 307860.0, 104594.0, 37975.0, 15710.0, 6674.0, 3010.0, 1606.0, 780.0, 426.0, 208.0, 143.0, 88.0, 65.0, 41.0, 32.0, 22.0, 26.0, 17.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-7.328125, -7.1181640625, -6.908203125, -6.6982421875, -6.48828125, -6.2783203125, -6.068359375, -5.8583984375, -5.6484375, -5.4384765625, -5.228515625, -5.0185546875, -4.80859375, -4.5986328125, -4.388671875, -4.1787109375, -3.96875, -3.7587890625, -3.548828125, -3.3388671875, -3.12890625, -2.9189453125, -2.708984375, -2.4990234375, -2.2890625, -2.0791015625, -1.869140625, -1.6591796875, -1.44921875, -1.2392578125, -1.029296875, -0.8193359375, -0.609375, -0.3994140625, -0.189453125, 0.0205078125, 0.23046875, 0.4404296875, 0.650390625, 0.8603515625, 1.0703125, 1.2802734375, 1.490234375, 1.7001953125, 1.91015625, 2.1201171875, 2.330078125, 2.5400390625, 2.75, 2.9599609375, 3.169921875, 3.3798828125, 3.58984375, 3.7998046875, 4.009765625, 4.2197265625, 4.4296875, 4.6396484375, 4.849609375, 5.0595703125, 5.26953125, 5.4794921875, 5.689453125, 5.8994140625, 6.109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 6.0, 6.0, 9.0, 15.0, 14.0, 34.0, 35.0, 41.0, 48.0, 49.0, 55.0, 69.0, 66.0, 70.0, 71.0, 58.0, 48.0, 55.0, 50.0, 41.0, 38.0, 26.0, 26.0, 14.0, 16.0, 9.0, 14.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.1275634765625, -2.977783203125, -2.8280029296875, -2.67822265625, -2.5284423828125, -2.378662109375, -2.2288818359375, -2.0791015625, -1.9293212890625, -1.779541015625, -1.6297607421875, -1.47998046875, -1.3302001953125, -1.180419921875, -1.0306396484375, -0.880859375, -0.7310791015625, -0.581298828125, -0.4315185546875, -0.28173828125, -0.1319580078125, 0.017822265625, 0.1676025390625, 0.3173828125, 0.4671630859375, 0.616943359375, 0.7667236328125, 0.91650390625, 1.0662841796875, 1.216064453125, 1.3658447265625, 1.515625, 1.6654052734375, 1.815185546875, 1.9649658203125, 2.11474609375, 2.2645263671875, 2.414306640625, 2.5640869140625, 2.7138671875, 2.8636474609375, 3.013427734375, 3.1632080078125, 3.31298828125, 3.4627685546875, 3.612548828125, 3.7623291015625, 3.912109375, 4.0618896484375, 4.211669921875, 4.3614501953125, 4.51123046875, 4.6610107421875, 4.810791015625, 4.9605712890625, 5.1103515625, 5.2601318359375, 5.409912109375, 5.5596923828125, 5.70947265625, 5.8592529296875, 6.009033203125, 6.1588134765625, 6.30859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 11.0, 16.0, 24.0, 32.0, 46.0, 80.0, 143.0, 341.0, 971.0, 3876.0, 48532.0, 890486.0, 96220.0, 5811.0, 1111.0, 434.0, 194.0, 104.0, 54.0, 28.0, 17.0, 10.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.671875, -23.9150390625, -23.158203125, -22.4013671875, -21.64453125, -20.8876953125, -20.130859375, -19.3740234375, -18.6171875, -17.8603515625, -17.103515625, -16.3466796875, -15.58984375, -14.8330078125, -14.076171875, -13.3193359375, -12.5625, -11.8056640625, -11.048828125, -10.2919921875, -9.53515625, -8.7783203125, -8.021484375, -7.2646484375, -6.5078125, -5.7509765625, -4.994140625, -4.2373046875, -3.48046875, -2.7236328125, -1.966796875, -1.2099609375, -0.453125, 0.3037109375, 1.060546875, 1.8173828125, 2.57421875, 3.3310546875, 4.087890625, 4.8447265625, 5.6015625, 6.3583984375, 7.115234375, 7.8720703125, 8.62890625, 9.3857421875, 10.142578125, 10.8994140625, 11.65625, 12.4130859375, 13.169921875, 13.9267578125, 14.68359375, 15.4404296875, 16.197265625, 16.9541015625, 17.7109375, 18.4677734375, 19.224609375, 19.9814453125, 20.73828125, 21.4951171875, 22.251953125, 23.0087890625, 23.765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 8.0, 7.0, 1.0, 17.0, 21.0, 19.0, 22.0, 24.0, 18.0, 22.0, 27.0, 45.0, 49.0, 56.0, 42.0, 58.0, 50.0, 54.0, 46.0, 51.0, 42.0, 46.0, 35.0, 31.0, 30.0, 35.0, 23.0, 15.0, 16.0, 14.0, 16.0, 13.0, 14.0, 10.0, 8.0, 8.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.5703125, -14.1319580078125, -13.693603515625, -13.2552490234375, -12.81689453125, -12.3785400390625, -11.940185546875, -11.5018310546875, -11.0634765625, -10.6251220703125, -10.186767578125, -9.7484130859375, -9.31005859375, -8.8717041015625, -8.433349609375, -7.9949951171875, -7.556640625, -7.1182861328125, -6.679931640625, -6.2415771484375, -5.80322265625, -5.3648681640625, -4.926513671875, -4.4881591796875, -4.0498046875, -3.6114501953125, -3.173095703125, -2.7347412109375, -2.29638671875, -1.8580322265625, -1.419677734375, -0.9813232421875, -0.54296875, -0.1046142578125, 0.333740234375, 0.7720947265625, 1.21044921875, 1.6488037109375, 2.087158203125, 2.5255126953125, 2.9638671875, 3.4022216796875, 3.840576171875, 4.2789306640625, 4.71728515625, 5.1556396484375, 5.593994140625, 6.0323486328125, 6.470703125, 6.9090576171875, 7.347412109375, 7.7857666015625, 8.22412109375, 8.6624755859375, 9.100830078125, 9.5391845703125, 9.9775390625, 10.4158935546875, 10.854248046875, 11.2926025390625, 11.73095703125, 12.1693115234375, 12.607666015625, 13.0460205078125, 13.484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 15.0, 54.0, 123.0, 745.0, 51320.0, 994487.0, 1503.0, 189.0, 58.0, 20.0, 13.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.0, -50.76611328125, -49.5322265625, -48.29833984375, -47.064453125, -45.83056640625, -44.5966796875, -43.36279296875, -42.12890625, -40.89501953125, -39.6611328125, -38.42724609375, -37.193359375, -35.95947265625, -34.7255859375, -33.49169921875, -32.2578125, -31.02392578125, -29.7900390625, -28.55615234375, -27.322265625, -26.08837890625, -24.8544921875, -23.62060546875, -22.38671875, -21.15283203125, -19.9189453125, -18.68505859375, -17.451171875, -16.21728515625, -14.9833984375, -13.74951171875, -12.515625, -11.28173828125, -10.0478515625, -8.81396484375, -7.580078125, -6.34619140625, -5.1123046875, -3.87841796875, -2.64453125, -1.41064453125, -0.1767578125, 1.05712890625, 2.291015625, 3.52490234375, 4.7587890625, 5.99267578125, 7.2265625, 8.46044921875, 9.6943359375, 10.92822265625, 12.162109375, 13.39599609375, 14.6298828125, 15.86376953125, 17.09765625, 18.33154296875, 19.5654296875, 20.79931640625, 22.033203125, 23.26708984375, 24.5009765625, 25.73486328125, 26.96875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 5.0, 4.0, 7.0, 12.0, 15.0, 15.0, 30.0, 67.0, 104.0, 198.0, 221.0, 130.0, 80.0, 34.0, 20.0, 13.0, 14.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013456344604492188, -0.0013024955987930298, -0.0012593567371368408, -0.0012162178754806519, -0.0011730790138244629, -0.001129940152168274, -0.001086801290512085, -0.001043662428855896, -0.001000523567199707, -0.0009573847055435181, -0.0009142458438873291, -0.0008711069822311401, -0.0008279681205749512, -0.0007848292589187622, -0.0007416903972625732, -0.0006985515356063843, -0.0006554126739501953, -0.0006122738122940063, -0.0005691349506378174, -0.0005259960889816284, -0.00048285722732543945, -0.0004397183656692505, -0.0003965795040130615, -0.00035344064235687256, -0.0003103017807006836, -0.00026716291904449463, -0.00022402405738830566, -0.0001808851957321167, -0.00013774633407592773, -9.460747241973877e-05, -5.1468610763549805e-05, -8.32974910736084e-06, 3.4809112548828125e-05, 7.794797420501709e-05, 0.00012108683586120605, 0.00016422569751739502, 0.00020736455917358398, 0.00025050342082977295, 0.0002936422824859619, 0.0003367811441421509, 0.00037992000579833984, 0.0004230588674545288, 0.0004661977291107178, 0.0005093365907669067, 0.0005524754524230957, 0.0005956143140792847, 0.0006387531757354736, 0.0006818920373916626, 0.0007250308990478516, 0.0007681697607040405, 0.0008113086223602295, 0.0008544474840164185, 0.0008975863456726074, 0.0009407252073287964, 0.0009838640689849854, 0.0010270029306411743, 0.0010701417922973633, 0.0011132806539535522, 0.0011564195156097412, 0.0011995583772659302, 0.0012426972389221191, 0.001285836100578308, 0.001328974962234497, 0.001372113823890686, 0.001415252685546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 7.0, 17.0, 22.0, 28.0, 47.0, 69.0, 114.0, 277.0, 659.0, 1966.0, 9188.0, 134450.0, 859843.0, 35308.0, 4549.0, 1104.0, 429.0, 208.0, 93.0, 57.0, 25.0, 19.0, 18.0, 17.0, 6.0, 4.0, 9.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-9.578125, -9.298828125, -9.01953125, -8.740234375, -8.4609375, -8.181640625, -7.90234375, -7.623046875, -7.34375, -7.064453125, -6.78515625, -6.505859375, -6.2265625, -5.947265625, -5.66796875, -5.388671875, -5.109375, -4.830078125, -4.55078125, -4.271484375, -3.9921875, -3.712890625, -3.43359375, -3.154296875, -2.875, -2.595703125, -2.31640625, -2.037109375, -1.7578125, -1.478515625, -1.19921875, -0.919921875, -0.640625, -0.361328125, -0.08203125, 0.197265625, 0.4765625, 0.755859375, 1.03515625, 1.314453125, 1.59375, 1.873046875, 2.15234375, 2.431640625, 2.7109375, 2.990234375, 3.26953125, 3.548828125, 3.828125, 4.107421875, 4.38671875, 4.666015625, 4.9453125, 5.224609375, 5.50390625, 5.783203125, 6.0625, 6.341796875, 6.62109375, 6.900390625, 7.1796875, 7.458984375, 7.73828125, 8.017578125, 8.296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 10.0, 11.0, 6.0, 11.0, 15.0, 30.0, 56.0, 75.0, 73.0, 100.0, 152.0, 131.0, 104.0, 79.0, 45.0, 25.0, 18.0, 17.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.9542236328125, -6.748291015625, -6.5423583984375, -6.33642578125, -6.1304931640625, -5.924560546875, -5.7186279296875, -5.5126953125, -5.3067626953125, -5.100830078125, -4.8948974609375, -4.68896484375, -4.4830322265625, -4.277099609375, -4.0711669921875, -3.865234375, -3.6593017578125, -3.453369140625, -3.2474365234375, -3.04150390625, -2.8355712890625, -2.629638671875, -2.4237060546875, -2.2177734375, -2.0118408203125, -1.805908203125, -1.5999755859375, -1.39404296875, -1.1881103515625, -0.982177734375, -0.7762451171875, -0.5703125, -0.3643798828125, -0.158447265625, 0.0474853515625, 0.25341796875, 0.4593505859375, 0.665283203125, 0.8712158203125, 1.0771484375, 1.2830810546875, 1.489013671875, 1.6949462890625, 1.90087890625, 2.1068115234375, 2.312744140625, 2.5186767578125, 2.724609375, 2.9305419921875, 3.136474609375, 3.3424072265625, 3.54833984375, 3.7542724609375, 3.960205078125, 4.1661376953125, 4.3720703125, 4.5780029296875, 4.783935546875, 4.9898681640625, 5.19580078125, 5.4017333984375, 5.607666015625, 5.8135986328125, 6.01953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 18.0, 62.0, 328.0, 525.0, 58.0, 7.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-601.3699340820312, -590.484375, -579.5988159179688, -568.7132568359375, -557.8276977539062, -546.942138671875, -536.0565185546875, -525.1709594726562, -514.285400390625, -503.39984130859375, -492.5142822265625, -481.62872314453125, -470.7431335449219, -459.8575744628906, -448.9720153808594, -438.0864562988281, -427.2008972167969, -416.3153381347656, -405.4297790527344, -394.544189453125, -383.65863037109375, -372.7730712890625, -361.88751220703125, -351.001953125, -340.11639404296875, -329.2308349609375, -318.34527587890625, -307.459716796875, -296.5741271972656, -285.6885681152344, -274.8030090332031, -263.9174499511719, -253.03189086914062, -242.14633178710938, -231.26075744628906, -220.3751983642578, -209.4896240234375, -198.60406494140625, -187.718505859375, -176.83294677734375, -165.94737243652344, -155.0618133544922, -144.17623901367188, -133.29067993164062, -122.40511322021484, -111.51954650878906, -100.63398742675781, -89.74842071533203, -78.86285400390625, -67.97728729248047, -57.09172439575195, -46.20616149902344, -35.320594787597656, -24.435028076171875, -13.549468994140625, -2.6639022827148438, 8.221664428710938, 19.107229232788086, 29.992794036865234, 40.87835693359375, 51.76392364501953, 62.64949035644531, 73.53504943847656, 84.42061614990234, 95.30618286132812]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 12.0, 6.0, 14.0, 9.0, 9.0, 13.0, 14.0, 26.0, 25.0, 35.0, 24.0, 28.0, 30.0, 43.0, 40.0, 60.0, 50.0, 59.0, 57.0, 48.0, 42.0, 38.0, 32.0, 28.0, 33.0, 34.0, 27.0, 26.0, 15.0, 19.0, 13.0, 15.0, 16.0, 16.0, 7.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-63.37405014038086, -61.506629943847656, -59.63920974731445, -57.77178955078125, -55.90436935424805, -54.036949157714844, -52.169532775878906, -50.30210876464844, -48.4346923828125, -46.5672721862793, -44.699851989746094, -42.83243179321289, -40.96501159667969, -39.097591400146484, -37.23017120361328, -35.362754821777344, -33.495330810546875, -31.627910614013672, -29.76049041748047, -27.893070220947266, -26.025650024414062, -24.15822982788086, -22.29081153869629, -20.423391342163086, -18.555971145629883, -16.68855094909668, -14.821130752563477, -12.95371150970459, -11.086291313171387, -9.218871116638184, -7.351451873779297, -5.484031677246094, -3.616607666015625, -1.749187707901001, 0.11823225021362305, 1.985651969909668, 3.853072166442871, 5.720492362976074, 7.587911605834961, 9.455331802368164, 11.322751998901367, 13.19017219543457, 15.057592391967773, 16.925010681152344, 18.792430877685547, 20.65985107421875, 22.527271270751953, 24.394691467285156, 26.26211166381836, 28.129531860351562, 29.996952056884766, 31.86437225341797, 33.73179244995117, 35.599212646484375, 37.46662902832031, 39.33405303955078, 41.20146942138672, 43.06888961791992, 44.936309814453125, 46.80373001098633, 48.67115020751953, 50.538570404052734, 52.40599060058594, 54.273406982421875, 56.140830993652344]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 4.0, 13.0, 21.0, 35.0, 44.0, 99.0, 188.0, 367.0, 969.0, 3404.0, 16202.0, 145440.0, 3534638.0, 454187.0, 30415.0, 5605.0, 1570.0, 575.0, 239.0, 107.0, 62.0, 33.0, 12.0, 17.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.6177978515625, -10.282470703125, -9.9471435546875, -9.61181640625, -9.2764892578125, -8.941162109375, -8.6058349609375, -8.2705078125, -7.9351806640625, -7.599853515625, -7.2645263671875, -6.92919921875, -6.5938720703125, -6.258544921875, -5.9232177734375, -5.587890625, -5.2525634765625, -4.917236328125, -4.5819091796875, -4.24658203125, -3.9112548828125, -3.575927734375, -3.2406005859375, -2.9052734375, -2.5699462890625, -2.234619140625, -1.8992919921875, -1.56396484375, -1.2286376953125, -0.893310546875, -0.5579833984375, -0.22265625, 0.1126708984375, 0.447998046875, 0.7833251953125, 1.11865234375, 1.4539794921875, 1.789306640625, 2.1246337890625, 2.4599609375, 2.7952880859375, 3.130615234375, 3.4659423828125, 3.80126953125, 4.1365966796875, 4.471923828125, 4.8072509765625, 5.142578125, 5.4779052734375, 5.813232421875, 6.1485595703125, 6.48388671875, 6.8192138671875, 7.154541015625, 7.4898681640625, 7.8251953125, 8.1605224609375, 8.495849609375, 8.8311767578125, 9.16650390625, 9.5018310546875, 9.837158203125, 10.1724853515625, 10.5078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 13.0, 11.0, 13.0, 17.0, 14.0, 29.0, 20.0, 24.0, 39.0, 32.0, 35.0, 43.0, 38.0, 49.0, 53.0, 43.0, 36.0, 45.0, 43.0, 46.0, 40.0, 38.0, 42.0, 32.0, 31.0, 24.0, 22.0, 28.0, 14.0, 13.0, 9.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.193359375, -3.099639892578125, -3.00592041015625, -2.912200927734375, -2.8184814453125, -2.724761962890625, -2.63104248046875, -2.537322998046875, -2.443603515625, -2.349884033203125, -2.25616455078125, -2.162445068359375, -2.0687255859375, -1.975006103515625, -1.88128662109375, -1.787567138671875, -1.69384765625, -1.600128173828125, -1.50640869140625, -1.412689208984375, -1.3189697265625, -1.225250244140625, -1.13153076171875, -1.037811279296875, -0.944091796875, -0.850372314453125, -0.75665283203125, -0.662933349609375, -0.5692138671875, -0.475494384765625, -0.38177490234375, -0.288055419921875, -0.1943359375, -0.100616455078125, -0.00689697265625, 0.086822509765625, 0.1805419921875, 0.274261474609375, 0.36798095703125, 0.461700439453125, 0.555419921875, 0.649139404296875, 0.74285888671875, 0.836578369140625, 0.9302978515625, 1.024017333984375, 1.11773681640625, 1.211456298828125, 1.30517578125, 1.398895263671875, 1.49261474609375, 1.586334228515625, 1.6800537109375, 1.773773193359375, 1.86749267578125, 1.961212158203125, 2.054931640625, 2.148651123046875, 2.24237060546875, 2.336090087890625, 2.4298095703125, 2.523529052734375, 2.61724853515625, 2.710968017578125, 2.8046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 9.0, 13.0, 21.0, 24.0, 40.0, 95.0, 210.0, 410.0, 1181.0, 4246.0, 25191.0, 381135.0, 3652689.0, 115234.0, 10741.0, 1986.0, 541.0, 255.0, 130.0, 49.0, 39.0, 16.0, 17.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.439208984375, -9.03466796875, -8.630126953125, -8.2255859375, -7.821044921875, -7.41650390625, -7.011962890625, -6.607421875, -6.202880859375, -5.79833984375, -5.393798828125, -4.9892578125, -4.584716796875, -4.18017578125, -3.775634765625, -3.37109375, -2.966552734375, -2.56201171875, -2.157470703125, -1.7529296875, -1.348388671875, -0.94384765625, -0.539306640625, -0.134765625, 0.269775390625, 0.67431640625, 1.078857421875, 1.4833984375, 1.887939453125, 2.29248046875, 2.697021484375, 3.1015625, 3.506103515625, 3.91064453125, 4.315185546875, 4.7197265625, 5.124267578125, 5.52880859375, 5.933349609375, 6.337890625, 6.742431640625, 7.14697265625, 7.551513671875, 7.9560546875, 8.360595703125, 8.76513671875, 9.169677734375, 9.57421875, 9.978759765625, 10.38330078125, 10.787841796875, 11.1923828125, 11.596923828125, 12.00146484375, 12.406005859375, 12.810546875, 13.215087890625, 13.61962890625, 14.024169921875, 14.4287109375, 14.833251953125, 15.23779296875, 15.642333984375, 16.046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 9.0, 15.0, 13.0, 26.0, 34.0, 39.0, 80.0, 128.0, 195.0, 436.0, 792.0, 1061.0, 592.0, 274.0, 142.0, 79.0, 62.0, 34.0, 20.0, 14.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.82470703125, -11.4697265625, -11.11474609375, -10.759765625, -10.40478515625, -10.0498046875, -9.69482421875, -9.33984375, -8.98486328125, -8.6298828125, -8.27490234375, -7.919921875, -7.56494140625, -7.2099609375, -6.85498046875, -6.5, -6.14501953125, -5.7900390625, -5.43505859375, -5.080078125, -4.72509765625, -4.3701171875, -4.01513671875, -3.66015625, -3.30517578125, -2.9501953125, -2.59521484375, -2.240234375, -1.88525390625, -1.5302734375, -1.17529296875, -0.8203125, -0.46533203125, -0.1103515625, 0.24462890625, 0.599609375, 0.95458984375, 1.3095703125, 1.66455078125, 2.01953125, 2.37451171875, 2.7294921875, 3.08447265625, 3.439453125, 3.79443359375, 4.1494140625, 4.50439453125, 4.859375, 5.21435546875, 5.5693359375, 5.92431640625, 6.279296875, 6.63427734375, 6.9892578125, 7.34423828125, 7.69921875, 8.05419921875, 8.4091796875, 8.76416015625, 9.119140625, 9.47412109375, 9.8291015625, 10.18408203125, 10.5390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 31.0, 67.0, 151.0, 199.0, 211.0, 141.0, 89.0, 41.0, 17.0, 8.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.14857482910156, -85.72647094726562, -82.30436706542969, -78.88226318359375, -75.46016693115234, -72.0380630493164, -68.61595916748047, -65.19385528564453, -61.77175521850586, -58.34965133666992, -54.92755126953125, -51.50544738769531, -48.083343505859375, -44.6612434387207, -41.239139556884766, -37.817039489746094, -34.394935607910156, -30.97283363342285, -27.550731658935547, -24.12862777709961, -20.706525802612305, -17.284423828125, -13.862319946289062, -10.440217971801758, -7.018115997314453, -3.5960135459899902, -0.17391109466552734, 3.2481918334960938, 6.670293807983398, 10.092395782470703, 13.51449966430664, 16.936601638793945, 20.35870361328125, 23.780805587768555, 27.20290756225586, 30.625011444091797, 34.04711151123047, 37.469215393066406, 40.891319274902344, 44.31342315673828, 47.73552322387695, 51.15762710571289, 54.57972717285156, 58.0018310546875, 61.42393493652344, 64.84603881835938, 68.26814270019531, 71.69023895263672, 75.11234283447266, 78.5344467163086, 81.95655059814453, 85.37864685058594, 88.80075073242188, 92.22285461425781, 95.64495849609375, 99.06706237792969, 102.48916625976562, 105.91127014160156, 109.3333740234375, 112.75547790527344, 116.17757415771484, 119.59967803955078, 123.02178192138672, 126.44388580322266, 129.86598205566406]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 11.0, 10.0, 12.0, 15.0, 18.0, 36.0, 20.0, 33.0, 37.0, 40.0, 35.0, 56.0, 44.0, 52.0, 51.0, 48.0, 35.0, 38.0, 52.0, 43.0, 47.0, 40.0, 32.0, 30.0, 25.0, 25.0, 23.0, 19.0, 15.0, 3.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.12617492675781, -46.679893493652344, -45.23360824584961, -43.78732681274414, -42.341041564941406, -40.89476013183594, -39.4484748840332, -38.002193450927734, -36.555908203125, -35.10962677001953, -33.6633415222168, -32.21706008911133, -30.770774841308594, -29.324491500854492, -27.87820816040039, -26.431926727294922, -24.98564338684082, -23.53936004638672, -22.093076705932617, -20.646793365478516, -19.200510025024414, -17.754226684570312, -16.307945251464844, -14.861660957336426, -13.415377616882324, -11.969094276428223, -10.522810935974121, -9.076528549194336, -7.630244731903076, -6.183961391448975, -4.737678527832031, -3.2913951873779297, -1.8451118469238281, -0.3988286256790161, 1.047454595565796, 2.4937376976013184, 3.94002103805542, 5.3863043785095215, 6.832587242126465, 8.278870582580566, 9.725153923034668, 11.17143726348877, 12.617720603942871, 14.064002990722656, 15.510286331176758, 16.95656967163086, 18.40285301208496, 19.849136352539062, 21.295419692993164, 22.741703033447266, 24.187986373901367, 25.63426971435547, 27.08055305480957, 28.526836395263672, 29.97311782836914, 31.419403076171875, 32.865684509277344, 34.31196594238281, 35.75825119018555, 37.204532623291016, 38.65081787109375, 40.09709930419922, 41.54338455200195, 42.98966598510742, 44.435951232910156]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 13.0, 18.0, 38.0, 62.0, 86.0, 160.0, 274.0, 508.0, 973.0, 1860.0, 4204.0, 10525.0, 29057.0, 82355.0, 235260.0, 398048.0, 183321.0, 63968.0, 22496.0, 8427.0, 3592.0, 1586.0, 724.0, 419.0, 229.0, 132.0, 67.0, 44.0, 30.0, 23.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0, -6.7838134765625, -6.567626953125, -6.3514404296875, -6.13525390625, -5.9190673828125, -5.702880859375, -5.4866943359375, -5.2705078125, -5.0543212890625, -4.838134765625, -4.6219482421875, -4.40576171875, -4.1895751953125, -3.973388671875, -3.7572021484375, -3.541015625, -3.3248291015625, -3.108642578125, -2.8924560546875, -2.67626953125, -2.4600830078125, -2.243896484375, -2.0277099609375, -1.8115234375, -1.5953369140625, -1.379150390625, -1.1629638671875, -0.94677734375, -0.7305908203125, -0.514404296875, -0.2982177734375, -0.08203125, 0.1341552734375, 0.350341796875, 0.5665283203125, 0.78271484375, 0.9989013671875, 1.215087890625, 1.4312744140625, 1.6474609375, 1.8636474609375, 2.079833984375, 2.2960205078125, 2.51220703125, 2.7283935546875, 2.944580078125, 3.1607666015625, 3.376953125, 3.5931396484375, 3.809326171875, 4.0255126953125, 4.24169921875, 4.4578857421875, 4.674072265625, 4.8902587890625, 5.1064453125, 5.3226318359375, 5.538818359375, 5.7550048828125, 5.97119140625, 6.1873779296875, 6.403564453125, 6.6197509765625, 6.8359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 21.0, 23.0, 22.0, 18.0, 29.0, 27.0, 28.0, 33.0, 42.0, 44.0, 49.0, 50.0, 50.0, 37.0, 45.0, 51.0, 45.0, 51.0, 33.0, 42.0, 39.0, 31.0, 24.0, 28.0, 22.0, 23.0, 15.0, 9.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.587890625, -3.4920654296875, -3.396240234375, -3.3004150390625, -3.20458984375, -3.1087646484375, -3.012939453125, -2.9171142578125, -2.8212890625, -2.7254638671875, -2.629638671875, -2.5338134765625, -2.43798828125, -2.3421630859375, -2.246337890625, -2.1505126953125, -2.0546875, -1.9588623046875, -1.863037109375, -1.7672119140625, -1.67138671875, -1.5755615234375, -1.479736328125, -1.3839111328125, -1.2880859375, -1.1922607421875, -1.096435546875, -1.0006103515625, -0.90478515625, -0.8089599609375, -0.713134765625, -0.6173095703125, -0.521484375, -0.4256591796875, -0.329833984375, -0.2340087890625, -0.13818359375, -0.0423583984375, 0.053466796875, 0.1492919921875, 0.2451171875, 0.3409423828125, 0.436767578125, 0.5325927734375, 0.62841796875, 0.7242431640625, 0.820068359375, 0.9158935546875, 1.01171875, 1.1075439453125, 1.203369140625, 1.2991943359375, 1.39501953125, 1.4908447265625, 1.586669921875, 1.6824951171875, 1.7783203125, 1.8741455078125, 1.969970703125, 2.0657958984375, 2.16162109375, 2.2574462890625, 2.353271484375, 2.4490966796875, 2.544921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 10.0, 10.0, 10.0, 20.0, 22.0, 31.0, 51.0, 65.0, 84.0, 117.0, 196.0, 294.0, 445.0, 772.0, 1156.0, 2438.0, 6606.0, 37192.0, 437236.0, 510142.0, 38928.0, 6894.0, 2449.0, 1276.0, 729.0, 453.0, 295.0, 196.0, 131.0, 95.0, 60.0, 35.0, 25.0, 25.0, 30.0, 5.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.8828125, -14.4451904296875, -14.007568359375, -13.5699462890625, -13.13232421875, -12.6947021484375, -12.257080078125, -11.8194580078125, -11.3818359375, -10.9442138671875, -10.506591796875, -10.0689697265625, -9.63134765625, -9.1937255859375, -8.756103515625, -8.3184814453125, -7.880859375, -7.4432373046875, -7.005615234375, -6.5679931640625, -6.13037109375, -5.6927490234375, -5.255126953125, -4.8175048828125, -4.3798828125, -3.9422607421875, -3.504638671875, -3.0670166015625, -2.62939453125, -2.1917724609375, -1.754150390625, -1.3165283203125, -0.87890625, -0.4412841796875, -0.003662109375, 0.4339599609375, 0.87158203125, 1.3092041015625, 1.746826171875, 2.1844482421875, 2.6220703125, 3.0596923828125, 3.497314453125, 3.9349365234375, 4.37255859375, 4.8101806640625, 5.247802734375, 5.6854248046875, 6.123046875, 6.5606689453125, 6.998291015625, 7.4359130859375, 7.87353515625, 8.3111572265625, 8.748779296875, 9.1864013671875, 9.6240234375, 10.0616455078125, 10.499267578125, 10.9368896484375, 11.37451171875, 11.8121337890625, 12.249755859375, 12.6873779296875, 13.125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 11.0, 11.0, 16.0, 13.0, 20.0, 28.0, 30.0, 29.0, 39.0, 36.0, 52.0, 32.0, 45.0, 59.0, 59.0, 49.0, 41.0, 45.0, 42.0, 39.0, 38.0, 37.0, 34.0, 35.0, 20.0, 28.0, 16.0, 14.0, 23.0, 8.0, 6.0, 5.0, 8.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.6795654296875, -14.249755859375, -13.8199462890625, -13.39013671875, -12.9603271484375, -12.530517578125, -12.1007080078125, -11.6708984375, -11.2410888671875, -10.811279296875, -10.3814697265625, -9.95166015625, -9.5218505859375, -9.092041015625, -8.6622314453125, -8.232421875, -7.8026123046875, -7.372802734375, -6.9429931640625, -6.51318359375, -6.0833740234375, -5.653564453125, -5.2237548828125, -4.7939453125, -4.3641357421875, -3.934326171875, -3.5045166015625, -3.07470703125, -2.6448974609375, -2.215087890625, -1.7852783203125, -1.35546875, -0.9256591796875, -0.495849609375, -0.0660400390625, 0.36376953125, 0.7935791015625, 1.223388671875, 1.6531982421875, 2.0830078125, 2.5128173828125, 2.942626953125, 3.3724365234375, 3.80224609375, 4.2320556640625, 4.661865234375, 5.0916748046875, 5.521484375, 5.9512939453125, 6.381103515625, 6.8109130859375, 7.24072265625, 7.6705322265625, 8.100341796875, 8.5301513671875, 8.9599609375, 9.3897705078125, 9.819580078125, 10.2493896484375, 10.67919921875, 11.1090087890625, 11.538818359375, 11.9686279296875, 12.3984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 8.0, 16.0, 23.0, 33.0, 45.0, 56.0, 137.0, 196.0, 338.0, 726.0, 2067.0, 7529.0, 47770.0, 805030.0, 162679.0, 15924.0, 3612.0, 1169.0, 489.0, 274.0, 156.0, 76.0, 48.0, 34.0, 30.0, 20.0, 12.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.47265625, -7.27459716796875, -7.0765380859375, -6.87847900390625, -6.680419921875, -6.48236083984375, -6.2843017578125, -6.08624267578125, -5.88818359375, -5.69012451171875, -5.4920654296875, -5.29400634765625, -5.095947265625, -4.89788818359375, -4.6998291015625, -4.50177001953125, -4.3037109375, -4.10565185546875, -3.9075927734375, -3.70953369140625, -3.511474609375, -3.31341552734375, -3.1153564453125, -2.91729736328125, -2.71923828125, -2.52117919921875, -2.3231201171875, -2.12506103515625, -1.927001953125, -1.72894287109375, -1.5308837890625, -1.33282470703125, -1.134765625, -0.93670654296875, -0.7386474609375, -0.54058837890625, -0.342529296875, -0.14447021484375, 0.0535888671875, 0.25164794921875, 0.44970703125, 0.64776611328125, 0.8458251953125, 1.04388427734375, 1.241943359375, 1.44000244140625, 1.6380615234375, 1.83612060546875, 2.0341796875, 2.23223876953125, 2.4302978515625, 2.62835693359375, 2.826416015625, 3.02447509765625, 3.2225341796875, 3.42059326171875, 3.61865234375, 3.81671142578125, 4.0147705078125, 4.21282958984375, 4.410888671875, 4.60894775390625, 4.8070068359375, 5.00506591796875, 5.203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 6.0, 4.0, 1.0, 8.0, 10.0, 18.0, 21.0, 19.0, 35.0, 34.0, 42.0, 63.0, 106.0, 195.0, 128.0, 68.0, 72.0, 30.0, 35.0, 18.0, 17.0, 13.0, 5.0, 8.0, 8.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011119842529296875, -0.001074463129043579, -0.0010369420051574707, -0.0009994208812713623, -0.0009618997573852539, -0.0009243786334991455, -0.0008868575096130371, -0.0008493363857269287, -0.0008118152618408203, -0.0007742941379547119, -0.0007367730140686035, -0.0006992518901824951, -0.0006617307662963867, -0.0006242096424102783, -0.0005866885185241699, -0.0005491673946380615, -0.0005116462707519531, -0.0004741251468658447, -0.00043660402297973633, -0.00039908289909362793, -0.00036156177520751953, -0.00032404065132141113, -0.00028651952743530273, -0.00024899840354919434, -0.00021147727966308594, -0.00017395615577697754, -0.00013643503189086914, -9.891390800476074e-05, -6.139278411865234e-05, -2.3871660232543945e-05, 1.3649463653564453e-05, 5.117058753967285e-05, 8.869171142578125e-05, 0.00012621283531188965, 0.00016373395919799805, 0.00020125508308410645, 0.00023877620697021484, 0.00027629733085632324, 0.00031381845474243164, 0.00035133957862854004, 0.00038886070251464844, 0.00042638182640075684, 0.00046390295028686523, 0.0005014240741729736, 0.000538945198059082, 0.0005764663219451904, 0.0006139874458312988, 0.0006515085697174072, 0.0006890296936035156, 0.000726550817489624, 0.0007640719413757324, 0.0008015930652618408, 0.0008391141891479492, 0.0008766353130340576, 0.000914156436920166, 0.0009516775608062744, 0.0009891986846923828, 0.0010267198085784912, 0.0010642409324645996, 0.001101762056350708, 0.0011392831802368164, 0.0011768043041229248, 0.0012143254280090332, 0.0012518465518951416, 0.00128936767578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 14.0, 12.0, 14.0, 29.0, 43.0, 57.0, 99.0, 156.0, 221.0, 363.0, 624.0, 1194.0, 2521.0, 6478.0, 20953.0, 133647.0, 773903.0, 82328.0, 15848.0, 5307.0, 2152.0, 1043.0, 547.0, 337.0, 215.0, 131.0, 83.0, 65.0, 45.0, 29.0, 20.0, 13.0, 10.0, 7.0, 4.0, 6.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.5546875, -4.40484619140625, -4.2550048828125, -4.10516357421875, -3.955322265625, -3.80548095703125, -3.6556396484375, -3.50579833984375, -3.35595703125, -3.20611572265625, -3.0562744140625, -2.90643310546875, -2.756591796875, -2.60675048828125, -2.4569091796875, -2.30706787109375, -2.1572265625, -2.00738525390625, -1.8575439453125, -1.70770263671875, -1.557861328125, -1.40802001953125, -1.2581787109375, -1.10833740234375, -0.95849609375, -0.80865478515625, -0.6588134765625, -0.50897216796875, -0.359130859375, -0.20928955078125, -0.0594482421875, 0.09039306640625, 0.240234375, 0.39007568359375, 0.5399169921875, 0.68975830078125, 0.839599609375, 0.98944091796875, 1.1392822265625, 1.28912353515625, 1.43896484375, 1.58880615234375, 1.7386474609375, 1.88848876953125, 2.038330078125, 2.18817138671875, 2.3380126953125, 2.48785400390625, 2.6376953125, 2.78753662109375, 2.9373779296875, 3.08721923828125, 3.237060546875, 3.38690185546875, 3.5367431640625, 3.68658447265625, 3.83642578125, 3.98626708984375, 4.1361083984375, 4.28594970703125, 4.435791015625, 4.58563232421875, 4.7354736328125, 4.88531494140625, 5.03515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 0.0, 4.0, 9.0, 5.0, 8.0, 10.0, 12.0, 11.0, 17.0, 28.0, 37.0, 53.0, 65.0, 106.0, 118.0, 131.0, 97.0, 78.0, 50.0, 43.0, 26.0, 13.0, 20.0, 12.0, 5.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.41796875, -5.275787353515625, -5.13360595703125, -4.991424560546875, -4.8492431640625, -4.707061767578125, -4.56488037109375, -4.422698974609375, -4.280517578125, -4.138336181640625, -3.99615478515625, -3.853973388671875, -3.7117919921875, -3.569610595703125, -3.42742919921875, -3.285247802734375, -3.14306640625, -3.000885009765625, -2.85870361328125, -2.716522216796875, -2.5743408203125, -2.432159423828125, -2.28997802734375, -2.147796630859375, -2.005615234375, -1.863433837890625, -1.72125244140625, -1.579071044921875, -1.4368896484375, -1.294708251953125, -1.15252685546875, -1.010345458984375, -0.8681640625, -0.725982666015625, -0.58380126953125, -0.441619873046875, -0.2994384765625, -0.157257080078125, -0.01507568359375, 0.127105712890625, 0.269287109375, 0.411468505859375, 0.55364990234375, 0.695831298828125, 0.8380126953125, 0.980194091796875, 1.12237548828125, 1.264556884765625, 1.40673828125, 1.548919677734375, 1.69110107421875, 1.833282470703125, 1.9754638671875, 2.117645263671875, 2.25982666015625, 2.402008056640625, 2.544189453125, 2.686370849609375, 2.82855224609375, 2.970733642578125, 3.1129150390625, 3.255096435546875, 3.39727783203125, 3.539459228515625, 3.681640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 21.0, 55.0, 122.0, 235.0, 274.0, 146.0, 68.0, 34.0, 11.0, 8.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.13037872314453, -88.49954223632812, -84.86870574951172, -81.23786926269531, -77.6070327758789, -73.9761962890625, -70.34535217285156, -66.71452331542969, -63.083683013916016, -59.45284652709961, -55.8220100402832, -52.19116973876953, -48.560333251953125, -44.92949676513672, -41.29866027832031, -37.667823791503906, -34.0369873046875, -30.406150817871094, -26.775314331054688, -23.14447593688965, -19.513639450073242, -15.882802963256836, -12.251964569091797, -8.62112808227539, -4.990291595458984, -1.35945463180542, 2.2713823318481445, 5.902219772338867, 9.533056259155273, 13.16389274597168, 16.79473114013672, 20.425567626953125, 24.056396484375, 27.687232971191406, 31.318069458007812, 34.94890594482422, 38.579742431640625, 42.21057891845703, 45.8414192199707, 49.47225570678711, 53.103092193603516, 56.73392868041992, 60.36476516723633, 63.99560546875, 67.6264419555664, 71.25727844238281, 74.88811492919922, 78.51895141601562, 82.14978790283203, 85.78062438964844, 89.41146087646484, 93.04229736328125, 96.67313385009766, 100.30397033691406, 103.934814453125, 107.56564331054688, 111.19648742675781, 114.82732391357422, 118.45816040039062, 122.08899688720703, 125.71983337402344, 129.35067749023438, 132.98150634765625, 136.6123504638672, 140.24317932128906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 8.0, 11.0, 21.0, 17.0, 30.0, 23.0, 19.0, 23.0, 33.0, 30.0, 41.0, 43.0, 51.0, 58.0, 79.0, 75.0, 54.0, 54.0, 35.0, 27.0, 31.0, 35.0, 27.0, 19.0, 30.0, 15.0, 20.0, 12.0, 14.0, 12.0, 4.0, 9.0, 9.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.071678161621094, -60.34473419189453, -58.61779022216797, -56.890846252441406, -55.163902282714844, -53.43695831298828, -51.71001052856445, -49.98306655883789, -48.25612258911133, -46.529178619384766, -44.8022346496582, -43.07529067993164, -41.34834289550781, -39.62139892578125, -37.89445495605469, -36.167510986328125, -34.44056701660156, -32.713623046875, -30.986679077148438, -29.259733200073242, -27.53278923034668, -25.805845260620117, -24.078899383544922, -22.35195541381836, -20.625011444091797, -18.898067474365234, -17.171123504638672, -15.444177627563477, -13.717233657836914, -11.990289688110352, -10.263344764709473, -8.536399841308594, -6.809459686279297, -5.082515239715576, -3.3555707931518555, -1.6286263465881348, 0.09831809997558594, 1.8252620697021484, 3.5522069931030273, 5.279151916503906, 7.006095886230469, 8.733039855957031, 10.45998477935791, 12.186929702758789, 13.913873672485352, 15.640817642211914, 17.36776351928711, 19.094707489013672, 20.821651458740234, 22.548595428466797, 24.27553939819336, 26.002485275268555, 27.729429244995117, 29.45637321472168, 31.183319091796875, 32.91026306152344, 34.63720703125, 36.36415100097656, 38.091094970703125, 39.81803894042969, 41.54498291015625, 43.27192687988281, 44.99887466430664, 46.7258186340332, 48.452762603759766]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 11.0, 10.0, 19.0, 22.0, 30.0, 61.0, 58.0, 97.0, 160.0, 265.0, 445.0, 788.0, 1474.0, 2785.0, 6083.0, 14958.0, 44714.0, 223033.0, 2063211.0, 1598283.0, 173223.0, 39447.0, 13629.0, 5652.0, 2608.0, 1361.0, 703.0, 405.0, 268.0, 159.0, 109.0, 60.0, 43.0, 29.0, 28.0, 15.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.75408935546875, -4.6097412109375, -4.46539306640625, -4.321044921875, -4.17669677734375, -4.0323486328125, -3.88800048828125, -3.74365234375, -3.59930419921875, -3.4549560546875, -3.31060791015625, -3.166259765625, -3.02191162109375, -2.8775634765625, -2.73321533203125, -2.5888671875, -2.44451904296875, -2.3001708984375, -2.15582275390625, -2.011474609375, -1.86712646484375, -1.7227783203125, -1.57843017578125, -1.43408203125, -1.28973388671875, -1.1453857421875, -1.00103759765625, -0.856689453125, -0.71234130859375, -0.5679931640625, -0.42364501953125, -0.279296875, -0.13494873046875, 0.0093994140625, 0.15374755859375, 0.298095703125, 0.44244384765625, 0.5867919921875, 0.73114013671875, 0.87548828125, 1.01983642578125, 1.1641845703125, 1.30853271484375, 1.452880859375, 1.59722900390625, 1.7415771484375, 1.88592529296875, 2.0302734375, 2.17462158203125, 2.3189697265625, 2.46331787109375, 2.607666015625, 2.75201416015625, 2.8963623046875, 3.04071044921875, 3.18505859375, 3.32940673828125, 3.4737548828125, 3.61810302734375, 3.762451171875, 3.90679931640625, 4.0511474609375, 4.19549560546875, 4.33984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 8.0, 10.0, 11.0, 16.0, 18.0, 23.0, 30.0, 27.0, 25.0, 39.0, 48.0, 40.0, 55.0, 60.0, 54.0, 59.0, 49.0, 59.0, 44.0, 55.0, 44.0, 46.0, 37.0, 17.0, 18.0, 28.0, 18.0, 15.0, 14.0, 10.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.34210205078125, -3.2388916015625, -3.13568115234375, -3.032470703125, -2.92926025390625, -2.8260498046875, -2.72283935546875, -2.61962890625, -2.51641845703125, -2.4132080078125, -2.30999755859375, -2.206787109375, -2.10357666015625, -2.0003662109375, -1.89715576171875, -1.7939453125, -1.69073486328125, -1.5875244140625, -1.48431396484375, -1.381103515625, -1.27789306640625, -1.1746826171875, -1.07147216796875, -0.96826171875, -0.86505126953125, -0.7618408203125, -0.65863037109375, -0.555419921875, -0.45220947265625, -0.3489990234375, -0.24578857421875, -0.142578125, -0.03936767578125, 0.0638427734375, 0.16705322265625, 0.270263671875, 0.37347412109375, 0.4766845703125, 0.57989501953125, 0.68310546875, 0.78631591796875, 0.8895263671875, 0.99273681640625, 1.095947265625, 1.19915771484375, 1.3023681640625, 1.40557861328125, 1.5087890625, 1.61199951171875, 1.7152099609375, 1.81842041015625, 1.921630859375, 2.02484130859375, 2.1280517578125, 2.23126220703125, 2.33447265625, 2.43768310546875, 2.5408935546875, 2.64410400390625, 2.747314453125, 2.85052490234375, 2.9537353515625, 3.05694580078125, 3.16015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 12.0, 14.0, 31.0, 54.0, 64.0, 126.0, 208.0, 327.0, 684.0, 1605.0, 4854.0, 18141.0, 96137.0, 1842098.0, 2100233.0, 102478.0, 18017.0, 5004.0, 1937.0, 844.0, 484.0, 277.0, 199.0, 130.0, 75.0, 63.0, 39.0, 33.0, 28.0, 21.0, 12.0, 14.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9765625, -5.7376708984375, -5.498779296875, -5.2598876953125, -5.02099609375, -4.7821044921875, -4.543212890625, -4.3043212890625, -4.0654296875, -3.8265380859375, -3.587646484375, -3.3487548828125, -3.10986328125, -2.8709716796875, -2.632080078125, -2.3931884765625, -2.154296875, -1.9154052734375, -1.676513671875, -1.4376220703125, -1.19873046875, -0.9598388671875, -0.720947265625, -0.4820556640625, -0.2431640625, -0.0042724609375, 0.234619140625, 0.4735107421875, 0.71240234375, 0.9512939453125, 1.190185546875, 1.4290771484375, 1.66796875, 1.9068603515625, 2.145751953125, 2.3846435546875, 2.62353515625, 2.8624267578125, 3.101318359375, 3.3402099609375, 3.5791015625, 3.8179931640625, 4.056884765625, 4.2957763671875, 4.53466796875, 4.7735595703125, 5.012451171875, 5.2513427734375, 5.490234375, 5.7291259765625, 5.968017578125, 6.2069091796875, 6.44580078125, 6.6846923828125, 6.923583984375, 7.1624755859375, 7.4013671875, 7.6402587890625, 7.879150390625, 8.1180419921875, 8.35693359375, 8.5958251953125, 8.834716796875, 9.0736083984375, 9.3125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 9.0, 8.0, 12.0, 27.0, 27.0, 38.0, 101.0, 166.0, 358.0, 772.0, 1145.0, 759.0, 299.0, 142.0, 92.0, 41.0, 30.0, 15.0, 10.0, 14.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.57696533203125, -4.2359619140625, -3.89495849609375, -3.553955078125, -3.21295166015625, -2.8719482421875, -2.53094482421875, -2.18994140625, -1.84893798828125, -1.5079345703125, -1.16693115234375, -0.825927734375, -0.48492431640625, -0.1439208984375, 0.19708251953125, 0.5380859375, 0.87908935546875, 1.2200927734375, 1.56109619140625, 1.902099609375, 2.24310302734375, 2.5841064453125, 2.92510986328125, 3.26611328125, 3.60711669921875, 3.9481201171875, 4.28912353515625, 4.630126953125, 4.97113037109375, 5.3121337890625, 5.65313720703125, 5.994140625, 6.33514404296875, 6.6761474609375, 7.01715087890625, 7.358154296875, 7.69915771484375, 8.0401611328125, 8.38116455078125, 8.72216796875, 9.06317138671875, 9.4041748046875, 9.74517822265625, 10.086181640625, 10.42718505859375, 10.7681884765625, 11.10919189453125, 11.4501953125, 11.79119873046875, 12.1322021484375, 12.47320556640625, 12.814208984375, 13.15521240234375, 13.4962158203125, 13.83721923828125, 14.17822265625, 14.51922607421875, 14.8602294921875, 15.20123291015625, 15.542236328125, 15.88323974609375, 16.2242431640625, 16.56524658203125, 16.90625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 15.0, 103.0, 343.0, 373.0, 114.0, 20.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.40359497070312, -211.8328857421875, -206.26217651367188, -200.69146728515625, -195.12075805664062, -189.550048828125, -183.97933959960938, -178.4086456298828, -172.8379364013672, -167.26722717285156, -161.69651794433594, -156.1258087158203, -150.5550994873047, -144.98440551757812, -139.4136962890625, -133.84298706054688, -128.27227783203125, -122.70156860351562, -117.130859375, -111.56015014648438, -105.98944854736328, -100.41873931884766, -94.84803009033203, -89.27732849121094, -83.70660400390625, -78.13589477539062, -72.565185546875, -66.99447631835938, -61.42377471923828, -55.853065490722656, -50.28235626220703, -44.71165084838867, -39.14094543457031, -33.57023620605469, -27.999530792236328, -22.428821563720703, -16.85811424255371, -11.287406921386719, -5.716697692871094, -0.14599227905273438, 5.424716949462891, 10.995424270629883, 16.566131591796875, 22.1368408203125, 27.707548141479492, 33.278255462646484, 38.84896469116211, 44.41967010498047, 49.990379333496094, 55.56108856201172, 61.13179397583008, 66.70249938964844, 72.27320861816406, 77.84391784667969, 83.41462707519531, 88.98533630371094, 94.55604553222656, 100.12675476074219, 105.69746398925781, 111.26817321777344, 116.83887481689453, 122.40958404541016, 127.98029327392578, 133.55099487304688, 139.1217041015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 10.0, 10.0, 15.0, 24.0, 15.0, 22.0, 24.0, 23.0, 42.0, 33.0, 35.0, 44.0, 55.0, 49.0, 51.0, 61.0, 46.0, 43.0, 60.0, 54.0, 39.0, 34.0, 33.0, 38.0, 29.0, 21.0, 19.0, 16.0, 8.0, 15.0, 9.0, 3.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.903024673461914, -26.82782554626465, -25.752626419067383, -24.677427291870117, -23.60222816467285, -22.527029037475586, -21.451828002929688, -20.376628875732422, -19.301429748535156, -18.22623062133789, -17.151031494140625, -16.07583236694336, -15.000633239746094, -13.925434112548828, -12.850234031677246, -11.77503490447998, -10.699836730957031, -9.624637603759766, -8.5494384765625, -7.474238872528076, -6.3990397453308105, -5.323840618133545, -4.248641014099121, -3.1734418869018555, -2.09824275970459, -1.0230435132980347, 0.05215573310852051, 1.1273550987243652, 2.202554225921631, 3.2777533531188965, 4.35295295715332, 5.428152084350586, 6.503349304199219, 7.578548431396484, 8.65374755859375, 9.728946685791016, 10.804145812988281, 11.879344940185547, 12.954545021057129, 14.029744148254395, 15.10494327545166, 16.180143356323242, 17.255342483520508, 18.330541610717773, 19.40574073791504, 20.480939865112305, 21.55613899230957, 22.631338119506836, 23.7065372467041, 24.781736373901367, 25.856935501098633, 26.9321346282959, 28.007333755493164, 29.08253288269043, 30.157733917236328, 31.232933044433594, 32.30813217163086, 33.383331298828125, 34.45853042602539, 35.533729553222656, 36.60892868041992, 37.68412780761719, 38.75932693481445, 39.83452606201172, 40.909725189208984]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 13.0, 7.0, 10.0, 15.0, 22.0, 32.0, 41.0, 80.0, 96.0, 174.0, 268.0, 457.0, 785.0, 1303.0, 2575.0, 5307.0, 11247.0, 25854.0, 63760.0, 173700.0, 379403.0, 236384.0, 85368.0, 33565.0, 14464.0, 6566.0, 3266.0, 1600.0, 869.0, 499.0, 278.0, 176.0, 117.0, 79.0, 45.0, 32.0, 30.0, 18.0, 9.0, 12.0, 3.0, 6.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.48529052734375, -4.3104248046875, -4.13555908203125, -3.960693359375, -3.78582763671875, -3.6109619140625, -3.43609619140625, -3.26123046875, -3.08636474609375, -2.9114990234375, -2.73663330078125, -2.561767578125, -2.38690185546875, -2.2120361328125, -2.03717041015625, -1.8623046875, -1.68743896484375, -1.5125732421875, -1.33770751953125, -1.162841796875, -0.98797607421875, -0.8131103515625, -0.63824462890625, -0.46337890625, -0.28851318359375, -0.1136474609375, 0.06121826171875, 0.236083984375, 0.41094970703125, 0.5858154296875, 0.76068115234375, 0.935546875, 1.11041259765625, 1.2852783203125, 1.46014404296875, 1.635009765625, 1.80987548828125, 1.9847412109375, 2.15960693359375, 2.33447265625, 2.50933837890625, 2.6842041015625, 2.85906982421875, 3.033935546875, 3.20880126953125, 3.3836669921875, 3.55853271484375, 3.7333984375, 3.90826416015625, 4.0831298828125, 4.25799560546875, 4.432861328125, 4.60772705078125, 4.7825927734375, 4.95745849609375, 5.13232421875, 5.30718994140625, 5.4820556640625, 5.65692138671875, 5.831787109375, 6.00665283203125, 6.1815185546875, 6.35638427734375, 6.53125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 14.0, 11.0, 16.0, 16.0, 23.0, 27.0, 35.0, 26.0, 35.0, 49.0, 56.0, 61.0, 56.0, 59.0, 56.0, 60.0, 46.0, 43.0, 59.0, 34.0, 33.0, 33.0, 24.0, 26.0, 24.0, 19.0, 13.0, 10.0, 6.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5234375, -3.4173583984375, -3.311279296875, -3.2052001953125, -3.09912109375, -2.9930419921875, -2.886962890625, -2.7808837890625, -2.6748046875, -2.5687255859375, -2.462646484375, -2.3565673828125, -2.25048828125, -2.1444091796875, -2.038330078125, -1.9322509765625, -1.826171875, -1.7200927734375, -1.614013671875, -1.5079345703125, -1.40185546875, -1.2957763671875, -1.189697265625, -1.0836181640625, -0.9775390625, -0.8714599609375, -0.765380859375, -0.6593017578125, -0.55322265625, -0.4471435546875, -0.341064453125, -0.2349853515625, -0.12890625, -0.0228271484375, 0.083251953125, 0.1893310546875, 0.29541015625, 0.4014892578125, 0.507568359375, 0.6136474609375, 0.7197265625, 0.8258056640625, 0.931884765625, 1.0379638671875, 1.14404296875, 1.2501220703125, 1.356201171875, 1.4622802734375, 1.568359375, 1.6744384765625, 1.780517578125, 1.8865966796875, 1.99267578125, 2.0987548828125, 2.204833984375, 2.3109130859375, 2.4169921875, 2.5230712890625, 2.629150390625, 2.7352294921875, 2.84130859375, 2.9473876953125, 3.053466796875, 3.1595458984375, 3.265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 8.0, 12.0, 21.0, 27.0, 47.0, 50.0, 81.0, 146.0, 226.0, 382.0, 700.0, 1330.0, 3400.0, 15471.0, 171471.0, 786898.0, 55985.0, 7634.0, 2235.0, 977.0, 569.0, 317.0, 183.0, 121.0, 90.0, 38.0, 39.0, 27.0, 10.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8671875, -13.3770751953125, -12.886962890625, -12.3968505859375, -11.90673828125, -11.4166259765625, -10.926513671875, -10.4364013671875, -9.9462890625, -9.4561767578125, -8.966064453125, -8.4759521484375, -7.98583984375, -7.4957275390625, -7.005615234375, -6.5155029296875, -6.025390625, -5.5352783203125, -5.045166015625, -4.5550537109375, -4.06494140625, -3.5748291015625, -3.084716796875, -2.5946044921875, -2.1044921875, -1.6143798828125, -1.124267578125, -0.6341552734375, -0.14404296875, 0.3460693359375, 0.836181640625, 1.3262939453125, 1.81640625, 2.3065185546875, 2.796630859375, 3.2867431640625, 3.77685546875, 4.2669677734375, 4.757080078125, 5.2471923828125, 5.7373046875, 6.2274169921875, 6.717529296875, 7.2076416015625, 7.69775390625, 8.1878662109375, 8.677978515625, 9.1680908203125, 9.658203125, 10.1483154296875, 10.638427734375, 11.1285400390625, 11.61865234375, 12.1087646484375, 12.598876953125, 13.0889892578125, 13.5791015625, 14.0692138671875, 14.559326171875, 15.0494384765625, 15.53955078125, 16.0296630859375, 16.519775390625, 17.0098876953125, 17.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 7.0, 12.0, 9.0, 12.0, 15.0, 19.0, 17.0, 22.0, 39.0, 31.0, 49.0, 47.0, 44.0, 62.0, 57.0, 66.0, 54.0, 74.0, 48.0, 48.0, 41.0, 46.0, 34.0, 31.0, 17.0, 26.0, 16.0, 13.0, 5.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8671875, -15.4322509765625, -14.997314453125, -14.5623779296875, -14.12744140625, -13.6925048828125, -13.257568359375, -12.8226318359375, -12.3876953125, -11.9527587890625, -11.517822265625, -11.0828857421875, -10.64794921875, -10.2130126953125, -9.778076171875, -9.3431396484375, -8.908203125, -8.4732666015625, -8.038330078125, -7.6033935546875, -7.16845703125, -6.7335205078125, -6.298583984375, -5.8636474609375, -5.4287109375, -4.9937744140625, -4.558837890625, -4.1239013671875, -3.68896484375, -3.2540283203125, -2.819091796875, -2.3841552734375, -1.94921875, -1.5142822265625, -1.079345703125, -0.6444091796875, -0.20947265625, 0.2254638671875, 0.660400390625, 1.0953369140625, 1.5302734375, 1.9652099609375, 2.400146484375, 2.8350830078125, 3.27001953125, 3.7049560546875, 4.139892578125, 4.5748291015625, 5.009765625, 5.4447021484375, 5.879638671875, 6.3145751953125, 6.74951171875, 7.1844482421875, 7.619384765625, 8.0543212890625, 8.4892578125, 8.9241943359375, 9.359130859375, 9.7940673828125, 10.22900390625, 10.6639404296875, 11.098876953125, 11.5338134765625, 11.96875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 2.0, 15.0, 9.0, 9.0, 16.0, 23.0, 42.0, 60.0, 97.0, 188.0, 490.0, 1572.0, 9505.0, 930569.0, 100475.0, 3807.0, 928.0, 329.0, 151.0, 89.0, 45.0, 27.0, 20.0, 14.0, 11.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.90625, -11.51953125, -11.1328125, -10.74609375, -10.359375, -9.97265625, -9.5859375, -9.19921875, -8.8125, -8.42578125, -8.0390625, -7.65234375, -7.265625, -6.87890625, -6.4921875, -6.10546875, -5.71875, -5.33203125, -4.9453125, -4.55859375, -4.171875, -3.78515625, -3.3984375, -3.01171875, -2.625, -2.23828125, -1.8515625, -1.46484375, -1.078125, -0.69140625, -0.3046875, 0.08203125, 0.46875, 0.85546875, 1.2421875, 1.62890625, 2.015625, 2.40234375, 2.7890625, 3.17578125, 3.5625, 3.94921875, 4.3359375, 4.72265625, 5.109375, 5.49609375, 5.8828125, 6.26953125, 6.65625, 7.04296875, 7.4296875, 7.81640625, 8.203125, 8.58984375, 8.9765625, 9.36328125, 9.75, 10.13671875, 10.5234375, 10.91015625, 11.296875, 11.68359375, 12.0703125, 12.45703125, 12.84375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 4.0, 5.0, 7.0, 14.0, 26.0, 28.0, 43.0, 83.0, 138.0, 204.0, 172.0, 79.0, 66.0, 32.0, 29.0, 12.0, 16.0, 10.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009741783142089844, -0.0009330585598945618, -0.0008919388055801392, -0.0008508190512657166, -0.0008096992969512939, -0.0007685795426368713, -0.0007274597883224487, -0.0006863400340080261, -0.0006452202796936035, -0.0006041005253791809, -0.0005629807710647583, -0.0005218610167503357, -0.0004807412624359131, -0.0004396215081214905, -0.00039850175380706787, -0.00035738199949264526, -0.00031626224517822266, -0.00027514249086380005, -0.00023402273654937744, -0.00019290298223495483, -0.00015178322792053223, -0.00011066347360610962, -6.954371929168701e-05, -2.8423964977264404e-05, 1.2695789337158203e-05, 5.381554365158081e-05, 9.493529796600342e-05, 0.00013605505228042603, 0.00017717480659484863, 0.00021829456090927124, 0.00025941431522369385, 0.00030053406953811646, 0.00034165382385253906, 0.00038277357816696167, 0.0004238933324813843, 0.0004650130867958069, 0.0005061328411102295, 0.0005472525954246521, 0.0005883723497390747, 0.0006294921040534973, 0.0006706118583679199, 0.0007117316126823425, 0.0007528513669967651, 0.0007939711213111877, 0.0008350908756256104, 0.000876210629940033, 0.0009173303842544556, 0.0009584501385688782, 0.0009995698928833008, 0.0010406896471977234, 0.001081809401512146, 0.0011229291558265686, 0.0011640489101409912, 0.0012051686644554138, 0.0012462884187698364, 0.001287408173084259, 0.0013285279273986816, 0.0013696476817131042, 0.0014107674360275269, 0.0014518871903419495, 0.001493006944656372, 0.0015341266989707947, 0.0015752464532852173, 0.00161636620759964, 0.0016574859619140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 8.0, 10.0, 8.0, 8.0, 8.0, 11.0, 18.0, 10.0, 24.0, 20.0, 33.0, 24.0, 40.0, 88.0, 108.0, 152.0, 259.0, 458.0, 907.0, 1871.0, 4601.0, 15886.0, 93619.0, 758519.0, 141414.0, 20055.0, 5772.0, 2209.0, 992.0, 517.0, 284.0, 167.0, 117.0, 69.0, 46.0, 42.0, 36.0, 27.0, 17.0, 14.0, 16.0, 12.0, 14.0, 5.0, 16.0, 10.0, 2.0, 5.0, 5.0, 2.0, 4.0, 2.0], "bins": [-4.50390625, -4.377349853515625, -4.25079345703125, -4.124237060546875, -3.9976806640625, -3.871124267578125, -3.74456787109375, -3.618011474609375, -3.491455078125, -3.364898681640625, -3.23834228515625, -3.111785888671875, -2.9852294921875, -2.858673095703125, -2.73211669921875, -2.605560302734375, -2.47900390625, -2.352447509765625, -2.22589111328125, -2.099334716796875, -1.9727783203125, -1.846221923828125, -1.71966552734375, -1.593109130859375, -1.466552734375, -1.339996337890625, -1.21343994140625, -1.086883544921875, -0.9603271484375, -0.833770751953125, -0.70721435546875, -0.580657958984375, -0.4541015625, -0.327545166015625, -0.20098876953125, -0.074432373046875, 0.0521240234375, 0.178680419921875, 0.30523681640625, 0.431793212890625, 0.558349609375, 0.684906005859375, 0.81146240234375, 0.938018798828125, 1.0645751953125, 1.191131591796875, 1.31768798828125, 1.444244384765625, 1.57080078125, 1.697357177734375, 1.82391357421875, 1.950469970703125, 2.0770263671875, 2.203582763671875, 2.33013916015625, 2.456695556640625, 2.583251953125, 2.709808349609375, 2.83636474609375, 2.962921142578125, 3.0894775390625, 3.216033935546875, 3.34259033203125, 3.469146728515625, 3.595703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 8.0, 4.0, 11.0, 18.0, 33.0, 38.0, 87.0, 112.0, 182.0, 151.0, 133.0, 83.0, 41.0, 30.0, 17.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.9453125, -6.752197265625, -6.55908203125, -6.365966796875, -6.1728515625, -5.979736328125, -5.78662109375, -5.593505859375, -5.400390625, -5.207275390625, -5.01416015625, -4.821044921875, -4.6279296875, -4.434814453125, -4.24169921875, -4.048583984375, -3.85546875, -3.662353515625, -3.46923828125, -3.276123046875, -3.0830078125, -2.889892578125, -2.69677734375, -2.503662109375, -2.310546875, -2.117431640625, -1.92431640625, -1.731201171875, -1.5380859375, -1.344970703125, -1.15185546875, -0.958740234375, -0.765625, -0.572509765625, -0.37939453125, -0.186279296875, 0.0068359375, 0.199951171875, 0.39306640625, 0.586181640625, 0.779296875, 0.972412109375, 1.16552734375, 1.358642578125, 1.5517578125, 1.744873046875, 1.93798828125, 2.131103515625, 2.32421875, 2.517333984375, 2.71044921875, 2.903564453125, 3.0966796875, 3.289794921875, 3.48291015625, 3.676025390625, 3.869140625, 4.062255859375, 4.25537109375, 4.448486328125, 4.6416015625, 4.834716796875, 5.02783203125, 5.220947265625, 5.4140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 6.0, 3.0, 9.0, 14.0, 32.0, 84.0, 202.0, 354.0, 164.0, 68.0, 27.0, 6.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.1141357421875, -103.4736099243164, -99.83309173583984, -96.19256591796875, -92.55204010009766, -88.91151428222656, -85.27099609375, -81.6304702758789, -77.98994445800781, -74.34941864013672, -70.70890045166016, -67.06837463378906, -63.42784881591797, -59.78732681274414, -56.14680480957031, -52.50627899169922, -48.865760803222656, -45.22523880004883, -41.584712982177734, -37.944190979003906, -34.30366516113281, -30.663143157958984, -27.022621154785156, -23.382097244262695, -19.741573333740234, -16.101049423217773, -12.460526466369629, -8.820003509521484, -5.179479598999023, -1.5389556884765625, 2.1015663146972656, 5.742090225219727, 9.382606506347656, 13.023130416870117, 16.663654327392578, 20.304176330566406, 23.944700241088867, 27.585224151611328, 31.225746154785156, 34.86627197265625, 38.50679397583008, 42.147315979003906, 45.787841796875, 49.42836380004883, 53.068885803222656, 56.70941162109375, 60.34993362426758, 63.990455627441406, 67.6309814453125, 71.2715072631836, 74.91202545166016, 78.55255126953125, 82.19307708740234, 85.83360290527344, 89.47412109375, 93.1146469116211, 96.75517272949219, 100.39569854736328, 104.03621673583984, 107.67674255371094, 111.31726837158203, 114.95779418945312, 118.59831237792969, 122.23883819580078, 125.87935638427734]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 5.0, 25.0, 32.0, 42.0, 48.0, 49.0, 66.0, 90.0, 117.0, 128.0, 63.0, 59.0, 52.0, 51.0, 38.0, 33.0, 33.0, 19.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-112.49517822265625, -109.80683898925781, -107.11849212646484, -104.4301528930664, -101.74181365966797, -99.053466796875, -96.36512756347656, -93.67678833007812, -90.98844909667969, -88.30010986328125, -85.61176300048828, -82.92342376708984, -80.2350845336914, -77.54673767089844, -74.8583984375, -72.17005920410156, -69.4817123413086, -66.79337310791016, -64.10502624511719, -61.41668701171875, -58.72834777832031, -56.04000473022461, -53.351661682128906, -50.66332244873047, -47.974979400634766, -45.28663635253906, -42.598297119140625, -39.90995407104492, -37.22161102294922, -34.53327178955078, -31.844928741455078, -29.156587600708008, -26.468246459960938, -23.779905319213867, -21.091564178466797, -18.403221130371094, -15.714879989624023, -13.026538848876953, -10.33819580078125, -7.64985466003418, -4.961513519287109, -2.273171901702881, 0.41516971588134766, 3.1035118103027344, 5.791852951049805, 8.480194091796875, 11.168537139892578, 13.856878280639648, 16.54521942138672, 19.23356056213379, 21.92190170288086, 24.610244750976562, 27.298585891723633, 29.986927032470703, 32.675270080566406, 35.363609313964844, 38.05195236206055, 40.74029541015625, 43.42863464355469, 46.11697769165039, 48.805320739746094, 51.49365997314453, 54.182003021240234, 56.87034606933594, 59.558685302734375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 16.0, 27.0, 39.0, 92.0, 229.0, 663.0, 3186.0, 35040.0, 3710367.0, 430223.0, 11244.0, 2084.0, 615.0, 257.0, 86.0, 50.0, 12.0, 11.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.2501220703125, -13.851806640625, -13.4534912109375, -13.05517578125, -12.6568603515625, -12.258544921875, -11.8602294921875, -11.4619140625, -11.0635986328125, -10.665283203125, -10.2669677734375, -9.86865234375, -9.4703369140625, -9.072021484375, -8.6737060546875, -8.275390625, -7.8770751953125, -7.478759765625, -7.0804443359375, -6.68212890625, -6.2838134765625, -5.885498046875, -5.4871826171875, -5.0888671875, -4.6905517578125, -4.292236328125, -3.8939208984375, -3.49560546875, -3.0972900390625, -2.698974609375, -2.3006591796875, -1.90234375, -1.5040283203125, -1.105712890625, -0.7073974609375, -0.30908203125, 0.0892333984375, 0.487548828125, 0.8858642578125, 1.2841796875, 1.6824951171875, 2.080810546875, 2.4791259765625, 2.87744140625, 3.2757568359375, 3.674072265625, 4.0723876953125, 4.470703125, 4.8690185546875, 5.267333984375, 5.6656494140625, 6.06396484375, 6.4622802734375, 6.860595703125, 7.2589111328125, 7.6572265625, 8.0555419921875, 8.453857421875, 8.8521728515625, 9.25048828125, 9.6488037109375, 10.047119140625, 10.4454345703125, 10.84375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 23.0, 34.0, 42.0, 88.0, 105.0, 128.0, 147.0, 123.0, 114.0, 76.0, 48.0, 36.0, 20.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.359375, -11.12005615234375, -10.8807373046875, -10.64141845703125, -10.402099609375, -10.16278076171875, -9.9234619140625, -9.68414306640625, -9.44482421875, -9.20550537109375, -8.9661865234375, -8.72686767578125, -8.487548828125, -8.24822998046875, -8.0089111328125, -7.76959228515625, -7.5302734375, -7.29095458984375, -7.0516357421875, -6.81231689453125, -6.572998046875, -6.33367919921875, -6.0943603515625, -5.85504150390625, -5.61572265625, -5.37640380859375, -5.1370849609375, -4.89776611328125, -4.658447265625, -4.41912841796875, -4.1798095703125, -3.94049072265625, -3.701171875, -3.46185302734375, -3.2225341796875, -2.98321533203125, -2.743896484375, -2.50457763671875, -2.2652587890625, -2.02593994140625, -1.78662109375, -1.54730224609375, -1.3079833984375, -1.06866455078125, -0.829345703125, -0.59002685546875, -0.3507080078125, -0.11138916015625, 0.1279296875, 0.36724853515625, 0.6065673828125, 0.84588623046875, 1.085205078125, 1.32452392578125, 1.5638427734375, 1.80316162109375, 2.04248046875, 2.28179931640625, 2.5211181640625, 2.76043701171875, 2.999755859375, 3.23907470703125, 3.4783935546875, 3.71771240234375, 3.95703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 19.0, 34.0, 49.0, 117.0, 198.0, 478.0, 1335.0, 5497.0, 135761.0, 4012635.0, 32675.0, 3332.0, 1124.0, 513.0, 246.0, 126.0, 53.0, 24.0, 15.0, 12.0, 10.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.525146484375, -18.95654296875, -18.387939453125, -17.8193359375, -17.250732421875, -16.68212890625, -16.113525390625, -15.544921875, -14.976318359375, -14.40771484375, -13.839111328125, -13.2705078125, -12.701904296875, -12.13330078125, -11.564697265625, -10.99609375, -10.427490234375, -9.85888671875, -9.290283203125, -8.7216796875, -8.153076171875, -7.58447265625, -7.015869140625, -6.447265625, -5.878662109375, -5.31005859375, -4.741455078125, -4.1728515625, -3.604248046875, -3.03564453125, -2.467041015625, -1.8984375, -1.329833984375, -0.76123046875, -0.192626953125, 0.3759765625, 0.944580078125, 1.51318359375, 2.081787109375, 2.650390625, 3.218994140625, 3.78759765625, 4.356201171875, 4.9248046875, 5.493408203125, 6.06201171875, 6.630615234375, 7.19921875, 7.767822265625, 8.33642578125, 8.905029296875, 9.4736328125, 10.042236328125, 10.61083984375, 11.179443359375, 11.748046875, 12.316650390625, 12.88525390625, 13.453857421875, 14.0224609375, 14.591064453125, 15.15966796875, 15.728271484375, 16.296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 9.0, 11.0, 13.0, 21.0, 44.0, 90.0, 160.0, 484.0, 1370.0, 1205.0, 387.0, 141.0, 70.0, 29.0, 18.0, 12.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.73687744140625, -6.3370361328125, -5.93719482421875, -5.537353515625, -5.13751220703125, -4.7376708984375, -4.33782958984375, -3.93798828125, -3.53814697265625, -3.1383056640625, -2.73846435546875, -2.338623046875, -1.93878173828125, -1.5389404296875, -1.13909912109375, -0.7392578125, -0.33941650390625, 0.0604248046875, 0.46026611328125, 0.860107421875, 1.25994873046875, 1.6597900390625, 2.05963134765625, 2.45947265625, 2.85931396484375, 3.2591552734375, 3.65899658203125, 4.058837890625, 4.45867919921875, 4.8585205078125, 5.25836181640625, 5.658203125, 6.05804443359375, 6.4578857421875, 6.85772705078125, 7.257568359375, 7.65740966796875, 8.0572509765625, 8.45709228515625, 8.85693359375, 9.25677490234375, 9.6566162109375, 10.05645751953125, 10.456298828125, 10.85614013671875, 11.2559814453125, 11.65582275390625, 12.0556640625, 12.45550537109375, 12.8553466796875, 13.25518798828125, 13.655029296875, 14.05487060546875, 14.4547119140625, 14.85455322265625, 15.25439453125, 15.65423583984375, 16.0540771484375, 16.45391845703125, 16.853759765625, 17.25360107421875, 17.6534423828125, 18.05328369140625, 18.453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 18.0, 50.0, 157.0, 299.0, 268.0, 119.0, 27.0, 11.0, 12.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-153.31689453125, -149.81695556640625, -146.3170166015625, -142.8170928955078, -139.31715393066406, -135.8172149658203, -132.31727600097656, -128.81735229492188, -125.31741333007812, -121.81747436523438, -118.31754302978516, -114.8176040649414, -111.31767272949219, -107.81773376464844, -104.31779479980469, -100.81786346435547, -97.31792449951172, -93.81798553466797, -90.31805419921875, -86.818115234375, -83.31818389892578, -79.81824493408203, -76.31831359863281, -72.81837463378906, -69.31843566894531, -65.81849670410156, -62.318565368652344, -58.818626403808594, -55.318695068359375, -51.818756103515625, -48.31882095336914, -44.818885803222656, -41.31896209716797, -37.819026947021484, -34.319091796875, -30.819154739379883, -27.3192195892334, -23.819284439086914, -20.319347381591797, -16.819412231445312, -13.319477081298828, -9.819541931152344, -6.319605827331543, -2.819669723510742, 0.6802654266357422, 4.180200576782227, 7.680137634277344, 11.180072784423828, 14.680007934570312, 18.179943084716797, 21.67987823486328, 25.1798152923584, 28.679750442504883, 32.1796875, 35.679622650146484, 39.17955780029297, 42.67949295043945, 46.17942810058594, 49.67936325073242, 53.179298400878906, 56.679237365722656, 60.179168701171875, 63.679107666015625, 67.17904663085938, 70.6789779663086]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 11.0, 16.0, 21.0, 32.0, 40.0, 64.0, 68.0, 100.0, 104.0, 119.0, 111.0, 72.0, 72.0, 59.0, 37.0, 33.0, 19.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.76144027709961, -46.77614212036133, -44.79084396362305, -42.805545806884766, -40.820247650146484, -38.8349494934082, -36.84965515136719, -34.864356994628906, -32.879058837890625, -30.893760681152344, -28.908462524414062, -26.92316436767578, -24.9378662109375, -22.95256805419922, -20.96727180480957, -18.98197364807129, -16.996673583984375, -15.011375427246094, -13.026077270507812, -11.040780067443848, -9.055481910705566, -7.070183753967285, -5.08488655090332, -3.099588394165039, -1.1142902374267578, 0.8710076808929443, 2.8563055992126465, 4.8416032791137695, 6.826901435852051, 8.812199592590332, 10.797496795654297, 12.782794952392578, 14.768096923828125, 16.753395080566406, 18.738693237304688, 20.72399139404297, 22.70928955078125, 24.69458770751953, 26.67988395690918, 28.66518211364746, 30.650480270385742, 32.63577651977539, 34.62107467651367, 36.60637283325195, 38.591670989990234, 40.576969146728516, 42.5622673034668, 44.54756546020508, 46.53286361694336, 48.51816177368164, 50.50345993041992, 52.4887580871582, 54.474056243896484, 56.459354400634766, 58.44464874267578, 60.42994689941406, 62.415245056152344, 64.40054321289062, 66.3858413696289, 68.37113952636719, 70.35643768310547, 72.34173583984375, 74.32703399658203, 76.31233215332031, 78.2976303100586]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 7.0, 11.0, 9.0, 8.0, 17.0, 21.0, 29.0, 33.0, 69.0, 97.0, 151.0, 292.0, 587.0, 1503.0, 4737.0, 19670.0, 120929.0, 586672.0, 263343.0, 38273.0, 8016.0, 2317.0, 862.0, 335.0, 142.0, 113.0, 75.0, 52.0, 41.0, 36.0, 22.0, 16.0, 14.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.1307373046875, -7.847412109375, -7.5640869140625, -7.28076171875, -6.9974365234375, -6.714111328125, -6.4307861328125, -6.1474609375, -5.8641357421875, -5.580810546875, -5.2974853515625, -5.01416015625, -4.7308349609375, -4.447509765625, -4.1641845703125, -3.880859375, -3.5975341796875, -3.314208984375, -3.0308837890625, -2.74755859375, -2.4642333984375, -2.180908203125, -1.8975830078125, -1.6142578125, -1.3309326171875, -1.047607421875, -0.7642822265625, -0.48095703125, -0.1976318359375, 0.085693359375, 0.3690185546875, 0.65234375, 0.9356689453125, 1.218994140625, 1.5023193359375, 1.78564453125, 2.0689697265625, 2.352294921875, 2.6356201171875, 2.9189453125, 3.2022705078125, 3.485595703125, 3.7689208984375, 4.05224609375, 4.3355712890625, 4.618896484375, 4.9022216796875, 5.185546875, 5.4688720703125, 5.752197265625, 6.0355224609375, 6.31884765625, 6.6021728515625, 6.885498046875, 7.1688232421875, 7.4521484375, 7.7354736328125, 8.018798828125, 8.3021240234375, 8.58544921875, 8.8687744140625, 9.152099609375, 9.4354248046875, 9.71875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 25.0, 41.0, 52.0, 91.0, 95.0, 127.0, 144.0, 126.0, 96.0, 87.0, 56.0, 35.0, 16.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.5234375, -12.269866943359375, -12.01629638671875, -11.762725830078125, -11.5091552734375, -11.255584716796875, -11.00201416015625, -10.748443603515625, -10.494873046875, -10.241302490234375, -9.98773193359375, -9.734161376953125, -9.4805908203125, -9.227020263671875, -8.97344970703125, -8.719879150390625, -8.46630859375, -8.212738037109375, -7.95916748046875, -7.705596923828125, -7.4520263671875, -7.198455810546875, -6.94488525390625, -6.691314697265625, -6.437744140625, -6.184173583984375, -5.93060302734375, -5.677032470703125, -5.4234619140625, -5.169891357421875, -4.91632080078125, -4.662750244140625, -4.4091796875, -4.155609130859375, -3.90203857421875, -3.648468017578125, -3.3948974609375, -3.141326904296875, -2.88775634765625, -2.634185791015625, -2.380615234375, -2.127044677734375, -1.87347412109375, -1.619903564453125, -1.3663330078125, -1.112762451171875, -0.85919189453125, -0.605621337890625, -0.35205078125, -0.098480224609375, 0.15509033203125, 0.408660888671875, 0.6622314453125, 0.915802001953125, 1.16937255859375, 1.422943115234375, 1.676513671875, 1.930084228515625, 2.18365478515625, 2.437225341796875, 2.6907958984375, 2.944366455078125, 3.19793701171875, 3.451507568359375, 3.705078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 6.0, 9.0, 9.0, 11.0, 21.0, 28.0, 35.0, 52.0, 69.0, 111.0, 180.0, 337.0, 640.0, 1494.0, 4226.0, 14749.0, 74557.0, 575974.0, 307974.0, 50858.0, 11149.0, 3404.0, 1276.0, 534.0, 276.0, 170.0, 130.0, 66.0, 59.0, 33.0, 25.0, 20.0, 18.0, 11.0, 16.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.2578125, -8.9998779296875, -8.741943359375, -8.4840087890625, -8.22607421875, -7.9681396484375, -7.710205078125, -7.4522705078125, -7.1943359375, -6.9364013671875, -6.678466796875, -6.4205322265625, -6.16259765625, -5.9046630859375, -5.646728515625, -5.3887939453125, -5.130859375, -4.8729248046875, -4.614990234375, -4.3570556640625, -4.09912109375, -3.8411865234375, -3.583251953125, -3.3253173828125, -3.0673828125, -2.8094482421875, -2.551513671875, -2.2935791015625, -2.03564453125, -1.7777099609375, -1.519775390625, -1.2618408203125, -1.00390625, -0.7459716796875, -0.488037109375, -0.2301025390625, 0.02783203125, 0.2857666015625, 0.543701171875, 0.8016357421875, 1.0595703125, 1.3175048828125, 1.575439453125, 1.8333740234375, 2.09130859375, 2.3492431640625, 2.607177734375, 2.8651123046875, 3.123046875, 3.3809814453125, 3.638916015625, 3.8968505859375, 4.15478515625, 4.4127197265625, 4.670654296875, 4.9285888671875, 5.1865234375, 5.4444580078125, 5.702392578125, 5.9603271484375, 6.21826171875, 6.4761962890625, 6.734130859375, 6.9920654296875, 7.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 7.0, 9.0, 14.0, 15.0, 20.0, 24.0, 21.0, 42.0, 30.0, 40.0, 37.0, 60.0, 52.0, 68.0, 56.0, 49.0, 70.0, 61.0, 53.0, 49.0, 48.0, 37.0, 24.0, 27.0, 16.0, 13.0, 13.0, 5.0, 8.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.5322265625, -9.142578125, -8.7529296875, -8.36328125, -7.9736328125, -7.583984375, -7.1943359375, -6.8046875, -6.4150390625, -6.025390625, -5.6357421875, -5.24609375, -4.8564453125, -4.466796875, -4.0771484375, -3.6875, -3.2978515625, -2.908203125, -2.5185546875, -2.12890625, -1.7392578125, -1.349609375, -0.9599609375, -0.5703125, -0.1806640625, 0.208984375, 0.5986328125, 0.98828125, 1.3779296875, 1.767578125, 2.1572265625, 2.546875, 2.9365234375, 3.326171875, 3.7158203125, 4.10546875, 4.4951171875, 4.884765625, 5.2744140625, 5.6640625, 6.0537109375, 6.443359375, 6.8330078125, 7.22265625, 7.6123046875, 8.001953125, 8.3916015625, 8.78125, 9.1708984375, 9.560546875, 9.9501953125, 10.33984375, 10.7294921875, 11.119140625, 11.5087890625, 11.8984375, 12.2880859375, 12.677734375, 13.0673828125, 13.45703125, 13.8466796875, 14.236328125, 14.6259765625, 15.015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 15.0, 15.0, 43.0, 61.0, 130.0, 298.0, 848.0, 3058.0, 14852.0, 120479.0, 790388.0, 101093.0, 13104.0, 2748.0, 809.0, 293.0, 134.0, 61.0, 36.0, 29.0, 15.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.839691162109375, -2.73992919921875, -2.640167236328125, -2.5404052734375, -2.440643310546875, -2.34088134765625, -2.241119384765625, -2.141357421875, -2.041595458984375, -1.94183349609375, -1.842071533203125, -1.7423095703125, -1.642547607421875, -1.54278564453125, -1.443023681640625, -1.34326171875, -1.243499755859375, -1.14373779296875, -1.043975830078125, -0.9442138671875, -0.844451904296875, -0.74468994140625, -0.644927978515625, -0.545166015625, -0.445404052734375, -0.34564208984375, -0.245880126953125, -0.1461181640625, -0.046356201171875, 0.05340576171875, 0.153167724609375, 0.2529296875, 0.352691650390625, 0.45245361328125, 0.552215576171875, 0.6519775390625, 0.751739501953125, 0.85150146484375, 0.951263427734375, 1.051025390625, 1.150787353515625, 1.25054931640625, 1.350311279296875, 1.4500732421875, 1.549835205078125, 1.64959716796875, 1.749359130859375, 1.84912109375, 1.948883056640625, 2.04864501953125, 2.148406982421875, 2.2481689453125, 2.347930908203125, 2.44769287109375, 2.547454833984375, 2.647216796875, 2.746978759765625, 2.84674072265625, 2.946502685546875, 3.0462646484375, 3.146026611328125, 3.24578857421875, 3.345550537109375, 3.4453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 5.0, 5.0, 14.0, 17.0, 32.0, 52.0, 104.0, 167.0, 185.0, 162.0, 88.0, 62.0, 39.0, 24.0, 8.0, 2.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010976791381835938, -0.0010699033737182617, -0.0010421276092529297, -0.0010143518447875977, -0.0009865760803222656, -0.0009588003158569336, -0.0009310245513916016, -0.0009032487869262695, -0.0008754730224609375, -0.0008476972579956055, -0.0008199214935302734, -0.0007921457290649414, -0.0007643699645996094, -0.0007365942001342773, -0.0007088184356689453, -0.0006810426712036133, -0.0006532669067382812, -0.0006254911422729492, -0.0005977153778076172, -0.0005699396133422852, -0.0005421638488769531, -0.0005143880844116211, -0.00048661231994628906, -0.00045883655548095703, -0.000431060791015625, -0.00040328502655029297, -0.00037550926208496094, -0.0003477334976196289, -0.0003199577331542969, -0.00029218196868896484, -0.0002644062042236328, -0.00023663043975830078, -0.00020885467529296875, -0.00018107891082763672, -0.0001533031463623047, -0.00012552738189697266, -9.775161743164062e-05, -6.99758529663086e-05, -4.220008850097656e-05, -1.4424324035644531e-05, 1.33514404296875e-05, 4.112720489501953e-05, 6.890296936035156e-05, 9.66787338256836e-05, 0.00012445449829101562, 0.00015223026275634766, 0.0001800060272216797, 0.00020778179168701172, 0.00023555755615234375, 0.0002633333206176758, 0.0002911090850830078, 0.00031888484954833984, 0.0003466606140136719, 0.0003744363784790039, 0.00040221214294433594, 0.00042998790740966797, 0.000457763671875, 0.00048553943634033203, 0.0005133152008056641, 0.0005410909652709961, 0.0005688667297363281, 0.0005966424942016602, 0.0006244182586669922, 0.0006521940231323242, 0.0006799697875976562]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 18.0, 9.0, 19.0, 24.0, 41.0, 67.0, 103.0, 181.0, 349.0, 909.0, 2996.0, 11876.0, 74068.0, 696124.0, 225084.0, 28084.0, 5843.0, 1578.0, 552.0, 248.0, 149.0, 85.0, 38.0, 27.0, 27.0, 16.0, 10.0, 7.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.640625, -3.544189453125, -3.44775390625, -3.351318359375, -3.2548828125, -3.158447265625, -3.06201171875, -2.965576171875, -2.869140625, -2.772705078125, -2.67626953125, -2.579833984375, -2.4833984375, -2.386962890625, -2.29052734375, -2.194091796875, -2.09765625, -2.001220703125, -1.90478515625, -1.808349609375, -1.7119140625, -1.615478515625, -1.51904296875, -1.422607421875, -1.326171875, -1.229736328125, -1.13330078125, -1.036865234375, -0.9404296875, -0.843994140625, -0.74755859375, -0.651123046875, -0.5546875, -0.458251953125, -0.36181640625, -0.265380859375, -0.1689453125, -0.072509765625, 0.02392578125, 0.120361328125, 0.216796875, 0.313232421875, 0.40966796875, 0.506103515625, 0.6025390625, 0.698974609375, 0.79541015625, 0.891845703125, 0.98828125, 1.084716796875, 1.18115234375, 1.277587890625, 1.3740234375, 1.470458984375, 1.56689453125, 1.663330078125, 1.759765625, 1.856201171875, 1.95263671875, 2.049072265625, 2.1455078125, 2.241943359375, 2.33837890625, 2.434814453125, 2.53125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 3.0, 17.0, 20.0, 39.0, 63.0, 119.0, 166.0, 168.0, 146.0, 93.0, 58.0, 42.0, 26.0, 22.0, 9.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.538055419921875, -6.40032958984375, -6.262603759765625, -6.1248779296875, -5.987152099609375, -5.84942626953125, -5.711700439453125, -5.573974609375, -5.436248779296875, -5.29852294921875, -5.160797119140625, -5.0230712890625, -4.885345458984375, -4.74761962890625, -4.609893798828125, -4.47216796875, -4.334442138671875, -4.19671630859375, -4.058990478515625, -3.9212646484375, -3.783538818359375, -3.64581298828125, -3.508087158203125, -3.370361328125, -3.232635498046875, -3.09490966796875, -2.957183837890625, -2.8194580078125, -2.681732177734375, -2.54400634765625, -2.406280517578125, -2.2685546875, -2.130828857421875, -1.99310302734375, -1.855377197265625, -1.7176513671875, -1.579925537109375, -1.44219970703125, -1.304473876953125, -1.166748046875, -1.029022216796875, -0.89129638671875, -0.753570556640625, -0.6158447265625, -0.478118896484375, -0.34039306640625, -0.202667236328125, -0.06494140625, 0.072784423828125, 0.21051025390625, 0.348236083984375, 0.4859619140625, 0.623687744140625, 0.76141357421875, 0.899139404296875, 1.036865234375, 1.174591064453125, 1.31231689453125, 1.450042724609375, 1.5877685546875, 1.725494384765625, 1.86322021484375, 2.000946044921875, 2.138671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 29.0, 70.0, 152.0, 339.0, 212.0, 99.0, 40.0, 30.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.77525329589844, -81.92320251464844, -79.07115936279297, -76.21910858154297, -73.3670654296875, -70.5150146484375, -67.6629638671875, -64.81092071533203, -61.9588737487793, -59.10682678222656, -56.25477981567383, -53.402732849121094, -50.550682067871094, -47.698638916015625, -44.846588134765625, -41.99454116821289, -39.142494201660156, -36.29044723510742, -33.43840026855469, -30.58635139465332, -27.734304428100586, -24.88225746154785, -22.030208587646484, -19.17816162109375, -16.326114654541016, -13.474067687988281, -10.62201976776123, -7.76997184753418, -4.917924880981445, -2.065877914428711, 0.7861709594726562, 3.6382179260253906, 6.490257263183594, 9.342304229736328, 12.194352149963379, 15.04640007019043, 17.898447036743164, 20.7504940032959, 23.602542877197266, 26.45458984375, 29.306636810302734, 32.15868377685547, 35.0107307434082, 37.86277770996094, 40.71482849121094, 43.566871643066406, 46.418922424316406, 49.27096939086914, 52.123016357421875, 54.97506332397461, 57.827110290527344, 60.679161071777344, 63.53120422363281, 66.38325500488281, 69.23530578613281, 72.08734893798828, 74.93939208984375, 77.79144287109375, 80.64348602294922, 83.49553680419922, 86.34757995605469, 89.19963073730469, 92.05168151855469, 94.90372467041016, 97.75577545166016]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 14.0, 9.0, 10.0, 9.0, 11.0, 23.0, 15.0, 28.0, 26.0, 44.0, 37.0, 41.0, 41.0, 51.0, 85.0, 82.0, 92.0, 63.0, 42.0, 47.0, 42.0, 31.0, 20.0, 16.0, 20.0, 13.0, 21.0, 15.0, 7.0, 10.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.60091018676758, -48.99504852294922, -47.389190673828125, -45.783329010009766, -44.177467346191406, -42.57160949707031, -40.96574783325195, -39.359886169433594, -37.7540283203125, -36.14816665649414, -34.54230880737305, -32.93644714355469, -31.330585479736328, -29.7247257232666, -28.118865966796875, -26.513004302978516, -24.907142639160156, -23.30128288269043, -21.69542121887207, -20.089561462402344, -18.483699798583984, -16.877840042114258, -15.271980285644531, -13.666119575500488, -12.060258865356445, -10.454398155212402, -8.84853744506836, -7.242677688598633, -5.63681697845459, -4.030956268310547, -2.4250965118408203, -0.8192358016967773, 0.78662109375, 2.392481565475464, 3.9983420372009277, 5.6042022705078125, 7.2100629806518555, 8.815923690795898, 10.421783447265625, 12.027644157409668, 13.633504867553711, 15.239365577697754, 16.845226287841797, 18.451086044311523, 20.05694580078125, 21.66280746459961, 23.268667221069336, 24.874526977539062, 26.480388641357422, 28.08624839782715, 29.692110061645508, 31.297969818115234, 32.903831481933594, 34.50968933105469, 36.11555099487305, 37.721412658691406, 39.3272705078125, 40.93313217163086, 42.53899002075195, 44.14485168457031, 45.75071334838867, 47.35657501220703, 48.962432861328125, 50.568294525146484, 52.174156188964844]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 13.0, 13.0, 34.0, 82.0, 177.0, 425.0, 1510.0, 9274.0, 223088.0, 3855165.0, 94424.0, 7312.0, 1767.0, 618.0, 217.0, 88.0, 29.0, 11.0, 8.0, 12.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.8515625, -11.5260009765625, -11.200439453125, -10.8748779296875, -10.54931640625, -10.2237548828125, -9.898193359375, -9.5726318359375, -9.2470703125, -8.9215087890625, -8.595947265625, -8.2703857421875, -7.94482421875, -7.6192626953125, -7.293701171875, -6.9681396484375, -6.642578125, -6.3170166015625, -5.991455078125, -5.6658935546875, -5.34033203125, -5.0147705078125, -4.689208984375, -4.3636474609375, -4.0380859375, -3.7125244140625, -3.386962890625, -3.0614013671875, -2.73583984375, -2.4102783203125, -2.084716796875, -1.7591552734375, -1.43359375, -1.1080322265625, -0.782470703125, -0.4569091796875, -0.13134765625, 0.1942138671875, 0.519775390625, 0.8453369140625, 1.1708984375, 1.4964599609375, 1.822021484375, 2.1475830078125, 2.47314453125, 2.7987060546875, 3.124267578125, 3.4498291015625, 3.775390625, 4.1009521484375, 4.426513671875, 4.7520751953125, 5.07763671875, 5.4031982421875, 5.728759765625, 6.0543212890625, 6.3798828125, 6.7054443359375, 7.031005859375, 7.3565673828125, 7.68212890625, 8.0076904296875, 8.333251953125, 8.6588134765625, 8.984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 13.0, 37.0, 43.0, 60.0, 88.0, 105.0, 109.0, 131.0, 125.0, 86.0, 72.0, 59.0, 30.0, 21.0, 13.0, 5.0, 5.0, 1.0, 2.0], "bins": [-11.5625, -11.3408203125, -11.119140625, -10.8974609375, -10.67578125, -10.4541015625, -10.232421875, -10.0107421875, -9.7890625, -9.5673828125, -9.345703125, -9.1240234375, -8.90234375, -8.6806640625, -8.458984375, -8.2373046875, -8.015625, -7.7939453125, -7.572265625, -7.3505859375, -7.12890625, -6.9072265625, -6.685546875, -6.4638671875, -6.2421875, -6.0205078125, -5.798828125, -5.5771484375, -5.35546875, -5.1337890625, -4.912109375, -4.6904296875, -4.46875, -4.2470703125, -4.025390625, -3.8037109375, -3.58203125, -3.3603515625, -3.138671875, -2.9169921875, -2.6953125, -2.4736328125, -2.251953125, -2.0302734375, -1.80859375, -1.5869140625, -1.365234375, -1.1435546875, -0.921875, -0.7001953125, -0.478515625, -0.2568359375, -0.03515625, 0.1865234375, 0.408203125, 0.6298828125, 0.8515625, 1.0732421875, 1.294921875, 1.5166015625, 1.73828125, 1.9599609375, 2.181640625, 2.4033203125, 2.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 9.0, 3.0, 3.0, 12.0, 11.0, 20.0, 37.0, 28.0, 51.0, 77.0, 150.0, 290.0, 579.0, 1534.0, 5141.0, 21626.0, 215695.0, 3576679.0, 335056.0, 27649.0, 6167.0, 1897.0, 746.0, 310.0, 180.0, 97.0, 59.0, 39.0, 35.0, 26.0, 18.0, 10.0, 7.0, 9.0, 2.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.60546875, -7.38543701171875, -7.1654052734375, -6.94537353515625, -6.725341796875, -6.50531005859375, -6.2852783203125, -6.06524658203125, -5.84521484375, -5.62518310546875, -5.4051513671875, -5.18511962890625, -4.965087890625, -4.74505615234375, -4.5250244140625, -4.30499267578125, -4.0849609375, -3.86492919921875, -3.6448974609375, -3.42486572265625, -3.204833984375, -2.98480224609375, -2.7647705078125, -2.54473876953125, -2.32470703125, -2.10467529296875, -1.8846435546875, -1.66461181640625, -1.444580078125, -1.22454833984375, -1.0045166015625, -0.78448486328125, -0.564453125, -0.34442138671875, -0.1243896484375, 0.09564208984375, 0.315673828125, 0.53570556640625, 0.7557373046875, 0.97576904296875, 1.19580078125, 1.41583251953125, 1.6358642578125, 1.85589599609375, 2.075927734375, 2.29595947265625, 2.5159912109375, 2.73602294921875, 2.9560546875, 3.17608642578125, 3.3961181640625, 3.61614990234375, 3.836181640625, 4.05621337890625, 4.2762451171875, 4.49627685546875, 4.71630859375, 4.93634033203125, 5.1563720703125, 5.37640380859375, 5.596435546875, 5.81646728515625, 6.0364990234375, 6.25653076171875, 6.4765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 11.0, 4.0, 6.0, 12.0, 13.0, 20.0, 15.0, 31.0, 44.0, 64.0, 84.0, 156.0, 220.0, 313.0, 460.0, 552.0, 586.0, 464.0, 303.0, 229.0, 152.0, 83.0, 71.0, 48.0, 29.0, 26.0, 15.0, 12.0, 6.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.2734375, -4.1307373046875, -3.988037109375, -3.8453369140625, -3.70263671875, -3.5599365234375, -3.417236328125, -3.2745361328125, -3.1318359375, -2.9891357421875, -2.846435546875, -2.7037353515625, -2.56103515625, -2.4183349609375, -2.275634765625, -2.1329345703125, -1.990234375, -1.8475341796875, -1.704833984375, -1.5621337890625, -1.41943359375, -1.2767333984375, -1.134033203125, -0.9913330078125, -0.8486328125, -0.7059326171875, -0.563232421875, -0.4205322265625, -0.27783203125, -0.1351318359375, 0.007568359375, 0.1502685546875, 0.29296875, 0.4356689453125, 0.578369140625, 0.7210693359375, 0.86376953125, 1.0064697265625, 1.149169921875, 1.2918701171875, 1.4345703125, 1.5772705078125, 1.719970703125, 1.8626708984375, 2.00537109375, 2.1480712890625, 2.290771484375, 2.4334716796875, 2.576171875, 2.7188720703125, 2.861572265625, 3.0042724609375, 3.14697265625, 3.2896728515625, 3.432373046875, 3.5750732421875, 3.7177734375, 3.8604736328125, 4.003173828125, 4.1458740234375, 4.28857421875, 4.4312744140625, 4.573974609375, 4.7166748046875, 4.859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 9.0, 29.0, 83.0, 148.0, 219.0, 240.0, 170.0, 52.0, 22.0, 13.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.94607925415039, -28.575361251831055, -26.204641342163086, -23.83392333984375, -21.46320343017578, -19.092485427856445, -16.72176742553711, -14.35104751586914, -11.980329513549805, -9.609610557556152, -7.238892078399658, -4.868173599243164, -2.4974546432495117, -0.12673568725585938, 2.2439823150634766, 4.614702224731445, 6.985420227050781, 9.356139183044434, 11.726858139038086, 14.097576141357422, 16.46829605102539, 18.839014053344727, 21.209732055664062, 23.58045196533203, 25.951169967651367, 28.321887969970703, 30.692607879638672, 33.063323974609375, 35.434043884277344, 37.80476379394531, 40.17548370361328, 42.54620361328125, 44.91691589355469, 47.287635803222656, 49.65835189819336, 52.02907180786133, 54.3997917175293, 56.7705078125, 59.14122772216797, 61.51194763183594, 63.882667541503906, 66.25338745117188, 68.62410736083984, 70.99482727050781, 73.36553955078125, 75.73625946044922, 78.10697937011719, 80.47769927978516, 82.84841918945312, 85.2191390991211, 87.58985900878906, 89.9605712890625, 92.33129119873047, 94.70201110839844, 97.0727310180664, 99.44345092773438, 101.81416320800781, 104.18488311767578, 106.55560302734375, 108.92631530761719, 111.29703521728516, 113.66775512695312, 116.0384750366211, 118.40919494628906, 120.77991485595703]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 16.0, 16.0, 21.0, 19.0, 25.0, 27.0, 33.0, 33.0, 44.0, 38.0, 35.0, 42.0, 43.0, 44.0, 41.0, 47.0, 39.0, 40.0, 35.0, 39.0, 32.0, 43.0, 27.0, 22.0, 21.0, 18.0, 24.0, 12.0, 9.0, 11.0, 14.0, 7.0, 6.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.85090446472168, -19.187030792236328, -18.52315902709961, -17.859285354614258, -17.19541358947754, -16.531539916992188, -15.867667198181152, -15.203794479370117, -14.539921760559082, -13.876049041748047, -13.212176322937012, -12.548303604125977, -11.884429931640625, -11.220558166503906, -10.556684494018555, -9.89281177520752, -9.228939056396484, -8.56506633758545, -7.901193618774414, -7.237320423126221, -6.5734477043151855, -5.90957498550415, -5.245701789855957, -4.581829071044922, -3.9179563522338867, -3.2540836334228516, -2.5902106761932373, -1.9263378381729126, -1.262465000152588, -0.5985922813415527, 0.06528067588806152, 0.7291536331176758, 1.3930282592773438, 2.056900978088379, 2.720773935317993, 3.3846468925476074, 4.048519611358643, 4.712392330169678, 5.376265525817871, 6.040138244628906, 6.704010963439941, 7.367883682250977, 8.031756401062012, 8.695629119873047, 9.359502792358398, 10.023374557495117, 10.687248229980469, 11.351120948791504, 12.014993667602539, 12.678866386413574, 13.34273910522461, 14.006611824035645, 14.67048454284668, 15.334358215332031, 15.998230934143066, 16.6621036529541, 17.325977325439453, 17.989850997924805, 18.653722763061523, 19.317596435546875, 19.981468200683594, 20.645341873168945, 21.309213638305664, 21.973087310791016, 22.636959075927734]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 4.0, 8.0, 12.0, 6.0, 23.0, 22.0, 42.0, 72.0, 138.0, 247.0, 545.0, 1741.0, 8511.0, 71535.0, 659486.0, 275521.0, 25018.0, 3803.0, 984.0, 386.0, 165.0, 107.0, 44.0, 41.0, 18.0, 18.0, 20.0, 10.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.132080078125, -8.80322265625, -8.474365234375, -8.1455078125, -7.816650390625, -7.48779296875, -7.158935546875, -6.830078125, -6.501220703125, -6.17236328125, -5.843505859375, -5.5146484375, -5.185791015625, -4.85693359375, -4.528076171875, -4.19921875, -3.870361328125, -3.54150390625, -3.212646484375, -2.8837890625, -2.554931640625, -2.22607421875, -1.897216796875, -1.568359375, -1.239501953125, -0.91064453125, -0.581787109375, -0.2529296875, 0.075927734375, 0.40478515625, 0.733642578125, 1.0625, 1.391357421875, 1.72021484375, 2.049072265625, 2.3779296875, 2.706787109375, 3.03564453125, 3.364501953125, 3.693359375, 4.022216796875, 4.35107421875, 4.679931640625, 5.0087890625, 5.337646484375, 5.66650390625, 5.995361328125, 6.32421875, 6.653076171875, 6.98193359375, 7.310791015625, 7.6396484375, 7.968505859375, 8.29736328125, 8.626220703125, 8.955078125, 9.283935546875, 9.61279296875, 9.941650390625, 10.2705078125, 10.599365234375, 10.92822265625, 11.257080078125, 11.5859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 21.0, 46.0, 41.0, 71.0, 96.0, 106.0, 110.0, 119.0, 121.0, 96.0, 63.0, 44.0, 31.0, 13.0, 13.0, 5.0, 5.0, 0.0, 1.0], "bins": [-11.5625, -11.339447021484375, -11.11639404296875, -10.893341064453125, -10.6702880859375, -10.447235107421875, -10.22418212890625, -10.001129150390625, -9.778076171875, -9.555023193359375, -9.33197021484375, -9.108917236328125, -8.8858642578125, -8.662811279296875, -8.43975830078125, -8.216705322265625, -7.99365234375, -7.770599365234375, -7.54754638671875, -7.324493408203125, -7.1014404296875, -6.878387451171875, -6.65533447265625, -6.432281494140625, -6.209228515625, -5.986175537109375, -5.76312255859375, -5.540069580078125, -5.3170166015625, -5.093963623046875, -4.87091064453125, -4.647857666015625, -4.4248046875, -4.201751708984375, -3.97869873046875, -3.755645751953125, -3.5325927734375, -3.309539794921875, -3.08648681640625, -2.863433837890625, -2.640380859375, -2.417327880859375, -2.19427490234375, -1.971221923828125, -1.7481689453125, -1.525115966796875, -1.30206298828125, -1.079010009765625, -0.85595703125, -0.632904052734375, -0.40985107421875, -0.186798095703125, 0.0362548828125, 0.259307861328125, 0.48236083984375, 0.705413818359375, 0.928466796875, 1.151519775390625, 1.37457275390625, 1.597625732421875, 1.8206787109375, 2.043731689453125, 2.26678466796875, 2.489837646484375, 2.712890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 22.0, 28.0, 36.0, 54.0, 115.0, 173.0, 283.0, 550.0, 1202.0, 3768.0, 25155.0, 654750.0, 337375.0, 19482.0, 3272.0, 1056.0, 502.0, 266.0, 161.0, 89.0, 60.0, 31.0, 31.0, 20.0, 11.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.3802490234375, -8.971435546875, -8.5626220703125, -8.15380859375, -7.7449951171875, -7.336181640625, -6.9273681640625, -6.5185546875, -6.1097412109375, -5.700927734375, -5.2921142578125, -4.88330078125, -4.4744873046875, -4.065673828125, -3.6568603515625, -3.248046875, -2.8392333984375, -2.430419921875, -2.0216064453125, -1.61279296875, -1.2039794921875, -0.795166015625, -0.3863525390625, 0.0224609375, 0.4312744140625, 0.840087890625, 1.2489013671875, 1.65771484375, 2.0665283203125, 2.475341796875, 2.8841552734375, 3.29296875, 3.7017822265625, 4.110595703125, 4.5194091796875, 4.92822265625, 5.3370361328125, 5.745849609375, 6.1546630859375, 6.5634765625, 6.9722900390625, 7.381103515625, 7.7899169921875, 8.19873046875, 8.6075439453125, 9.016357421875, 9.4251708984375, 9.833984375, 10.2427978515625, 10.651611328125, 11.0604248046875, 11.46923828125, 11.8780517578125, 12.286865234375, 12.6956787109375, 13.1044921875, 13.5133056640625, 13.922119140625, 14.3309326171875, 14.73974609375, 15.1485595703125, 15.557373046875, 15.9661865234375, 16.375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 6.0, 5.0, 10.0, 7.0, 20.0, 23.0, 32.0, 40.0, 38.0, 42.0, 51.0, 49.0, 60.0, 78.0, 69.0, 68.0, 62.0, 56.0, 58.0, 51.0, 40.0, 34.0, 16.0, 22.0, 8.0, 11.0, 8.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.171875, -11.72314453125, -11.2744140625, -10.82568359375, -10.376953125, -9.92822265625, -9.4794921875, -9.03076171875, -8.58203125, -8.13330078125, -7.6845703125, -7.23583984375, -6.787109375, -6.33837890625, -5.8896484375, -5.44091796875, -4.9921875, -4.54345703125, -4.0947265625, -3.64599609375, -3.197265625, -2.74853515625, -2.2998046875, -1.85107421875, -1.40234375, -0.95361328125, -0.5048828125, -0.05615234375, 0.392578125, 0.84130859375, 1.2900390625, 1.73876953125, 2.1875, 2.63623046875, 3.0849609375, 3.53369140625, 3.982421875, 4.43115234375, 4.8798828125, 5.32861328125, 5.77734375, 6.22607421875, 6.6748046875, 7.12353515625, 7.572265625, 8.02099609375, 8.4697265625, 8.91845703125, 9.3671875, 9.81591796875, 10.2646484375, 10.71337890625, 11.162109375, 11.61083984375, 12.0595703125, 12.50830078125, 12.95703125, 13.40576171875, 13.8544921875, 14.30322265625, 14.751953125, 15.20068359375, 15.6494140625, 16.09814453125, 16.546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 2.0, 4.0, 9.0, 19.0, 21.0, 37.0, 46.0, 84.0, 146.0, 405.0, 1058.0, 3727.0, 19463.0, 202485.0, 773643.0, 38456.0, 6292.0, 1575.0, 557.0, 220.0, 105.0, 69.0, 36.0, 27.0, 18.0, 17.0, 7.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.093017578125, -3.98291015625, -3.872802734375, -3.7626953125, -3.652587890625, -3.54248046875, -3.432373046875, -3.322265625, -3.212158203125, -3.10205078125, -2.991943359375, -2.8818359375, -2.771728515625, -2.66162109375, -2.551513671875, -2.44140625, -2.331298828125, -2.22119140625, -2.111083984375, -2.0009765625, -1.890869140625, -1.78076171875, -1.670654296875, -1.560546875, -1.450439453125, -1.34033203125, -1.230224609375, -1.1201171875, -1.010009765625, -0.89990234375, -0.789794921875, -0.6796875, -0.569580078125, -0.45947265625, -0.349365234375, -0.2392578125, -0.129150390625, -0.01904296875, 0.091064453125, 0.201171875, 0.311279296875, 0.42138671875, 0.531494140625, 0.6416015625, 0.751708984375, 0.86181640625, 0.971923828125, 1.08203125, 1.192138671875, 1.30224609375, 1.412353515625, 1.5224609375, 1.632568359375, 1.74267578125, 1.852783203125, 1.962890625, 2.072998046875, 2.18310546875, 2.293212890625, 2.4033203125, 2.513427734375, 2.62353515625, 2.733642578125, 2.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 1.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 10.0, 6.0, 8.0, 17.0, 17.0, 32.0, 30.0, 41.0, 67.0, 104.0, 172.0, 151.0, 97.0, 50.0, 38.0, 30.0, 23.0, 26.0, 10.0, 19.0, 7.0, 8.0, 6.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005536079406738281, -0.0005362257361412048, -0.0005188435316085815, -0.0005014613270759583, -0.00048407912254333496, -0.00046669691801071167, -0.0004493147134780884, -0.0004319325089454651, -0.0004145503044128418, -0.0003971680998802185, -0.0003797858953475952, -0.0003624036908149719, -0.00034502148628234863, -0.00032763928174972534, -0.00031025707721710205, -0.00029287487268447876, -0.00027549266815185547, -0.0002581104636192322, -0.0002407282590866089, -0.0002233460545539856, -0.0002059638500213623, -0.00018858164548873901, -0.00017119944095611572, -0.00015381723642349243, -0.00013643503189086914, -0.00011905282735824585, -0.00010167062282562256, -8.428841829299927e-05, -6.690621376037598e-05, -4.9524009227752686e-05, -3.2141804695129395e-05, -1.4759600162506104e-05, 2.6226043701171875e-06, 2.000480890274048e-05, 3.738701343536377e-05, 5.476921796798706e-05, 7.215142250061035e-05, 8.953362703323364e-05, 0.00010691583156585693, 0.00012429803609848022, 0.00014168024063110352, 0.0001590624451637268, 0.0001764446496963501, 0.0001938268542289734, 0.00021120905876159668, 0.00022859126329421997, 0.00024597346782684326, 0.00026335567235946655, 0.00028073787689208984, 0.00029812008142471313, 0.0003155022859573364, 0.0003328844904899597, 0.000350266695022583, 0.0003676488995552063, 0.0003850311040878296, 0.0004024133086204529, 0.00041979551315307617, 0.00043717771768569946, 0.00045455992221832275, 0.00047194212675094604, 0.0004893243312835693, 0.0005067065358161926, 0.0005240887403488159, 0.0005414709448814392, 0.0005588531494140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 8.0, 13.0, 22.0, 22.0, 34.0, 41.0, 60.0, 95.0, 197.0, 370.0, 728.0, 1640.0, 4586.0, 15684.0, 74850.0, 739388.0, 170674.0, 28227.0, 7202.0, 2513.0, 1042.0, 479.0, 274.0, 124.0, 84.0, 62.0, 59.0, 29.0, 10.0, 11.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-3.173828125, -3.091827392578125, -3.00982666015625, -2.927825927734375, -2.8458251953125, -2.763824462890625, -2.68182373046875, -2.599822998046875, -2.517822265625, -2.435821533203125, -2.35382080078125, -2.271820068359375, -2.1898193359375, -2.107818603515625, -2.02581787109375, -1.943817138671875, -1.86181640625, -1.779815673828125, -1.69781494140625, -1.615814208984375, -1.5338134765625, -1.451812744140625, -1.36981201171875, -1.287811279296875, -1.205810546875, -1.123809814453125, -1.04180908203125, -0.959808349609375, -0.8778076171875, -0.795806884765625, -0.71380615234375, -0.631805419921875, -0.5498046875, -0.467803955078125, -0.38580322265625, -0.303802490234375, -0.2218017578125, -0.139801025390625, -0.05780029296875, 0.024200439453125, 0.106201171875, 0.188201904296875, 0.27020263671875, 0.352203369140625, 0.4342041015625, 0.516204833984375, 0.59820556640625, 0.680206298828125, 0.76220703125, 0.844207763671875, 0.92620849609375, 1.008209228515625, 1.0902099609375, 1.172210693359375, 1.25421142578125, 1.336212158203125, 1.418212890625, 1.500213623046875, 1.58221435546875, 1.664215087890625, 1.7462158203125, 1.828216552734375, 1.91021728515625, 1.992218017578125, 2.07421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 12.0, 6.0, 11.0, 6.0, 16.0, 20.0, 14.0, 34.0, 41.0, 55.0, 54.0, 72.0, 120.0, 104.0, 87.0, 99.0, 45.0, 37.0, 28.0, 29.0, 14.0, 19.0, 8.0, 15.0, 14.0, 8.0, 4.0, 3.0, 7.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.333984375, -2.268096923828125, -2.20220947265625, -2.136322021484375, -2.0704345703125, -2.004547119140625, -1.93865966796875, -1.872772216796875, -1.806884765625, -1.740997314453125, -1.67510986328125, -1.609222412109375, -1.5433349609375, -1.477447509765625, -1.41156005859375, -1.345672607421875, -1.27978515625, -1.213897705078125, -1.14801025390625, -1.082122802734375, -1.0162353515625, -0.950347900390625, -0.88446044921875, -0.818572998046875, -0.752685546875, -0.686798095703125, -0.62091064453125, -0.555023193359375, -0.4891357421875, -0.423248291015625, -0.35736083984375, -0.291473388671875, -0.2255859375, -0.159698486328125, -0.09381103515625, -0.027923583984375, 0.0379638671875, 0.103851318359375, 0.16973876953125, 0.235626220703125, 0.301513671875, 0.367401123046875, 0.43328857421875, 0.499176025390625, 0.5650634765625, 0.630950927734375, 0.69683837890625, 0.762725830078125, 0.82861328125, 0.894500732421875, 0.96038818359375, 1.026275634765625, 1.0921630859375, 1.158050537109375, 1.22393798828125, 1.289825439453125, 1.355712890625, 1.421600341796875, 1.48748779296875, 1.553375244140625, 1.6192626953125, 1.685150146484375, 1.75103759765625, 1.816925048828125, 1.8828125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 15.0, 28.0, 74.0, 233.0, 411.0, 124.0, 62.0, 20.0, 13.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.45770263671875, -86.38419342041016, -83.31067657470703, -80.23716735839844, -77.16365051269531, -74.09014129638672, -71.0166244506836, -67.943115234375, -64.86959838867188, -61.796085357666016, -58.722572326660156, -55.6490592956543, -52.57554626464844, -49.50203323364258, -46.42852020263672, -43.355010986328125, -40.281497955322266, -37.207984924316406, -34.13447189331055, -31.060958862304688, -27.987445831298828, -24.91393280029297, -21.840421676635742, -18.766908645629883, -15.693395614624023, -12.619882583618164, -9.546369552612305, -6.472857475280762, -3.3993444442749023, -0.32583141326904297, 2.7476806640625, 5.821193695068359, 8.894706726074219, 11.968219757080078, 15.041732788085938, 18.115245819091797, 21.188758850097656, 24.262271881103516, 27.335783004760742, 30.4092960357666, 33.482810974121094, 36.55632400512695, 39.62983703613281, 42.70335006713867, 45.77686309814453, 48.85037612915039, 51.92388916015625, 54.997398376464844, 58.0709114074707, 61.14442443847656, 64.21793365478516, 67.29145050048828, 70.36495971679688, 73.4384765625, 76.5119857788086, 79.58550262451172, 82.65901184082031, 85.7325210571289, 88.80603790283203, 91.87954711914062, 94.95306396484375, 98.02657318115234, 101.10009002685547, 104.17359924316406, 107.24711608886719]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 12.0, 16.0, 13.0, 15.0, 33.0, 29.0, 29.0, 32.0, 36.0, 49.0, 76.0, 127.0, 113.0, 80.0, 53.0, 36.0, 32.0, 31.0, 28.0, 19.0, 14.0, 22.0, 15.0, 19.0, 5.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.97138214111328, -41.42879104614258, -39.886199951171875, -38.34360885620117, -36.80101776123047, -35.2584228515625, -33.7158317565918, -32.173240661621094, -30.63064956665039, -29.088058471679688, -27.545467376708984, -26.00287437438965, -24.460283279418945, -22.917692184448242, -21.375099182128906, -19.832508087158203, -18.2899169921875, -16.747325897216797, -15.204733848571777, -13.662141799926758, -12.119550704956055, -10.576959609985352, -9.034367561340332, -7.4917755126953125, -5.949184417724609, -4.406592845916748, -2.8640012741088867, -1.3214097023010254, 0.22118186950683594, 1.7637734413146973, 3.3063650131225586, 4.848957061767578, 6.391548156738281, 7.934139728546143, 9.476731300354004, 11.019323348999023, 12.561914443969727, 14.10450553894043, 15.64709758758545, 17.18968963623047, 18.732280731201172, 20.274871826171875, 21.817462921142578, 23.360055923461914, 24.902647018432617, 26.44523811340332, 27.987831115722656, 29.53042221069336, 31.073013305664062, 32.615604400634766, 34.15819549560547, 35.70078659057617, 37.243377685546875, 38.785972595214844, 40.32856369018555, 41.87115478515625, 43.41374588012695, 44.956336975097656, 46.49892807006836, 48.04151916503906, 49.58411407470703, 51.126705169677734, 52.66929626464844, 54.21188735961914, 55.754478454589844]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 15.0, 14.0, 18.0, 24.0, 51.0, 111.0, 244.0, 467.0, 1082.0, 2903.0, 10372.0, 60736.0, 991138.0, 2885657.0, 208475.0, 23694.0, 5681.0, 1998.0, 834.0, 370.0, 154.0, 103.0, 46.0, 38.0, 8.0, 15.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.82421875, -4.640380859375, -4.45654296875, -4.272705078125, -4.0888671875, -3.905029296875, -3.72119140625, -3.537353515625, -3.353515625, -3.169677734375, -2.98583984375, -2.802001953125, -2.6181640625, -2.434326171875, -2.25048828125, -2.066650390625, -1.8828125, -1.698974609375, -1.51513671875, -1.331298828125, -1.1474609375, -0.963623046875, -0.77978515625, -0.595947265625, -0.412109375, -0.228271484375, -0.04443359375, 0.139404296875, 0.3232421875, 0.507080078125, 0.69091796875, 0.874755859375, 1.05859375, 1.242431640625, 1.42626953125, 1.610107421875, 1.7939453125, 1.977783203125, 2.16162109375, 2.345458984375, 2.529296875, 2.713134765625, 2.89697265625, 3.080810546875, 3.2646484375, 3.448486328125, 3.63232421875, 3.816162109375, 4.0, 4.183837890625, 4.36767578125, 4.551513671875, 4.7353515625, 4.919189453125, 5.10302734375, 5.286865234375, 5.470703125, 5.654541015625, 5.83837890625, 6.022216796875, 6.2060546875, 6.389892578125, 6.57373046875, 6.757568359375, 6.94140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 14.0, 18.0, 27.0, 32.0, 37.0, 46.0, 63.0, 77.0, 68.0, 83.0, 85.0, 69.0, 68.0, 77.0, 58.0, 60.0, 30.0, 24.0, 20.0, 13.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.9140625, -6.764129638671875, -6.61419677734375, -6.464263916015625, -6.3143310546875, -6.164398193359375, -6.01446533203125, -5.864532470703125, -5.714599609375, -5.564666748046875, -5.41473388671875, -5.264801025390625, -5.1148681640625, -4.964935302734375, -4.81500244140625, -4.665069580078125, -4.51513671875, -4.365203857421875, -4.21527099609375, -4.065338134765625, -3.9154052734375, -3.765472412109375, -3.61553955078125, -3.465606689453125, -3.315673828125, -3.165740966796875, -3.01580810546875, -2.865875244140625, -2.7159423828125, -2.566009521484375, -2.41607666015625, -2.266143798828125, -2.1162109375, -1.966278076171875, -1.81634521484375, -1.666412353515625, -1.5164794921875, -1.366546630859375, -1.21661376953125, -1.066680908203125, -0.916748046875, -0.766815185546875, -0.61688232421875, -0.466949462890625, -0.3170166015625, -0.167083740234375, -0.01715087890625, 0.132781982421875, 0.28271484375, 0.432647705078125, 0.58258056640625, 0.732513427734375, 0.8824462890625, 1.032379150390625, 1.18231201171875, 1.332244873046875, 1.482177734375, 1.632110595703125, 1.78204345703125, 1.931976318359375, 2.0819091796875, 2.231842041015625, 2.38177490234375, 2.531707763671875, 2.681640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 13.0, 19.0, 21.0, 43.0, 43.0, 98.0, 177.0, 393.0, 1238.0, 5124.0, 35906.0, 1314377.0, 2774366.0, 53527.0, 6542.0, 1474.0, 427.0, 186.0, 96.0, 66.0, 43.0, 24.0, 16.0, 14.0, 6.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.74755859375, -7.4716796875, -7.19580078125, -6.919921875, -6.64404296875, -6.3681640625, -6.09228515625, -5.81640625, -5.54052734375, -5.2646484375, -4.98876953125, -4.712890625, -4.43701171875, -4.1611328125, -3.88525390625, -3.609375, -3.33349609375, -3.0576171875, -2.78173828125, -2.505859375, -2.22998046875, -1.9541015625, -1.67822265625, -1.40234375, -1.12646484375, -0.8505859375, -0.57470703125, -0.298828125, -0.02294921875, 0.2529296875, 0.52880859375, 0.8046875, 1.08056640625, 1.3564453125, 1.63232421875, 1.908203125, 2.18408203125, 2.4599609375, 2.73583984375, 3.01171875, 3.28759765625, 3.5634765625, 3.83935546875, 4.115234375, 4.39111328125, 4.6669921875, 4.94287109375, 5.21875, 5.49462890625, 5.7705078125, 6.04638671875, 6.322265625, 6.59814453125, 6.8740234375, 7.14990234375, 7.42578125, 7.70166015625, 7.9775390625, 8.25341796875, 8.529296875, 8.80517578125, 9.0810546875, 9.35693359375, 9.6328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 2.0, 7.0, 9.0, 16.0, 15.0, 19.0, 20.0, 27.0, 45.0, 60.0, 75.0, 131.0, 182.0, 293.0, 420.0, 572.0, 615.0, 487.0, 349.0, 208.0, 157.0, 102.0, 77.0, 51.0, 27.0, 29.0, 21.0, 7.0, 9.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.76953125, -4.611328125, -4.453125, -4.294921875, -4.13671875, -3.978515625, -3.8203125, -3.662109375, -3.50390625, -3.345703125, -3.1875, -3.029296875, -2.87109375, -2.712890625, -2.5546875, -2.396484375, -2.23828125, -2.080078125, -1.921875, -1.763671875, -1.60546875, -1.447265625, -1.2890625, -1.130859375, -0.97265625, -0.814453125, -0.65625, -0.498046875, -0.33984375, -0.181640625, -0.0234375, 0.134765625, 0.29296875, 0.451171875, 0.609375, 0.767578125, 0.92578125, 1.083984375, 1.2421875, 1.400390625, 1.55859375, 1.716796875, 1.875, 2.033203125, 2.19140625, 2.349609375, 2.5078125, 2.666015625, 2.82421875, 2.982421875, 3.140625, 3.298828125, 3.45703125, 3.615234375, 3.7734375, 3.931640625, 4.08984375, 4.248046875, 4.40625, 4.564453125, 4.72265625, 4.880859375, 5.0390625, 5.197265625, 5.35546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 5.0, 10.0, 23.0, 58.0, 112.0, 214.0, 271.0, 176.0, 80.0, 23.0, 11.0, 4.0, 5.0, 3.0, 4.0, 1.0], "bins": [-120.76243591308594, -118.53803253173828, -116.31362915039062, -114.08922576904297, -111.86482238769531, -109.64041900634766, -107.416015625, -105.19160461425781, -102.96720886230469, -100.74280548095703, -98.51840209960938, -96.29399871826172, -94.06959533691406, -91.8451919555664, -89.62078857421875, -87.39637756347656, -85.1719741821289, -82.94757080078125, -80.7231674194336, -78.49876403808594, -76.27436065673828, -74.04995727539062, -71.82555389404297, -69.60115051269531, -67.37673950195312, -65.15233612060547, -62.92793273925781, -60.703529357910156, -58.4791259765625, -56.254722595214844, -54.03031539916992, -51.805912017822266, -49.581512451171875, -47.35710906982422, -45.13270568847656, -42.908302307128906, -40.68389892578125, -38.459495544433594, -36.23508834838867, -34.010684967041016, -31.78628158569336, -29.561878204345703, -27.337474822998047, -25.113069534301758, -22.8886661529541, -20.664262771606445, -18.439857482910156, -16.2154541015625, -13.991050720214844, -11.766647338867188, -9.542243003845215, -7.3178391456604, -5.093435287475586, -2.8690319061279297, -0.644627571105957, 1.5797767639160156, 3.804180145263672, 6.028584003448486, 8.2529878616333, 10.477392196655273, 12.70179557800293, 14.926198959350586, 17.150604248046875, 19.37500762939453, 21.599411010742188]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 7.0, 13.0, 14.0, 11.0, 29.0, 13.0, 19.0, 21.0, 26.0, 37.0, 35.0, 35.0, 43.0, 48.0, 71.0, 62.0, 67.0, 62.0, 44.0, 42.0, 40.0, 26.0, 30.0, 40.0, 24.0, 26.0, 16.0, 22.0, 13.0, 16.0, 5.0, 11.0, 6.0, 2.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.296241760253906, -31.374244689941406, -30.45224952697754, -29.53025245666504, -28.608257293701172, -27.686260223388672, -26.764263153076172, -25.842267990112305, -24.920272827148438, -23.998275756835938, -23.07628059387207, -22.15428352355957, -21.232288360595703, -20.310291290283203, -19.388294219970703, -18.466299057006836, -17.544301986694336, -16.622304916381836, -15.700309753417969, -14.778312683105469, -13.856317520141602, -12.934320449829102, -12.012324333190918, -11.090328216552734, -10.16833209991455, -9.246335983276367, -8.324339866638184, -7.402343273162842, -6.480347156524658, -5.558351039886475, -4.636354446411133, -3.714358329772949, -2.7923622131347656, -1.8703659772872925, -0.9483697414398193, -0.02637338638305664, 0.895622730255127, 1.8176188468933105, 2.7396154403686523, 3.661611557006836, 4.5836076736450195, 5.505603790283203, 6.427599906921387, 7.3495965003967285, 8.27159309387207, 9.193588256835938, 10.115585327148438, 11.037581443786621, 11.959577560424805, 12.881573677062988, 13.803569793701172, 14.725566864013672, 15.647562026977539, 16.56955909729004, 17.491554260253906, 18.413551330566406, 19.335548400878906, 20.257545471191406, 21.179540634155273, 22.101537704467773, 23.02353286743164, 23.94552993774414, 24.86752700805664, 25.789522171020508, 26.711517333984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 7.0, 11.0, 16.0, 26.0, 45.0, 44.0, 90.0, 148.0, 281.0, 522.0, 1288.0, 3158.0, 8905.0, 31217.0, 129389.0, 530890.0, 263318.0, 55710.0, 15034.0, 4900.0, 1814.0, 813.0, 378.0, 212.0, 113.0, 64.0, 44.0, 32.0, 18.0, 11.0, 5.0, 8.0, 8.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.66796875, -7.43359375, -7.19921875, -6.96484375, -6.73046875, -6.49609375, -6.26171875, -6.02734375, -5.79296875, -5.55859375, -5.32421875, -5.08984375, -4.85546875, -4.62109375, -4.38671875, -4.15234375, -3.91796875, -3.68359375, -3.44921875, -3.21484375, -2.98046875, -2.74609375, -2.51171875, -2.27734375, -2.04296875, -1.80859375, -1.57421875, -1.33984375, -1.10546875, -0.87109375, -0.63671875, -0.40234375, -0.16796875, 0.06640625, 0.30078125, 0.53515625, 0.76953125, 1.00390625, 1.23828125, 1.47265625, 1.70703125, 1.94140625, 2.17578125, 2.41015625, 2.64453125, 2.87890625, 3.11328125, 3.34765625, 3.58203125, 3.81640625, 4.05078125, 4.28515625, 4.51953125, 4.75390625, 4.98828125, 5.22265625, 5.45703125, 5.69140625, 5.92578125, 6.16015625, 6.39453125, 6.62890625, 6.86328125, 7.09765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 11.0, 7.0, 11.0, 18.0, 27.0, 36.0, 41.0, 59.0, 78.0, 80.0, 80.0, 80.0, 76.0, 88.0, 64.0, 63.0, 45.0, 40.0, 35.0, 23.0, 21.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.77081298828125, -6.6119384765625, -6.45306396484375, -6.294189453125, -6.13531494140625, -5.9764404296875, -5.81756591796875, -5.65869140625, -5.49981689453125, -5.3409423828125, -5.18206787109375, -5.023193359375, -4.86431884765625, -4.7054443359375, -4.54656982421875, -4.3876953125, -4.22882080078125, -4.0699462890625, -3.91107177734375, -3.752197265625, -3.59332275390625, -3.4344482421875, -3.27557373046875, -3.11669921875, -2.95782470703125, -2.7989501953125, -2.64007568359375, -2.481201171875, -2.32232666015625, -2.1634521484375, -2.00457763671875, -1.845703125, -1.68682861328125, -1.5279541015625, -1.36907958984375, -1.210205078125, -1.05133056640625, -0.8924560546875, -0.73358154296875, -0.57470703125, -0.41583251953125, -0.2569580078125, -0.09808349609375, 0.060791015625, 0.21966552734375, 0.3785400390625, 0.53741455078125, 0.6962890625, 0.85516357421875, 1.0140380859375, 1.17291259765625, 1.331787109375, 1.49066162109375, 1.6495361328125, 1.80841064453125, 1.96728515625, 2.12615966796875, 2.2850341796875, 2.44390869140625, 2.602783203125, 2.76165771484375, 2.9205322265625, 3.07940673828125, 3.23828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 3.0, 9.0, 15.0, 17.0, 30.0, 60.0, 118.0, 148.0, 299.0, 536.0, 1138.0, 3117.0, 20914.0, 868232.0, 142666.0, 7725.0, 1852.0, 734.0, 381.0, 199.0, 136.0, 68.0, 38.0, 30.0, 17.0, 20.0, 13.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.390625, -17.84619140625, -17.3017578125, -16.75732421875, -16.212890625, -15.66845703125, -15.1240234375, -14.57958984375, -14.03515625, -13.49072265625, -12.9462890625, -12.40185546875, -11.857421875, -11.31298828125, -10.7685546875, -10.22412109375, -9.6796875, -9.13525390625, -8.5908203125, -8.04638671875, -7.501953125, -6.95751953125, -6.4130859375, -5.86865234375, -5.32421875, -4.77978515625, -4.2353515625, -3.69091796875, -3.146484375, -2.60205078125, -2.0576171875, -1.51318359375, -0.96875, -0.42431640625, 0.1201171875, 0.66455078125, 1.208984375, 1.75341796875, 2.2978515625, 2.84228515625, 3.38671875, 3.93115234375, 4.4755859375, 5.02001953125, 5.564453125, 6.10888671875, 6.6533203125, 7.19775390625, 7.7421875, 8.28662109375, 8.8310546875, 9.37548828125, 9.919921875, 10.46435546875, 11.0087890625, 11.55322265625, 12.09765625, 12.64208984375, 13.1865234375, 13.73095703125, 14.275390625, 14.81982421875, 15.3642578125, 15.90869140625, 16.453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 17.0, 9.0, 23.0, 31.0, 35.0, 37.0, 45.0, 69.0, 86.0, 97.0, 122.0, 82.0, 90.0, 70.0, 35.0, 53.0, 26.0, 25.0, 5.0, 13.0, 8.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.671875, -15.024658203125, -14.37744140625, -13.730224609375, -13.0830078125, -12.435791015625, -11.78857421875, -11.141357421875, -10.494140625, -9.846923828125, -9.19970703125, -8.552490234375, -7.9052734375, -7.258056640625, -6.61083984375, -5.963623046875, -5.31640625, -4.669189453125, -4.02197265625, -3.374755859375, -2.7275390625, -2.080322265625, -1.43310546875, -0.785888671875, -0.138671875, 0.508544921875, 1.15576171875, 1.802978515625, 2.4501953125, 3.097412109375, 3.74462890625, 4.391845703125, 5.0390625, 5.686279296875, 6.33349609375, 6.980712890625, 7.6279296875, 8.275146484375, 8.92236328125, 9.569580078125, 10.216796875, 10.864013671875, 11.51123046875, 12.158447265625, 12.8056640625, 13.452880859375, 14.10009765625, 14.747314453125, 15.39453125, 16.041748046875, 16.68896484375, 17.336181640625, 17.9833984375, 18.630615234375, 19.27783203125, 19.925048828125, 20.572265625, 21.219482421875, 21.86669921875, 22.513916015625, 23.1611328125, 23.808349609375, 24.45556640625, 25.102783203125, 25.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 3.0, 5.0, 5.0, 10.0, 23.0, 25.0, 15.0, 37.0, 48.0, 71.0, 108.0, 209.0, 428.0, 989.0, 3048.0, 12765.0, 201481.0, 803369.0, 19245.0, 4166.0, 1382.0, 489.0, 237.0, 128.0, 69.0, 50.0, 32.0, 15.0, 19.0, 17.0, 10.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.546875, -5.38427734375, -5.2216796875, -5.05908203125, -4.896484375, -4.73388671875, -4.5712890625, -4.40869140625, -4.24609375, -4.08349609375, -3.9208984375, -3.75830078125, -3.595703125, -3.43310546875, -3.2705078125, -3.10791015625, -2.9453125, -2.78271484375, -2.6201171875, -2.45751953125, -2.294921875, -2.13232421875, -1.9697265625, -1.80712890625, -1.64453125, -1.48193359375, -1.3193359375, -1.15673828125, -0.994140625, -0.83154296875, -0.6689453125, -0.50634765625, -0.34375, -0.18115234375, -0.0185546875, 0.14404296875, 0.306640625, 0.46923828125, 0.6318359375, 0.79443359375, 0.95703125, 1.11962890625, 1.2822265625, 1.44482421875, 1.607421875, 1.77001953125, 1.9326171875, 2.09521484375, 2.2578125, 2.42041015625, 2.5830078125, 2.74560546875, 2.908203125, 3.07080078125, 3.2333984375, 3.39599609375, 3.55859375, 3.72119140625, 3.8837890625, 4.04638671875, 4.208984375, 4.37158203125, 4.5341796875, 4.69677734375, 4.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 6.0, 4.0, 10.0, 20.0, 23.0, 31.0, 27.0, 62.0, 121.0, 241.0, 188.0, 75.0, 52.0, 32.0, 26.0, 12.0, 10.0, 9.0, 6.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009493827819824219, -0.0009094998240470886, -0.0008696168661117554, -0.0008297339081764221, -0.0007898509502410889, -0.0007499679923057556, -0.0007100850343704224, -0.0006702020764350891, -0.0006303191184997559, -0.0005904361605644226, -0.0005505532026290894, -0.0005106702446937561, -0.00047078728675842285, -0.0004309043288230896, -0.00039102137088775635, -0.0003511384129524231, -0.00031125545501708984, -0.0002713724970817566, -0.00023148953914642334, -0.0001916065812110901, -0.00015172362327575684, -0.00011184066534042358, -7.195770740509033e-05, -3.207474946975708e-05, 7.808208465576172e-06, 4.7691166400909424e-05, 8.757412433624268e-05, 0.00012745708227157593, 0.00016734004020690918, 0.00020722299814224243, 0.0002471059560775757, 0.00028698891401290894, 0.0003268718719482422, 0.00036675482988357544, 0.0004066377878189087, 0.00044652074575424194, 0.0004864037036895752, 0.0005262866616249084, 0.0005661696195602417, 0.000606052577495575, 0.0006459355354309082, 0.0006858184933662415, 0.0007257014513015747, 0.000765584409236908, 0.0008054673671722412, 0.0008453503251075745, 0.0008852332830429077, 0.000925116240978241, 0.0009649991989135742, 0.0010048821568489075, 0.0010447651147842407, 0.001084648072719574, 0.0011245310306549072, 0.0011644139885902405, 0.0012042969465255737, 0.001244179904460907, 0.0012840628623962402, 0.0013239458203315735, 0.0013638287782669067, 0.00140371173620224, 0.0014435946941375732, 0.0014834776520729065, 0.0015233606100082397, 0.001563243567943573, 0.0016031265258789062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 12.0, 12.0, 20.0, 29.0, 32.0, 36.0, 42.0, 54.0, 93.0, 140.0, 206.0, 294.0, 593.0, 1155.0, 2317.0, 5628.0, 15468.0, 67453.0, 743810.0, 167373.0, 28305.0, 8536.0, 3392.0, 1519.0, 828.0, 410.0, 248.0, 172.0, 95.0, 75.0, 57.0, 29.0, 28.0, 16.0, 9.0, 11.0, 17.0, 8.0, 4.0, 3.0, 3.0, 5.0, 2.0, 5.0, 1.0], "bins": [-3.01171875, -2.931884765625, -2.85205078125, -2.772216796875, -2.6923828125, -2.612548828125, -2.53271484375, -2.452880859375, -2.373046875, -2.293212890625, -2.21337890625, -2.133544921875, -2.0537109375, -1.973876953125, -1.89404296875, -1.814208984375, -1.734375, -1.654541015625, -1.57470703125, -1.494873046875, -1.4150390625, -1.335205078125, -1.25537109375, -1.175537109375, -1.095703125, -1.015869140625, -0.93603515625, -0.856201171875, -0.7763671875, -0.696533203125, -0.61669921875, -0.536865234375, -0.45703125, -0.377197265625, -0.29736328125, -0.217529296875, -0.1376953125, -0.057861328125, 0.02197265625, 0.101806640625, 0.181640625, 0.261474609375, 0.34130859375, 0.421142578125, 0.5009765625, 0.580810546875, 0.66064453125, 0.740478515625, 0.8203125, 0.900146484375, 0.97998046875, 1.059814453125, 1.1396484375, 1.219482421875, 1.29931640625, 1.379150390625, 1.458984375, 1.538818359375, 1.61865234375, 1.698486328125, 1.7783203125, 1.858154296875, 1.93798828125, 2.017822265625, 2.09765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 6.0, 7.0, 6.0, 6.0, 9.0, 8.0, 13.0, 16.0, 42.0, 35.0, 30.0, 56.0, 81.0, 106.0, 113.0, 94.0, 92.0, 55.0, 47.0, 41.0, 28.0, 17.0, 14.0, 15.0, 13.0, 6.0, 2.0, 4.0, 6.0, 1.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.75, -2.672607421875, -2.59521484375, -2.517822265625, -2.4404296875, -2.363037109375, -2.28564453125, -2.208251953125, -2.130859375, -2.053466796875, -1.97607421875, -1.898681640625, -1.8212890625, -1.743896484375, -1.66650390625, -1.589111328125, -1.51171875, -1.434326171875, -1.35693359375, -1.279541015625, -1.2021484375, -1.124755859375, -1.04736328125, -0.969970703125, -0.892578125, -0.815185546875, -0.73779296875, -0.660400390625, -0.5830078125, -0.505615234375, -0.42822265625, -0.350830078125, -0.2734375, -0.196044921875, -0.11865234375, -0.041259765625, 0.0361328125, 0.113525390625, 0.19091796875, 0.268310546875, 0.345703125, 0.423095703125, 0.50048828125, 0.577880859375, 0.6552734375, 0.732666015625, 0.81005859375, 0.887451171875, 0.96484375, 1.042236328125, 1.11962890625, 1.197021484375, 1.2744140625, 1.351806640625, 1.42919921875, 1.506591796875, 1.583984375, 1.661376953125, 1.73876953125, 1.816162109375, 1.8935546875, 1.970947265625, 2.04833984375, 2.125732421875, 2.203125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 14.0, 54.0, 173.0, 516.0, 124.0, 58.0, 19.0, 18.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-127.51632690429688, -123.69622802734375, -119.87612915039062, -116.05602264404297, -112.23592376708984, -108.41582489013672, -104.5957260131836, -100.77561950683594, -96.95552062988281, -93.13542175292969, -89.31532287597656, -85.4952163696289, -81.67511749267578, -77.85501861572266, -74.03491973876953, -70.21481323242188, -66.39471435546875, -62.574615478515625, -58.754512786865234, -54.93441390991211, -51.11431121826172, -47.294212341308594, -43.47411346435547, -39.65401077270508, -35.83391571044922, -32.013816833496094, -28.193714141845703, -24.373615264892578, -20.553512573242188, -16.733413696289062, -12.913312911987305, -9.093212127685547, -5.273109436035156, -1.4530088901519775, 2.367091655731201, 6.187191963195801, 10.007292747497559, 13.827392578125, 17.647493362426758, 21.467594146728516, 25.287694931030273, 29.10779571533203, 32.927894592285156, 36.74799728393555, 40.56809616088867, 44.38819885253906, 48.20829772949219, 52.02839660644531, 55.8484992980957, 59.66859817504883, 63.48870086669922, 67.30879974365234, 71.12889862060547, 74.94900512695312, 78.76910400390625, 82.58920288085938, 86.4093017578125, 90.22940063476562, 94.04949951171875, 97.8696060180664, 101.68970489501953, 105.50980377197266, 109.32990264892578, 113.15000915527344, 116.97010803222656]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 12.0, 10.0, 14.0, 20.0, 25.0, 28.0, 34.0, 41.0, 37.0, 57.0, 60.0, 133.0, 172.0, 70.0, 46.0, 40.0, 32.0, 33.0, 35.0, 25.0, 20.0, 9.0, 7.0, 9.0, 3.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.125999450683594, -44.997379302978516, -42.86875915527344, -40.74013900756836, -38.61151885986328, -36.48289489746094, -34.35427474975586, -32.22565460205078, -30.097034454345703, -27.968414306640625, -25.839794158935547, -23.711172103881836, -21.582551956176758, -19.45393180847168, -17.32530975341797, -15.19668960571289, -13.068069458007812, -10.939449310302734, -8.81082820892334, -6.6822075843811035, -4.553586959838867, -2.424966812133789, -0.29634571075439453, 1.832275390625, 3.960895538330078, 6.0895161628723145, 8.21813678741455, 10.346757888793945, 12.475378036499023, 14.603998184204102, 16.732620239257812, 18.86124038696289, 20.9898681640625, 23.118488311767578, 25.247108459472656, 27.375730514526367, 29.504350662231445, 31.632970809936523, 33.761592864990234, 35.89021301269531, 38.01883316040039, 40.14745330810547, 42.27607345581055, 44.404693603515625, 46.53331756591797, 48.66193389892578, 50.790557861328125, 52.9191780090332, 55.04779815673828, 57.17641830444336, 59.30503845214844, 61.433658599853516, 63.562278747558594, 65.69090270996094, 67.81951904296875, 69.9481430053711, 72.07676696777344, 74.20539093017578, 76.3340072631836, 78.46263122558594, 80.59124755859375, 82.7198715209961, 84.8484878540039, 86.97711181640625, 89.10572814941406]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 9.0, 11.0, 39.0, 42.0, 76.0, 154.0, 304.0, 651.0, 1538.0, 4120.0, 16897.0, 144029.0, 2008962.0, 1861032.0, 132911.0, 16786.0, 4113.0, 1428.0, 604.0, 289.0, 124.0, 60.0, 36.0, 26.0, 13.0, 8.0, 9.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.28778076171875, -8.0364990234375, -7.78521728515625, -7.533935546875, -7.28265380859375, -7.0313720703125, -6.78009033203125, -6.52880859375, -6.27752685546875, -6.0262451171875, -5.77496337890625, -5.523681640625, -5.27239990234375, -5.0211181640625, -4.76983642578125, -4.5185546875, -4.26727294921875, -4.0159912109375, -3.76470947265625, -3.513427734375, -3.26214599609375, -3.0108642578125, -2.75958251953125, -2.50830078125, -2.25701904296875, -2.0057373046875, -1.75445556640625, -1.503173828125, -1.25189208984375, -1.0006103515625, -0.74932861328125, -0.498046875, -0.24676513671875, 0.0045166015625, 0.25579833984375, 0.507080078125, 0.75836181640625, 1.0096435546875, 1.26092529296875, 1.51220703125, 1.76348876953125, 2.0147705078125, 2.26605224609375, 2.517333984375, 2.76861572265625, 3.0198974609375, 3.27117919921875, 3.5224609375, 3.77374267578125, 4.0250244140625, 4.27630615234375, 4.527587890625, 4.77886962890625, 5.0301513671875, 5.28143310546875, 5.53271484375, 5.78399658203125, 6.0352783203125, 6.28656005859375, 6.537841796875, 6.78912353515625, 7.0404052734375, 7.29168701171875, 7.54296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 16.0, 18.0, 37.0, 26.0, 31.0, 39.0, 34.0, 47.0, 48.0, 51.0, 45.0, 55.0, 58.0, 50.0, 42.0, 50.0, 51.0, 51.0, 45.0, 27.0, 31.0, 25.0, 21.0, 15.0, 16.0, 20.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.41796875, -3.31927490234375, -3.2205810546875, -3.12188720703125, -3.023193359375, -2.92449951171875, -2.8258056640625, -2.72711181640625, -2.62841796875, -2.52972412109375, -2.4310302734375, -2.33233642578125, -2.233642578125, -2.13494873046875, -2.0362548828125, -1.93756103515625, -1.8388671875, -1.74017333984375, -1.6414794921875, -1.54278564453125, -1.444091796875, -1.34539794921875, -1.2467041015625, -1.14801025390625, -1.04931640625, -0.95062255859375, -0.8519287109375, -0.75323486328125, -0.654541015625, -0.55584716796875, -0.4571533203125, -0.35845947265625, -0.259765625, -0.16107177734375, -0.0623779296875, 0.03631591796875, 0.135009765625, 0.23370361328125, 0.3323974609375, 0.43109130859375, 0.52978515625, 0.62847900390625, 0.7271728515625, 0.82586669921875, 0.924560546875, 1.02325439453125, 1.1219482421875, 1.22064208984375, 1.3193359375, 1.41802978515625, 1.5167236328125, 1.61541748046875, 1.714111328125, 1.81280517578125, 1.9114990234375, 2.01019287109375, 2.10888671875, 2.20758056640625, 2.3062744140625, 2.40496826171875, 2.503662109375, 2.60235595703125, 2.7010498046875, 2.79974365234375, 2.8984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 13.0, 16.0, 28.0, 41.0, 83.0, 132.0, 273.0, 559.0, 1258.0, 3839.0, 38783.0, 4001281.0, 137788.0, 6751.0, 1868.0, 793.0, 340.0, 177.0, 90.0, 65.0, 31.0, 12.0, 13.0, 7.0, 8.0, 9.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.5, -21.850341796875, -21.20068359375, -20.551025390625, -19.9013671875, -19.251708984375, -18.60205078125, -17.952392578125, -17.302734375, -16.653076171875, -16.00341796875, -15.353759765625, -14.7041015625, -14.054443359375, -13.40478515625, -12.755126953125, -12.10546875, -11.455810546875, -10.80615234375, -10.156494140625, -9.5068359375, -8.857177734375, -8.20751953125, -7.557861328125, -6.908203125, -6.258544921875, -5.60888671875, -4.959228515625, -4.3095703125, -3.659912109375, -3.01025390625, -2.360595703125, -1.7109375, -1.061279296875, -0.41162109375, 0.238037109375, 0.8876953125, 1.537353515625, 2.18701171875, 2.836669921875, 3.486328125, 4.135986328125, 4.78564453125, 5.435302734375, 6.0849609375, 6.734619140625, 7.38427734375, 8.033935546875, 8.68359375, 9.333251953125, 9.98291015625, 10.632568359375, 11.2822265625, 11.931884765625, 12.58154296875, 13.231201171875, 13.880859375, 14.530517578125, 15.18017578125, 15.829833984375, 16.4794921875, 17.129150390625, 17.77880859375, 18.428466796875, 19.078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 15.0, 15.0, 29.0, 44.0, 63.0, 77.0, 115.0, 188.0, 271.0, 403.0, 507.0, 600.0, 482.0, 370.0, 231.0, 186.0, 125.0, 93.0, 57.0, 57.0, 35.0, 20.0, 21.0, 14.0, 7.0, 10.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.1898193359375, -4.887451171875, -4.5850830078125, -4.28271484375, -3.9803466796875, -3.677978515625, -3.3756103515625, -3.0732421875, -2.7708740234375, -2.468505859375, -2.1661376953125, -1.86376953125, -1.5614013671875, -1.259033203125, -0.9566650390625, -0.654296875, -0.3519287109375, -0.049560546875, 0.2528076171875, 0.55517578125, 0.8575439453125, 1.159912109375, 1.4622802734375, 1.7646484375, 2.0670166015625, 2.369384765625, 2.6717529296875, 2.97412109375, 3.2764892578125, 3.578857421875, 3.8812255859375, 4.18359375, 4.4859619140625, 4.788330078125, 5.0906982421875, 5.39306640625, 5.6954345703125, 5.997802734375, 6.3001708984375, 6.6025390625, 6.9049072265625, 7.207275390625, 7.5096435546875, 7.81201171875, 8.1143798828125, 8.416748046875, 8.7191162109375, 9.021484375, 9.3238525390625, 9.626220703125, 9.9285888671875, 10.23095703125, 10.5333251953125, 10.835693359375, 11.1380615234375, 11.4404296875, 11.7427978515625, 12.045166015625, 12.3475341796875, 12.64990234375, 12.9522705078125, 13.254638671875, 13.5570068359375, 13.859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 9.0, 23.0, 65.0, 160.0, 275.0, 252.0, 100.0, 44.0, 23.0, 8.0, 7.0, 5.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.3152313232422, -136.5103302001953, -130.70541381835938, -124.9005126953125, -119.09559631347656, -113.29069519042969, -107.48578643798828, -101.68087768554688, -95.87596893310547, -90.07106018066406, -84.26615142822266, -78.46124267578125, -72.65634155273438, -66.85142517089844, -61.04652404785156, -55.241615295410156, -49.43670654296875, -43.631797790527344, -37.82688903808594, -32.0219841003418, -26.21707534790039, -20.412166595458984, -14.607261657714844, -8.802352905273438, -2.9974441528320312, 2.8074636459350586, 8.612371444702148, 14.417278289794922, 20.222187042236328, 26.027095794677734, 31.832000732421875, 37.63690948486328, 43.44183349609375, 49.246742248535156, 55.05165100097656, 60.8565559387207, 66.66146850585938, 72.46636962890625, 78.27127838134766, 84.07618713378906, 89.88109588623047, 95.68600463867188, 101.49091339111328, 107.29582214355469, 113.10072326660156, 118.9056396484375, 124.71054077148438, 130.51544189453125, 136.3203582763672, 142.12525939941406, 147.93017578125, 153.73507690429688, 159.5399932861328, 165.3448944091797, 171.14981079101562, 176.9547119140625, 182.75961303710938, 188.56451416015625, 194.3694305419922, 200.17433166503906, 205.979248046875, 211.78414916992188, 217.58905029296875, 223.3939666748047, 229.19888305664062]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 16.0, 11.0, 16.0, 10.0, 30.0, 22.0, 42.0, 38.0, 45.0, 51.0, 54.0, 53.0, 67.0, 72.0, 92.0, 84.0, 55.0, 56.0, 35.0, 37.0, 25.0, 26.0, 20.0, 14.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-99.5884780883789, -97.29733276367188, -95.00619506835938, -92.71504974365234, -90.42390441894531, -88.13276672363281, -85.84162139892578, -83.55047607421875, -81.25933837890625, -78.96819305419922, -76.67705535888672, -74.38591003417969, -72.09477233886719, -69.80362701416016, -67.51248168945312, -65.22134399414062, -62.930198669433594, -60.63905715942383, -58.34791564941406, -56.05677032470703, -53.765628814697266, -51.4744873046875, -49.18334197998047, -46.8922004699707, -44.60105895996094, -42.30991744995117, -40.018775939941406, -37.727630615234375, -35.43648910522461, -33.145347595214844, -30.854204177856445, -28.563060760498047, -26.271915435791016, -23.98077392578125, -21.68963050842285, -19.398487091064453, -17.107345581054688, -14.816203117370605, -12.525060653686523, -10.233917236328125, -7.942775726318359, -5.651633262634277, -3.3604907989501953, -1.0693483352661133, 1.2217941284179688, 3.512936592102051, 5.804079055786133, 8.095222473144531, 10.386363983154297, 12.677506446838379, 14.968648910522461, 17.25979232788086, 19.550933837890625, 21.84207534790039, 24.13321876525879, 26.424362182617188, 28.715503692626953, 31.00664520263672, 33.29779052734375, 35.588932037353516, 37.88007354736328, 40.17121505737305, 42.46235656738281, 44.753501892089844, 47.04464340209961]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 10.0, 22.0, 27.0, 37.0, 53.0, 75.0, 137.0, 168.0, 369.0, 630.0, 1392.0, 3262.0, 8067.0, 23980.0, 100166.0, 659777.0, 192577.0, 37995.0, 11659.0, 4327.0, 1804.0, 924.0, 442.0, 229.0, 132.0, 97.0, 43.0, 31.0, 24.0, 20.0, 9.0, 8.0, 8.0, 4.0, 13.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.0, -6.80914306640625, -6.6182861328125, -6.42742919921875, -6.236572265625, -6.04571533203125, -5.8548583984375, -5.66400146484375, -5.47314453125, -5.28228759765625, -5.0914306640625, -4.90057373046875, -4.709716796875, -4.51885986328125, -4.3280029296875, -4.13714599609375, -3.9462890625, -3.75543212890625, -3.5645751953125, -3.37371826171875, -3.182861328125, -2.99200439453125, -2.8011474609375, -2.61029052734375, -2.41943359375, -2.22857666015625, -2.0377197265625, -1.84686279296875, -1.656005859375, -1.46514892578125, -1.2742919921875, -1.08343505859375, -0.892578125, -0.70172119140625, -0.5108642578125, -0.32000732421875, -0.129150390625, 0.06170654296875, 0.2525634765625, 0.44342041015625, 0.63427734375, 0.82513427734375, 1.0159912109375, 1.20684814453125, 1.397705078125, 1.58856201171875, 1.7794189453125, 1.97027587890625, 2.1611328125, 2.35198974609375, 2.5428466796875, 2.73370361328125, 2.924560546875, 3.11541748046875, 3.3062744140625, 3.49713134765625, 3.68798828125, 3.87884521484375, 4.0697021484375, 4.26055908203125, 4.451416015625, 4.64227294921875, 4.8331298828125, 5.02398681640625, 5.21484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 13.0, 16.0, 32.0, 36.0, 47.0, 38.0, 61.0, 65.0, 86.0, 95.0, 96.0, 96.0, 59.0, 63.0, 35.0, 37.0, 37.0, 29.0, 18.0, 11.0, 6.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.2578125, -8.07366943359375, -7.8895263671875, -7.70538330078125, -7.521240234375, -7.33709716796875, -7.1529541015625, -6.96881103515625, -6.78466796875, -6.60052490234375, -6.4163818359375, -6.23223876953125, -6.048095703125, -5.86395263671875, -5.6798095703125, -5.49566650390625, -5.3115234375, -5.12738037109375, -4.9432373046875, -4.75909423828125, -4.574951171875, -4.39080810546875, -4.2066650390625, -4.02252197265625, -3.83837890625, -3.65423583984375, -3.4700927734375, -3.28594970703125, -3.101806640625, -2.91766357421875, -2.7335205078125, -2.54937744140625, -2.365234375, -2.18109130859375, -1.9969482421875, -1.81280517578125, -1.628662109375, -1.44451904296875, -1.2603759765625, -1.07623291015625, -0.89208984375, -0.70794677734375, -0.5238037109375, -0.33966064453125, -0.155517578125, 0.02862548828125, 0.2127685546875, 0.39691162109375, 0.5810546875, 0.76519775390625, 0.9493408203125, 1.13348388671875, 1.317626953125, 1.50177001953125, 1.6859130859375, 1.87005615234375, 2.05419921875, 2.23834228515625, 2.4224853515625, 2.60662841796875, 2.790771484375, 2.97491455078125, 3.1590576171875, 3.34320068359375, 3.52734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 10.0, 15.0, 21.0, 29.0, 45.0, 52.0, 102.0, 104.0, 183.0, 323.0, 496.0, 1209.0, 3124.0, 15852.0, 249288.0, 752012.0, 19284.0, 3630.0, 1188.0, 625.0, 307.0, 184.0, 120.0, 110.0, 52.0, 46.0, 35.0, 28.0, 20.0, 12.0, 5.0, 9.0, 8.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.35546875, -7.09320068359375, -6.8309326171875, -6.56866455078125, -6.306396484375, -6.04412841796875, -5.7818603515625, -5.51959228515625, -5.25732421875, -4.99505615234375, -4.7327880859375, -4.47052001953125, -4.208251953125, -3.94598388671875, -3.6837158203125, -3.42144775390625, -3.1591796875, -2.89691162109375, -2.6346435546875, -2.37237548828125, -2.110107421875, -1.84783935546875, -1.5855712890625, -1.32330322265625, -1.06103515625, -0.79876708984375, -0.5364990234375, -0.27423095703125, -0.011962890625, 0.25030517578125, 0.5125732421875, 0.77484130859375, 1.037109375, 1.29937744140625, 1.5616455078125, 1.82391357421875, 2.086181640625, 2.34844970703125, 2.6107177734375, 2.87298583984375, 3.13525390625, 3.39752197265625, 3.6597900390625, 3.92205810546875, 4.184326171875, 4.44659423828125, 4.7088623046875, 4.97113037109375, 5.2333984375, 5.49566650390625, 5.7579345703125, 6.02020263671875, 6.282470703125, 6.54473876953125, 6.8070068359375, 7.06927490234375, 7.33154296875, 7.59381103515625, 7.8560791015625, 8.11834716796875, 8.380615234375, 8.64288330078125, 8.9051513671875, 9.16741943359375, 9.4296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 14.0, 10.0, 7.0, 19.0, 18.0, 22.0, 24.0, 40.0, 37.0, 46.0, 62.0, 89.0, 104.0, 107.0, 74.0, 53.0, 56.0, 39.0, 24.0, 26.0, 26.0, 25.0, 15.0, 11.0, 14.0, 11.0, 4.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.592529296875, -18.06005859375, -17.527587890625, -16.9951171875, -16.462646484375, -15.93017578125, -15.397705078125, -14.865234375, -14.332763671875, -13.80029296875, -13.267822265625, -12.7353515625, -12.202880859375, -11.67041015625, -11.137939453125, -10.60546875, -10.072998046875, -9.54052734375, -9.008056640625, -8.4755859375, -7.943115234375, -7.41064453125, -6.878173828125, -6.345703125, -5.813232421875, -5.28076171875, -4.748291015625, -4.2158203125, -3.683349609375, -3.15087890625, -2.618408203125, -2.0859375, -1.553466796875, -1.02099609375, -0.488525390625, 0.0439453125, 0.576416015625, 1.10888671875, 1.641357421875, 2.173828125, 2.706298828125, 3.23876953125, 3.771240234375, 4.3037109375, 4.836181640625, 5.36865234375, 5.901123046875, 6.43359375, 6.966064453125, 7.49853515625, 8.031005859375, 8.5634765625, 9.095947265625, 9.62841796875, 10.160888671875, 10.693359375, 11.225830078125, 11.75830078125, 12.290771484375, 12.8232421875, 13.355712890625, 13.88818359375, 14.420654296875, 14.953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 6.0, 6.0, 6.0, 12.0, 17.0, 19.0, 28.0, 29.0, 57.0, 83.0, 168.0, 246.0, 508.0, 928.0, 2696.0, 9161.0, 54170.0, 899526.0, 65488.0, 10327.0, 2805.0, 1053.0, 510.0, 228.0, 145.0, 83.0, 42.0, 43.0, 34.0, 19.0, 18.0, 14.0, 15.0, 13.0, 6.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.271484375, -1.231170654296875, -1.19085693359375, -1.150543212890625, -1.1102294921875, -1.069915771484375, -1.02960205078125, -0.989288330078125, -0.948974609375, -0.908660888671875, -0.86834716796875, -0.828033447265625, -0.7877197265625, -0.747406005859375, -0.70709228515625, -0.666778564453125, -0.62646484375, -0.586151123046875, -0.54583740234375, -0.505523681640625, -0.4652099609375, -0.424896240234375, -0.38458251953125, -0.344268798828125, -0.303955078125, -0.263641357421875, -0.22332763671875, -0.183013916015625, -0.1427001953125, -0.102386474609375, -0.06207275390625, -0.021759033203125, 0.0185546875, 0.058868408203125, 0.09918212890625, 0.139495849609375, 0.1798095703125, 0.220123291015625, 0.26043701171875, 0.300750732421875, 0.341064453125, 0.381378173828125, 0.42169189453125, 0.462005615234375, 0.5023193359375, 0.542633056640625, 0.58294677734375, 0.623260498046875, 0.66357421875, 0.703887939453125, 0.74420166015625, 0.784515380859375, 0.8248291015625, 0.865142822265625, 0.90545654296875, 0.945770263671875, 0.986083984375, 1.026397705078125, 1.06671142578125, 1.107025146484375, 1.1473388671875, 1.187652587890625, 1.22796630859375, 1.268280029296875, 1.30859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 21.0, 18.0, 24.0, 20.0, 43.0, 57.0, 86.0, 131.0, 150.0, 125.0, 86.0, 62.0, 49.0, 15.0, 26.0, 17.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030463188886642456, -0.00029431283473968506, -0.00028399378061294556, -0.00027367472648620605, -0.00026335567235946655, -0.00025303661823272705, -0.00024271756410598755, -0.00023239850997924805, -0.00022207945585250854, -0.00021176040172576904, -0.00020144134759902954, -0.00019112229347229004, -0.00018080323934555054, -0.00017048418521881104, -0.00016016513109207153, -0.00014984607696533203, -0.00013952702283859253, -0.00012920796871185303, -0.00011888891458511353, -0.00010856986045837402, -9.825080633163452e-05, -8.793175220489502e-05, -7.761269807815552e-05, -6.729364395141602e-05, -5.6974589824676514e-05, -4.665553569793701e-05, -3.633648157119751e-05, -2.6017427444458008e-05, -1.5698373317718506e-05, -5.379319190979004e-06, 4.939734935760498e-06, 1.52587890625e-05, 2.5577843189239502e-05, 3.5896897315979004e-05, 4.6215951442718506e-05, 5.653500556945801e-05, 6.685405969619751e-05, 7.717311382293701e-05, 8.749216794967651e-05, 9.781122207641602e-05, 0.00010813027620315552, 0.00011844933032989502, 0.00012876838445663452, 0.00013908743858337402, 0.00014940649271011353, 0.00015972554683685303, 0.00017004460096359253, 0.00018036365509033203, 0.00019068270921707153, 0.00020100176334381104, 0.00021132081747055054, 0.00022163987159729004, 0.00023195892572402954, 0.00024227797985076904, 0.00025259703397750854, 0.00026291608810424805, 0.00027323514223098755, 0.00028355419635772705, 0.00029387325048446655, 0.00030419230461120605, 0.00031451135873794556, 0.00032483041286468506, 0.00033514946699142456, 0.00034546852111816406]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 5.0, 10.0, 13.0, 27.0, 28.0, 34.0, 66.0, 71.0, 170.0, 254.0, 472.0, 818.0, 1604.0, 3332.0, 7891.0, 22409.0, 105364.0, 809052.0, 67222.0, 17375.0, 6412.0, 2792.0, 1345.0, 700.0, 383.0, 262.0, 152.0, 95.0, 57.0, 53.0, 28.0, 13.0, 14.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.778717041015625, -0.75128173828125, -0.723846435546875, -0.6964111328125, -0.668975830078125, -0.64154052734375, -0.614105224609375, -0.586669921875, -0.559234619140625, -0.53179931640625, -0.504364013671875, -0.4769287109375, -0.449493408203125, -0.42205810546875, -0.394622802734375, -0.3671875, -0.339752197265625, -0.31231689453125, -0.284881591796875, -0.2574462890625, -0.230010986328125, -0.20257568359375, -0.175140380859375, -0.147705078125, -0.120269775390625, -0.09283447265625, -0.065399169921875, -0.0379638671875, -0.010528564453125, 0.01690673828125, 0.044342041015625, 0.07177734375, 0.099212646484375, 0.12664794921875, 0.154083251953125, 0.1815185546875, 0.208953857421875, 0.23638916015625, 0.263824462890625, 0.291259765625, 0.318695068359375, 0.34613037109375, 0.373565673828125, 0.4010009765625, 0.428436279296875, 0.45587158203125, 0.483306884765625, 0.5107421875, 0.538177490234375, 0.56561279296875, 0.593048095703125, 0.6204833984375, 0.647918701171875, 0.67535400390625, 0.702789306640625, 0.730224609375, 0.757659912109375, 0.78509521484375, 0.812530517578125, 0.8399658203125, 0.867401123046875, 0.89483642578125, 0.922271728515625, 0.94970703125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 21.0, 17.0, 14.0, 17.0, 27.0, 36.0, 43.0, 77.0, 105.0, 104.0, 103.0, 85.0, 79.0, 69.0, 54.0, 28.0, 28.0, 14.0, 11.0, 11.0, 8.0, 6.0, 6.0, 7.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.08685302734375, -1.0496826171875, -1.01251220703125, -0.975341796875, -0.93817138671875, -0.9010009765625, -0.86383056640625, -0.82666015625, -0.78948974609375, -0.7523193359375, -0.71514892578125, -0.677978515625, -0.64080810546875, -0.6036376953125, -0.56646728515625, -0.529296875, -0.49212646484375, -0.4549560546875, -0.41778564453125, -0.380615234375, -0.34344482421875, -0.3062744140625, -0.26910400390625, -0.23193359375, -0.19476318359375, -0.1575927734375, -0.12042236328125, -0.083251953125, -0.04608154296875, -0.0089111328125, 0.02825927734375, 0.0654296875, 0.10260009765625, 0.1397705078125, 0.17694091796875, 0.214111328125, 0.25128173828125, 0.2884521484375, 0.32562255859375, 0.36279296875, 0.39996337890625, 0.4371337890625, 0.47430419921875, 0.511474609375, 0.54864501953125, 0.5858154296875, 0.62298583984375, 0.66015625, 0.69732666015625, 0.7344970703125, 0.77166748046875, 0.808837890625, 0.84600830078125, 0.8831787109375, 0.92034912109375, 0.95751953125, 0.99468994140625, 1.0318603515625, 1.06903076171875, 1.106201171875, 1.14337158203125, 1.1805419921875, 1.21771240234375, 1.2548828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 36.0, 62.0, 229.0, 487.0, 82.0, 38.0, 25.0, 9.0, 1.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.791805267333984, -54.43795394897461, -52.08409881591797, -49.730247497558594, -47.37639617919922, -45.022544860839844, -42.6686897277832, -40.31483840942383, -37.96098327636719, -35.60713195800781, -33.25327682495117, -30.899425506591797, -28.545574188232422, -26.191720962524414, -23.837867736816406, -21.48401641845703, -19.130165100097656, -16.77631187438965, -14.422460556030273, -12.068607330322266, -9.714755058288574, -7.360902786254883, -5.007049560546875, -2.6531982421875, -0.2993450164794922, 2.0545074939727783, 4.408360004425049, 6.762212753295898, 9.11606502532959, 11.469917297363281, 13.823770523071289, 16.177621841430664, 18.531478881835938, 20.885332107543945, 23.23918342590332, 25.593036651611328, 27.946887969970703, 30.30074119567871, 32.65459442138672, 35.008445739746094, 37.36229705810547, 39.716148376464844, 42.070003509521484, 44.42385482788086, 46.777706146240234, 49.131561279296875, 51.48541259765625, 53.839263916015625, 56.193119049072266, 58.54697036743164, 60.90082550048828, 63.254676818847656, 65.60852813720703, 67.9623794555664, 70.31623840332031, 72.67008972167969, 75.02394104003906, 77.37779235839844, 79.73164367675781, 82.08549499511719, 84.4393539428711, 86.79320526123047, 89.14705657958984, 91.50090789794922, 93.8547592163086]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 3.0, 13.0, 8.0, 14.0, 15.0, 22.0, 20.0, 33.0, 23.0, 35.0, 29.0, 96.0, 281.0, 136.0, 42.0, 27.0, 35.0, 29.0, 29.0, 16.0, 9.0, 12.0, 14.0, 8.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.119911193847656, -52.64208221435547, -51.164249420166016, -49.68642044067383, -48.20859146118164, -46.73075866699219, -45.2529296875, -43.77510070800781, -42.297271728515625, -40.81944274902344, -39.341609954833984, -37.8637809753418, -36.38595199584961, -34.908119201660156, -33.43029022216797, -31.95246124267578, -30.474628448486328, -28.996797561645508, -27.51896858215332, -26.0411376953125, -24.563308715820312, -23.085477828979492, -21.607646942138672, -20.129817962646484, -18.651987075805664, -17.174156188964844, -15.696327209472656, -14.218496322631836, -12.740666389465332, -11.262836456298828, -9.785005569458008, -8.307175636291504, -6.829349517822266, -5.351519584655762, -3.8736891746520996, -2.3958587646484375, -0.9180288314819336, 0.5598011016845703, 2.0376319885253906, 3.5154619216918945, 4.993291854858398, 6.471121788024902, 7.9489521980285645, 9.426782608032227, 10.90461254119873, 12.382442474365234, 13.860273361206055, 15.338103294372559, 16.815933227539062, 18.293764114379883, 19.77159309387207, 21.24942398071289, 22.727252960205078, 24.2050838470459, 25.68291473388672, 27.160743713378906, 28.638574600219727, 30.116405487060547, 31.594234466552734, 33.07206726074219, 34.549896240234375, 36.02772521972656, 37.50555419921875, 38.9833869934082, 40.46121597290039]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 12.0, 15.0, 13.0, 23.0, 31.0, 25.0, 27.0, 30.0, 58.0, 73.0, 308.0, 113.0, 44.0, 34.0, 35.0, 34.0, 18.0, 17.0, 17.0, 18.0, 11.0, 11.0, 14.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -5.0572509765625, -4.915283203125, -4.7733154296875, -4.63134765625, -4.4893798828125, -4.347412109375, -4.2054443359375, -4.0634765625, -3.9215087890625, -3.779541015625, -3.6375732421875, -3.49560546875, -3.3536376953125, -3.211669921875, -3.0697021484375, -2.927734375, -2.7857666015625, -2.643798828125, -2.5018310546875, -2.35986328125, -2.2178955078125, -2.075927734375, -1.9339599609375, -1.7919921875, -1.6500244140625, -1.508056640625, -1.3660888671875, -1.22412109375, -1.0821533203125, -0.940185546875, -0.7982177734375, -0.65625, -0.5142822265625, -0.372314453125, -0.2303466796875, -0.08837890625, 0.0535888671875, 0.195556640625, 0.3375244140625, 0.4794921875, 0.6214599609375, 0.763427734375, 0.9053955078125, 1.04736328125, 1.1893310546875, 1.331298828125, 1.4732666015625, 1.615234375, 1.7572021484375, 1.899169921875, 2.0411376953125, 2.18310546875, 2.3250732421875, 2.467041015625, 2.6090087890625, 2.7509765625, 2.8929443359375, 3.034912109375, 3.1768798828125, 3.31884765625, 3.4608154296875, 3.602783203125, 3.7447509765625, 3.88671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 4.0, 5.0, 5.0, 10.0, 12.0, 23.0, 55.0, 76.0, 136.0, 264.0, 856.0, 4447.0, 8220793.0, 157089.0, 3456.0, 730.0, 251.0, 140.0, 67.0, 39.0, 32.0, 26.0, 15.0, 6.0, 11.0, 9.0, 9.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.8764762878418, -51.318721771240234, -49.760963439941406, -48.203208923339844, -46.645450592041016, -45.08769607543945, -43.529937744140625, -41.97218322753906, -40.414424896240234, -38.85667037963867, -37.298912048339844, -35.74115753173828, -34.18339920043945, -32.62564468383789, -31.067886352539062, -29.5101318359375, -27.952375411987305, -26.39461898803711, -24.836862564086914, -23.27910614013672, -21.721349716186523, -20.163593292236328, -18.605838775634766, -17.048080444335938, -15.490324974060059, -13.932568550109863, -12.374812126159668, -10.817056655883789, -9.259300231933594, -7.70154333114624, -6.143787384033203, -4.586030960083008, -3.0282745361328125, -1.4705182313919067, 0.08723807334899902, 1.6449942588806152, 3.2027506828308105, 4.760507106781006, 6.318263053894043, 7.876019477844238, 9.433775901794434, 10.991532325744629, 12.549288749694824, 14.107044219970703, 15.664800643920898, 17.222557067871094, 18.78031349182129, 20.338069915771484, 21.89582633972168, 23.453582763671875, 25.01133918762207, 26.569095611572266, 28.12685203552246, 29.684608459472656, 31.24236297607422, 32.80012130737305, 34.35787582397461, 35.91563034057617, 37.473388671875, 39.03114318847656, 40.58890151977539, 42.14665603637695, 43.70441436767578, 45.262168884277344, 46.81992721557617]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.03524017333984, -86.53360748291016, -84.031982421875, -81.53034973144531, -79.02871704101562, -76.52708435058594, -74.02545166015625, -71.5238265991211, -69.0221939086914, -66.52056121826172, -64.01893615722656, -61.517303466796875, -59.01567077636719, -56.5140380859375, -54.01240921020508, -51.510780334472656, -49.00914764404297, -46.50751495361328, -44.00588607788086, -41.50425720214844, -39.00262451171875, -36.50099182128906, -33.99936294555664, -31.497732162475586, -28.99610137939453, -26.494470596313477, -23.992839813232422, -21.491209030151367, -18.989578247070312, -16.487947463989258, -13.986316680908203, -11.484685897827148, -8.983055114746094, -6.481424331665039, -3.9797935485839844, -1.4781627655029297, 1.023468017578125, 3.5250988006591797, 6.026729583740234, 8.528360366821289, 11.029991149902344, 13.531621932983398, 16.033252716064453, 18.534883499145508, 21.036514282226562, 23.538145065307617, 26.039775848388672, 28.541406631469727, 31.04303741455078, 33.54467010498047, 36.04629898071289, 38.54792785644531, 41.049560546875, 43.55119323730469, 46.05282211303711, 48.55445098876953, 51.05608367919922, 53.557716369628906, 56.05934524536133, 58.56097412109375, 61.06260681152344, 63.564239501953125, 66.06587219238281, 68.56749725341797, 71.06912994384766]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 11.0, 17.0, 16.0, 23.0, 49.0, 64.0, 116.0, 194.0, 373.0, 911.0, 2339.0, 8467.0, 36631.0, 175235.0, 228851.0, 53943.0, 11926.0, 3112.0, 1003.0, 434.0, 231.0, 122.0, 70.0, 49.0, 34.0, 11.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.25, -46.042236328125, -44.83447265625, -43.626708984375, -42.4189453125, -41.211181640625, -40.00341796875, -38.795654296875, -37.587890625, -36.380126953125, -35.17236328125, -33.964599609375, -32.7568359375, -31.549072265625, -30.34130859375, -29.133544921875, -27.92578125, -26.718017578125, -25.51025390625, -24.302490234375, -23.0947265625, -21.886962890625, -20.67919921875, -19.471435546875, -18.263671875, -17.055908203125, -15.84814453125, -14.640380859375, -13.4326171875, -12.224853515625, -11.01708984375, -9.809326171875, -8.6015625, -7.393798828125, -6.18603515625, -4.978271484375, -3.7705078125, -2.562744140625, -1.35498046875, -0.147216796875, 1.060546875, 2.268310546875, 3.47607421875, 4.683837890625, 5.8916015625, 7.099365234375, 8.30712890625, 9.514892578125, 10.72265625, 11.930419921875, 13.13818359375, 14.345947265625, 15.5537109375, 16.761474609375, 17.96923828125, 19.177001953125, 20.384765625, 21.592529296875, 22.80029296875, 24.008056640625, 25.2158203125, 26.423583984375, 27.63134765625, 28.839111328125, 30.046875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 9.0, 14.0, 18.0, 19.0, 44.0, 32.0, 65.0, 78.0, 105.0, 117.0, 100.0, 86.0, 75.0, 76.0, 52.0, 25.0, 27.0, 23.0, 12.0, 6.0, 9.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.42034912109375, -8.2156982421875, -8.01104736328125, -7.806396484375, -7.60174560546875, -7.3970947265625, -7.19244384765625, -6.98779296875, -6.78314208984375, -6.5784912109375, -6.37384033203125, -6.169189453125, -5.96453857421875, -5.7598876953125, -5.55523681640625, -5.3505859375, -5.14593505859375, -4.9412841796875, -4.73663330078125, -4.531982421875, -4.32733154296875, -4.1226806640625, -3.91802978515625, -3.71337890625, -3.50872802734375, -3.3040771484375, -3.09942626953125, -2.894775390625, -2.69012451171875, -2.4854736328125, -2.28082275390625, -2.076171875, -1.87152099609375, -1.6668701171875, -1.46221923828125, -1.257568359375, -1.05291748046875, -0.8482666015625, -0.64361572265625, -0.43896484375, -0.23431396484375, -0.0296630859375, 0.17498779296875, 0.379638671875, 0.58428955078125, 0.7889404296875, 0.99359130859375, 1.1982421875, 1.40289306640625, 1.6075439453125, 1.81219482421875, 2.016845703125, 2.22149658203125, 2.4261474609375, 2.63079833984375, 2.83544921875, 3.04010009765625, 3.2447509765625, 3.44940185546875, 3.654052734375, 3.85870361328125, 4.0633544921875, 4.26800537109375, 4.47265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 10.0, 15.0, 22.0, 65.0, 116.0, 115.0, 68.0, 32.0, 13.0, 9.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.691261291503906, -17.985809326171875, -16.280357360839844, -14.574905395507812, -12.869453430175781, -11.164000511169434, -9.458548545837402, -7.753096580505371, -6.04764461517334, -4.342192649841309, -2.6367404460906982, -0.9312882423400879, 0.7741637229919434, 2.479616165161133, 4.185068130493164, 5.890520095825195, 7.595972061157227, 9.301424026489258, 11.006875991821289, 12.71232795715332, 14.417779922485352, 16.123233795166016, 17.828685760498047, 19.534137725830078, 21.23958969116211, 22.94504165649414, 24.650493621826172, 26.355945587158203, 28.061397552490234, 29.766849517822266, 31.472301483154297, 33.17775344848633, 34.88320541381836, 36.58865737915039, 38.29410934448242, 39.99956130981445, 41.705013275146484, 43.410465240478516, 45.11591720581055, 46.82136917114258, 48.52682113647461, 50.23227310180664, 51.93772506713867, 53.6431770324707, 55.348628997802734, 57.054080963134766, 58.7595329284668, 60.46498489379883, 62.170440673828125, 63.875892639160156, 65.58134460449219, 67.28679656982422, 68.99224853515625, 70.69770050048828, 72.40315246582031, 74.10860443115234, 75.81405639648438, 77.5195083618164, 79.22496032714844, 80.93041229248047, 82.6358642578125, 84.34131622314453, 86.04676818847656, 87.7522201538086, 89.45767211914062]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 12.0, 11.0, 11.0, 23.0, 32.0, 34.0, 54.0, 54.0, 52.0, 55.0, 36.0, 21.0, 14.0, 6.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.25200653076172, -25.577444076538086, -24.90287971496582, -24.228317260742188, -23.553752899169922, -22.87919044494629, -22.204627990722656, -21.53006362915039, -20.855501174926758, -20.180938720703125, -19.50637435913086, -18.831811904907227, -18.157249450683594, -17.482685089111328, -16.808122634887695, -16.133560180664062, -15.458995819091797, -14.784432411193848, -14.109869003295898, -13.435306549072266, -12.760743141174316, -12.086179733276367, -11.411617279052734, -10.737053871154785, -10.062490463256836, -9.387927055358887, -8.713363647460938, -8.038801193237305, -7.3642377853393555, -6.689674377441406, -6.015111446380615, -5.340548515319824, -4.665983200073242, -3.991420030593872, -3.316856861114502, -2.642293691635132, -1.9677305221557617, -1.2931673526763916, -0.6186041831970215, 0.05595874786376953, 0.7305221557617188, 1.4050853252410889, 2.079648494720459, 2.754211664199829, 3.428774833679199, 4.103338241577148, 4.7779011726379395, 5.4524641036987305, 6.12702751159668, 6.801590919494629, 7.47615385055542, 8.150716781616211, 8.82528018951416, 9.49984359741211, 10.174406051635742, 10.848969459533691, 11.52353286743164, 12.19809627532959, 12.872659683227539, 13.547222137451172, 14.221785545349121, 14.89634895324707, 15.570911407470703, 16.24547576904297, 16.9200382232666]}, "eval/loss": 5.550400733947754, "eval/wer": 1.6345101150337167, "eval/runtime": 689.3225, "eval/samples_per_second": 3.833, "eval/steps_per_second": 0.48} \ No newline at end of file +{"train/loss": 4.1412, "train/learning_rate": 2.377019002375297e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 26336, "_timestamp": 1646973575, "_step": 4502, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 16.0, 19.0, 16.0, 25.0, 26.0, 23.0, 31.0, 30.0, 27.0, 35.0, 43.0, 48.0, 44.0, 37.0, 37.0, 44.0, 41.0, 40.0, 62.0, 32.0, 43.0, 42.0, 20.0, 22.0, 22.0, 20.0, 21.0, 15.0, 9.0, 8.0, 19.0, 13.0, 3.0, 12.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0], "bins": [-42.2806282043457, -41.339698791503906, -40.39876937866211, -39.45783996582031, -38.516910552978516, -37.57598114013672, -36.63505172729492, -35.694122314453125, -34.75318908691406, -33.812259674072266, -32.87133026123047, -31.930400848388672, -30.989471435546875, -30.048542022705078, -29.10761070251465, -28.16668128967285, -27.225753784179688, -26.28482437133789, -25.343894958496094, -24.402965545654297, -23.4620361328125, -22.521106719970703, -21.580175399780273, -20.639245986938477, -19.69831657409668, -18.757387161254883, -17.816457748413086, -16.87552833557129, -15.934597969055176, -14.993668556213379, -14.052738189697266, -13.111808776855469, -12.170879364013672, -11.229949951171875, -10.289020538330078, -9.348090171813965, -8.407160758972168, -7.466231346130371, -6.525301456451416, -5.584371566772461, -4.643442153930664, -3.702512502670288, -2.761582851409912, -1.8206532001495361, -0.8797235488891602, 0.06120586395263672, 1.0021357536315918, 1.9430656433105469, 2.8839950561523438, 3.8249247074127197, 4.765854358673096, 5.706784248352051, 6.647713661193848, 7.5886430740356445, 8.529573440551758, 9.470502853393555, 10.411432266235352, 11.352361679077148, 12.293291091918945, 13.234221458435059, 14.175150871276855, 15.116080284118652, 16.057010650634766, 16.997940063476562, 17.93886947631836]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 4.0, 4.0, 11.0, 11.0, 16.0, 14.0, 17.0, 19.0, 28.0, 15.0, 24.0, 36.0, 22.0, 28.0, 33.0, 37.0, 48.0, 33.0, 50.0, 43.0, 40.0, 33.0, 42.0, 30.0, 37.0, 29.0, 36.0, 35.0, 29.0, 26.0, 20.0, 20.0, 18.0, 15.0, 15.0, 14.0, 8.0, 8.0, 10.0, 9.0, 15.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-29.311256408691406, -28.399648666381836, -27.488040924072266, -26.576435089111328, -25.664827346801758, -24.753219604492188, -23.84161376953125, -22.93000602722168, -22.01839828491211, -21.10679054260254, -20.19518280029297, -19.28357696533203, -18.37196922302246, -17.46036148071289, -16.548755645751953, -15.637147903442383, -14.725540161132812, -13.813932418823242, -12.902325630187988, -11.990718841552734, -11.079111099243164, -10.167503356933594, -9.25589656829834, -8.344289779663086, -7.432682037353516, -6.5210747718811035, -5.609467506408691, -4.697860240936279, -3.786252975463867, -2.874645709991455, -1.963038444519043, -1.0514311790466309, -0.13982391357421875, 0.7717833518981934, 1.6833906173706055, 2.5949978828430176, 3.5066051483154297, 4.418212413787842, 5.329819679260254, 6.241426944732666, 7.153034210205078, 8.064641952514648, 8.976248741149902, 9.887855529785156, 10.799463272094727, 11.711071014404297, 12.62267780303955, 13.534284591674805, 14.445892333984375, 15.357500076293945, 16.269107818603516, 17.180713653564453, 18.092321395874023, 19.003929138183594, 19.91553497314453, 20.8271427154541, 21.738750457763672, 22.650358200073242, 23.561965942382812, 24.47357177734375, 25.38517951965332, 26.29678726196289, 27.208393096923828, 28.1200008392334, 29.03160858154297]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 15.0, 24.0, 40.0, 62.0, 114.0, 172.0, 290.0, 473.0, 764.0, 1333.0, 2112.0, 3487.0, 5759.0, 9340.0, 15651.0, 25496.0, 41852.0, 67260.0, 107386.0, 165906.0, 246856.0, 346236.0, 451914.0, 523195.0, 534264.0, 476618.0, 378867.0, 275181.0, 187836.0, 122050.0, 78364.0, 48769.0, 29970.0, 18265.0, 11198.0, 6773.0, 4091.0, 2444.0, 1536.0, 933.0, 565.0, 314.0, 198.0, 122.0, 72.0, 41.0, 30.0, 20.0, 11.0, 9.0, 5.0, 3.0, 1.0, 2.0], "bins": [-25.78125, -25.0263671875, -24.271484375, -23.5166015625, -22.76171875, -22.0068359375, -21.251953125, -20.4970703125, -19.7421875, -18.9873046875, -18.232421875, -17.4775390625, -16.72265625, -15.9677734375, -15.212890625, -14.4580078125, -13.703125, -12.9482421875, -12.193359375, -11.4384765625, -10.68359375, -9.9287109375, -9.173828125, -8.4189453125, -7.6640625, -6.9091796875, -6.154296875, -5.3994140625, -4.64453125, -3.8896484375, -3.134765625, -2.3798828125, -1.625, -0.8701171875, -0.115234375, 0.6396484375, 1.39453125, 2.1494140625, 2.904296875, 3.6591796875, 4.4140625, 5.1689453125, 5.923828125, 6.6787109375, 7.43359375, 8.1884765625, 8.943359375, 9.6982421875, 10.453125, 11.2080078125, 11.962890625, 12.7177734375, 13.47265625, 14.2275390625, 14.982421875, 15.7373046875, 16.4921875, 17.2470703125, 18.001953125, 18.7568359375, 19.51171875, 20.2666015625, 21.021484375, 21.7763671875, 22.53125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 11.0, 12.0, 13.0, 22.0, 24.0, 21.0, 24.0, 20.0, 23.0, 36.0, 31.0, 33.0, 42.0, 55.0, 51.0, 50.0, 40.0, 51.0, 36.0, 46.0, 39.0, 40.0, 36.0, 29.0, 29.0, 31.0, 20.0, 21.0, 17.0, 19.0, 16.0, 9.0, 9.0, 12.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.328125, -27.482421875, -26.63671875, -25.791015625, -24.9453125, -24.099609375, -23.25390625, -22.408203125, -21.5625, -20.716796875, -19.87109375, -19.025390625, -18.1796875, -17.333984375, -16.48828125, -15.642578125, -14.796875, -13.951171875, -13.10546875, -12.259765625, -11.4140625, -10.568359375, -9.72265625, -8.876953125, -8.03125, -7.185546875, -6.33984375, -5.494140625, -4.6484375, -3.802734375, -2.95703125, -2.111328125, -1.265625, -0.419921875, 0.42578125, 1.271484375, 2.1171875, 2.962890625, 3.80859375, 4.654296875, 5.5, 6.345703125, 7.19140625, 8.037109375, 8.8828125, 9.728515625, 10.57421875, 11.419921875, 12.265625, 13.111328125, 13.95703125, 14.802734375, 15.6484375, 16.494140625, 17.33984375, 18.185546875, 19.03125, 19.876953125, 20.72265625, 21.568359375, 22.4140625, 23.259765625, 24.10546875, 24.951171875, 25.796875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 9.0, 20.0, 37.0, 59.0, 113.0, 226.0, 379.0, 584.0, 992.0, 1585.0, 2686.0, 4576.0, 7191.0, 11699.0, 18647.0, 29025.0, 44407.0, 66810.0, 98627.0, 139641.0, 191471.0, 250466.0, 314180.0, 370967.0, 409960.0, 419632.0, 396815.0, 350473.0, 292866.0, 228847.0, 171265.0, 123068.0, 85538.0, 57256.0, 38031.0, 24893.0, 15760.0, 9962.0, 6111.0, 3782.0, 2303.0, 1395.0, 802.0, 464.0, 274.0, 156.0, 108.0, 58.0, 37.0, 9.0, 14.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.40673828125, -18.7666015625, -18.12646484375, -17.486328125, -16.84619140625, -16.2060546875, -15.56591796875, -14.92578125, -14.28564453125, -13.6455078125, -13.00537109375, -12.365234375, -11.72509765625, -11.0849609375, -10.44482421875, -9.8046875, -9.16455078125, -8.5244140625, -7.88427734375, -7.244140625, -6.60400390625, -5.9638671875, -5.32373046875, -4.68359375, -4.04345703125, -3.4033203125, -2.76318359375, -2.123046875, -1.48291015625, -0.8427734375, -0.20263671875, 0.4375, 1.07763671875, 1.7177734375, 2.35791015625, 2.998046875, 3.63818359375, 4.2783203125, 4.91845703125, 5.55859375, 6.19873046875, 6.8388671875, 7.47900390625, 8.119140625, 8.75927734375, 9.3994140625, 10.03955078125, 10.6796875, 11.31982421875, 11.9599609375, 12.60009765625, 13.240234375, 13.88037109375, 14.5205078125, 15.16064453125, 15.80078125, 16.44091796875, 17.0810546875, 17.72119140625, 18.361328125, 19.00146484375, 19.6416015625, 20.28173828125, 20.921875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 20.0, 19.0, 29.0, 33.0, 29.0, 38.0, 59.0, 81.0, 93.0, 92.0, 114.0, 117.0, 145.0, 144.0, 150.0, 213.0, 182.0, 200.0, 192.0, 187.0, 189.0, 200.0, 193.0, 137.0, 150.0, 148.0, 126.0, 119.0, 108.0, 80.0, 82.0, 63.0, 56.0, 39.0, 34.0, 41.0, 34.0, 19.0, 17.0, 21.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0], "bins": [-9.9140625, -9.5814208984375, -9.248779296875, -8.9161376953125, -8.58349609375, -8.2508544921875, -7.918212890625, -7.5855712890625, -7.2529296875, -6.9202880859375, -6.587646484375, -6.2550048828125, -5.92236328125, -5.5897216796875, -5.257080078125, -4.9244384765625, -4.591796875, -4.2591552734375, -3.926513671875, -3.5938720703125, -3.26123046875, -2.9285888671875, -2.595947265625, -2.2633056640625, -1.9306640625, -1.5980224609375, -1.265380859375, -0.9327392578125, -0.60009765625, -0.2674560546875, 0.065185546875, 0.3978271484375, 0.73046875, 1.0631103515625, 1.395751953125, 1.7283935546875, 2.06103515625, 2.3936767578125, 2.726318359375, 3.0589599609375, 3.3916015625, 3.7242431640625, 4.056884765625, 4.3895263671875, 4.72216796875, 5.0548095703125, 5.387451171875, 5.7200927734375, 6.052734375, 6.3853759765625, 6.718017578125, 7.0506591796875, 7.38330078125, 7.7159423828125, 8.048583984375, 8.3812255859375, 8.7138671875, 9.0465087890625, 9.379150390625, 9.7117919921875, 10.04443359375, 10.3770751953125, 10.709716796875, 11.0423583984375, 11.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 11.0, 16.0, 22.0, 31.0, 29.0, 31.0, 34.0, 41.0, 38.0, 35.0, 49.0, 42.0, 61.0, 43.0, 34.0, 60.0, 44.0, 41.0, 45.0, 44.0, 41.0, 22.0, 29.0, 28.0, 15.0, 14.0, 20.0, 13.0, 15.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.362350463867188, -30.337923049926758, -29.313495635986328, -28.28907012939453, -27.2646427154541, -26.240215301513672, -25.215787887573242, -24.191360473632812, -23.166934967041016, -22.142507553100586, -21.118080139160156, -20.09365463256836, -19.06922721862793, -18.0447998046875, -17.02037239074707, -15.99594497680664, -14.971517562866211, -13.947090148925781, -12.922663688659668, -11.898236274719238, -10.873809814453125, -9.849382400512695, -8.824954986572266, -7.800528049468994, -6.776101112365723, -5.751674175262451, -4.72724723815918, -3.70281982421875, -2.6783928871154785, -1.653965950012207, -0.6295385360717773, 0.39488840103149414, 1.4193153381347656, 2.443742275238037, 3.4681694507598877, 4.492596626281738, 5.51702356338501, 6.541450500488281, 7.565877914428711, 8.59030532836914, 9.614731788635254, 10.639159202575684, 11.663585662841797, 12.688013076782227, 13.712440490722656, 14.73686695098877, 15.7612943649292, 16.785720825195312, 17.810148239135742, 18.834575653076172, 19.8590030670166, 20.88343048095703, 21.907855987548828, 22.932283401489258, 23.956710815429688, 24.981138229370117, 26.005565643310547, 27.029993057250977, 28.054420471191406, 29.078845977783203, 30.103273391723633, 31.127700805664062, 32.152130126953125, 33.17655563354492, 34.20098114013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 5.0, 3.0, 11.0, 10.0, 16.0, 8.0, 16.0, 23.0, 25.0, 22.0, 23.0, 28.0, 25.0, 31.0, 38.0, 49.0, 27.0, 47.0, 39.0, 36.0, 43.0, 41.0, 41.0, 41.0, 28.0, 30.0, 40.0, 40.0, 26.0, 29.0, 25.0, 17.0, 20.0, 8.0, 12.0, 16.0, 12.0, 4.0, 12.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-32.368343353271484, -31.437801361083984, -30.507261276245117, -29.57672119140625, -28.64617919921875, -27.71563720703125, -26.785097122192383, -25.854557037353516, -24.924015045166016, -23.993473052978516, -23.06293296813965, -22.13239288330078, -21.20185089111328, -20.27130889892578, -19.340768814086914, -18.410228729248047, -17.479686737060547, -16.549144744873047, -15.61860466003418, -14.688063621520996, -13.757522583007812, -12.826981544494629, -11.896440505981445, -10.965899467468262, -10.035358428955078, -9.104817390441895, -8.174276351928711, -7.243735313415527, -6.313194274902344, -5.38265323638916, -4.452112197875977, -3.521571159362793, -2.5910301208496094, -1.6604890823364258, -0.7299480438232422, 0.2005929946899414, 1.131134033203125, 2.0616750717163086, 2.992216110229492, 3.922757148742676, 4.853298187255859, 5.783839225769043, 6.714380264282227, 7.64492130279541, 8.575462341308594, 9.506003379821777, 10.436544418334961, 11.367085456848145, 12.297626495361328, 13.228167533874512, 14.158708572387695, 15.089249610900879, 16.019790649414062, 16.950332641601562, 17.88087272644043, 18.811412811279297, 19.741954803466797, 20.672496795654297, 21.603036880493164, 22.53357696533203, 23.46411895751953, 24.39466094970703, 25.3252010345459, 26.255741119384766, 27.186283111572266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 8.0, 4.0, 7.0, 9.0, 13.0, 17.0, 38.0, 42.0, 46.0, 67.0, 104.0, 104.0, 157.0, 261.0, 365.0, 512.0, 816.0, 1129.0, 1839.0, 2883.0, 4514.0, 7381.0, 12738.0, 23542.0, 46088.0, 99954.0, 230889.0, 317081.0, 153661.0, 68052.0, 32768.0, 17429.0, 9788.0, 5814.0, 3557.0, 2298.0, 1473.0, 1021.0, 695.0, 404.0, 272.0, 190.0, 153.0, 102.0, 66.0, 56.0, 38.0, 38.0, 24.0, 16.0, 17.0, 5.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.0, -18.3720703125, -17.744140625, -17.1162109375, -16.48828125, -15.8603515625, -15.232421875, -14.6044921875, -13.9765625, -13.3486328125, -12.720703125, -12.0927734375, -11.46484375, -10.8369140625, -10.208984375, -9.5810546875, -8.953125, -8.3251953125, -7.697265625, -7.0693359375, -6.44140625, -5.8134765625, -5.185546875, -4.5576171875, -3.9296875, -3.3017578125, -2.673828125, -2.0458984375, -1.41796875, -0.7900390625, -0.162109375, 0.4658203125, 1.09375, 1.7216796875, 2.349609375, 2.9775390625, 3.60546875, 4.2333984375, 4.861328125, 5.4892578125, 6.1171875, 6.7451171875, 7.373046875, 8.0009765625, 8.62890625, 9.2568359375, 9.884765625, 10.5126953125, 11.140625, 11.7685546875, 12.396484375, 13.0244140625, 13.65234375, 14.2802734375, 14.908203125, 15.5361328125, 16.1640625, 16.7919921875, 17.419921875, 18.0478515625, 18.67578125, 19.3037109375, 19.931640625, 20.5595703125, 21.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 9.0, 5.0, 6.0, 4.0, 12.0, 8.0, 15.0, 8.0, 18.0, 21.0, 26.0, 23.0, 22.0, 29.0, 26.0, 29.0, 38.0, 48.0, 26.0, 50.0, 42.0, 37.0, 39.0, 40.0, 45.0, 39.0, 27.0, 31.0, 37.0, 42.0, 30.0, 28.0, 22.0, 19.0, 18.0, 9.0, 11.0, 15.0, 13.0, 6.0, 9.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-32.1875, -31.26416015625, -30.3408203125, -29.41748046875, -28.494140625, -27.57080078125, -26.6474609375, -25.72412109375, -24.80078125, -23.87744140625, -22.9541015625, -22.03076171875, -21.107421875, -20.18408203125, -19.2607421875, -18.33740234375, -17.4140625, -16.49072265625, -15.5673828125, -14.64404296875, -13.720703125, -12.79736328125, -11.8740234375, -10.95068359375, -10.02734375, -9.10400390625, -8.1806640625, -7.25732421875, -6.333984375, -5.41064453125, -4.4873046875, -3.56396484375, -2.640625, -1.71728515625, -0.7939453125, 0.12939453125, 1.052734375, 1.97607421875, 2.8994140625, 3.82275390625, 4.74609375, 5.66943359375, 6.5927734375, 7.51611328125, 8.439453125, 9.36279296875, 10.2861328125, 11.20947265625, 12.1328125, 13.05615234375, 13.9794921875, 14.90283203125, 15.826171875, 16.74951171875, 17.6728515625, 18.59619140625, 19.51953125, 20.44287109375, 21.3662109375, 22.28955078125, 23.212890625, 24.13623046875, 25.0595703125, 25.98291015625, 26.90625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 8.0, 8.0, 13.0, 16.0, 19.0, 26.0, 31.0, 40.0, 57.0, 61.0, 107.0, 147.0, 238.0, 293.0, 459.0, 737.0, 1280.0, 2222.0, 4199.0, 9109.0, 24001.0, 96661.0, 623176.0, 220860.0, 38998.0, 12852.0, 5719.0, 2842.0, 1596.0, 953.0, 582.0, 391.0, 231.0, 176.0, 115.0, 92.0, 58.0, 48.0, 39.0, 26.0, 30.0, 9.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -31.00634765625, -30.0283203125, -29.05029296875, -28.072265625, -27.09423828125, -26.1162109375, -25.13818359375, -24.16015625, -23.18212890625, -22.2041015625, -21.22607421875, -20.248046875, -19.27001953125, -18.2919921875, -17.31396484375, -16.3359375, -15.35791015625, -14.3798828125, -13.40185546875, -12.423828125, -11.44580078125, -10.4677734375, -9.48974609375, -8.51171875, -7.53369140625, -6.5556640625, -5.57763671875, -4.599609375, -3.62158203125, -2.6435546875, -1.66552734375, -0.6875, 0.29052734375, 1.2685546875, 2.24658203125, 3.224609375, 4.20263671875, 5.1806640625, 6.15869140625, 7.13671875, 8.11474609375, 9.0927734375, 10.07080078125, 11.048828125, 12.02685546875, 13.0048828125, 13.98291015625, 14.9609375, 15.93896484375, 16.9169921875, 17.89501953125, 18.873046875, 19.85107421875, 20.8291015625, 21.80712890625, 22.78515625, 23.76318359375, 24.7412109375, 25.71923828125, 26.697265625, 27.67529296875, 28.6533203125, 29.63134765625, 30.609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 11.0, 8.0, 6.0, 9.0, 17.0, 10.0, 16.0, 22.0, 18.0, 30.0, 22.0, 28.0, 30.0, 38.0, 28.0, 33.0, 28.0, 37.0, 39.0, 36.0, 34.0, 41.0, 41.0, 41.0, 40.0, 35.0, 30.0, 34.0, 40.0, 27.0, 24.0, 23.0, 18.0, 21.0, 8.0, 14.0, 9.0, 14.0, 6.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-23.4375, -22.77880859375, -22.1201171875, -21.46142578125, -20.802734375, -20.14404296875, -19.4853515625, -18.82666015625, -18.16796875, -17.50927734375, -16.8505859375, -16.19189453125, -15.533203125, -14.87451171875, -14.2158203125, -13.55712890625, -12.8984375, -12.23974609375, -11.5810546875, -10.92236328125, -10.263671875, -9.60498046875, -8.9462890625, -8.28759765625, -7.62890625, -6.97021484375, -6.3115234375, -5.65283203125, -4.994140625, -4.33544921875, -3.6767578125, -3.01806640625, -2.359375, -1.70068359375, -1.0419921875, -0.38330078125, 0.275390625, 0.93408203125, 1.5927734375, 2.25146484375, 2.91015625, 3.56884765625, 4.2275390625, 4.88623046875, 5.544921875, 6.20361328125, 6.8623046875, 7.52099609375, 8.1796875, 8.83837890625, 9.4970703125, 10.15576171875, 10.814453125, 11.47314453125, 12.1318359375, 12.79052734375, 13.44921875, 14.10791015625, 14.7666015625, 15.42529296875, 16.083984375, 16.74267578125, 17.4013671875, 18.06005859375, 18.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 12.0, 25.0, 31.0, 44.0, 90.0, 135.0, 206.0, 338.0, 661.0, 1342.0, 2769.0, 6786.0, 21086.0, 121588.0, 761989.0, 100739.0, 18908.0, 6286.0, 2629.0, 1182.0, 699.0, 356.0, 213.0, 125.0, 75.0, 59.0, 46.0, 29.0, 18.0, 18.0, 9.0, 12.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.1142578125, -18.525390625, -17.9365234375, -17.34765625, -16.7587890625, -16.169921875, -15.5810546875, -14.9921875, -14.4033203125, -13.814453125, -13.2255859375, -12.63671875, -12.0478515625, -11.458984375, -10.8701171875, -10.28125, -9.6923828125, -9.103515625, -8.5146484375, -7.92578125, -7.3369140625, -6.748046875, -6.1591796875, -5.5703125, -4.9814453125, -4.392578125, -3.8037109375, -3.21484375, -2.6259765625, -2.037109375, -1.4482421875, -0.859375, -0.2705078125, 0.318359375, 0.9072265625, 1.49609375, 2.0849609375, 2.673828125, 3.2626953125, 3.8515625, 4.4404296875, 5.029296875, 5.6181640625, 6.20703125, 6.7958984375, 7.384765625, 7.9736328125, 8.5625, 9.1513671875, 9.740234375, 10.3291015625, 10.91796875, 11.5068359375, 12.095703125, 12.6845703125, 13.2734375, 13.8623046875, 14.451171875, 15.0400390625, 15.62890625, 16.2177734375, 16.806640625, 17.3955078125, 17.984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 8.0, 8.0, 5.0, 8.0, 10.0, 19.0, 17.0, 18.0, 21.0, 19.0, 34.0, 49.0, 56.0, 55.0, 87.0, 93.0, 80.0, 67.0, 56.0, 51.0, 39.0, 26.0, 45.0, 20.0, 17.0, 8.0, 7.0, 7.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0009813308715820312, -0.0009532496333122253, -0.0009251683950424194, -0.0008970871567726135, -0.0008690059185028076, -0.0008409246802330017, -0.0008128434419631958, -0.0007847622036933899, -0.000756680965423584, -0.0007285997271537781, -0.0007005184888839722, -0.0006724372506141663, -0.0006443560123443604, -0.0006162747740745544, -0.0005881935358047485, -0.0005601122975349426, -0.0005320310592651367, -0.0005039498209953308, -0.0004758685827255249, -0.000447787344455719, -0.0004197061061859131, -0.0003916248679161072, -0.00036354362964630127, -0.00033546239137649536, -0.00030738115310668945, -0.00027929991483688354, -0.00025121867656707764, -0.00022313743829727173, -0.00019505620002746582, -0.0001669749617576599, -0.000138893723487854, -0.0001108124852180481, -8.273124694824219e-05, -5.465000867843628e-05, -2.656877040863037e-05, 1.5124678611755371e-06, 2.9593706130981445e-05, 5.7674944400787354e-05, 8.575618267059326e-05, 0.00011383742094039917, 0.00014191865921020508, 0.00016999989748001099, 0.0001980811357498169, 0.0002261623740196228, 0.0002542436122894287, 0.0002823248505592346, 0.00031040608882904053, 0.00033848732709884644, 0.00036656856536865234, 0.00039464980363845825, 0.00042273104190826416, 0.00045081228017807007, 0.000478893518447876, 0.0005069747567176819, 0.0005350559949874878, 0.0005631372332572937, 0.0005912184715270996, 0.0006192997097969055, 0.0006473809480667114, 0.0006754621863365173, 0.0007035434246063232, 0.0007316246628761292, 0.0007597059011459351, 0.000787787139415741, 0.0008158683776855469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 9.0, 12.0, 11.0, 15.0, 20.0, 24.0, 36.0, 63.0, 115.0, 201.0, 336.0, 595.0, 1147.0, 2180.0, 4291.0, 9007.0, 19823.0, 50064.0, 184376.0, 511050.0, 179172.0, 48586.0, 19533.0, 8955.0, 4227.0, 2139.0, 1154.0, 564.0, 354.0, 175.0, 104.0, 69.0, 37.0, 30.0, 15.0, 19.0, 9.0, 15.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.8701171875, -15.349609375, -14.8291015625, -14.30859375, -13.7880859375, -13.267578125, -12.7470703125, -12.2265625, -11.7060546875, -11.185546875, -10.6650390625, -10.14453125, -9.6240234375, -9.103515625, -8.5830078125, -8.0625, -7.5419921875, -7.021484375, -6.5009765625, -5.98046875, -5.4599609375, -4.939453125, -4.4189453125, -3.8984375, -3.3779296875, -2.857421875, -2.3369140625, -1.81640625, -1.2958984375, -0.775390625, -0.2548828125, 0.265625, 0.7861328125, 1.306640625, 1.8271484375, 2.34765625, 2.8681640625, 3.388671875, 3.9091796875, 4.4296875, 4.9501953125, 5.470703125, 5.9912109375, 6.51171875, 7.0322265625, 7.552734375, 8.0732421875, 8.59375, 9.1142578125, 9.634765625, 10.1552734375, 10.67578125, 11.1962890625, 11.716796875, 12.2373046875, 12.7578125, 13.2783203125, 13.798828125, 14.3193359375, 14.83984375, 15.3603515625, 15.880859375, 16.4013671875, 16.921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 12.0, 17.0, 25.0, 48.0, 82.0, 124.0, 163.0, 150.0, 116.0, 95.0, 64.0, 43.0, 19.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.81634521484375, -7.6170654296875, -7.41778564453125, -7.218505859375, -7.01922607421875, -6.8199462890625, -6.62066650390625, -6.42138671875, -6.22210693359375, -6.0228271484375, -5.82354736328125, -5.624267578125, -5.42498779296875, -5.2257080078125, -5.02642822265625, -4.8271484375, -4.62786865234375, -4.4285888671875, -4.22930908203125, -4.030029296875, -3.83074951171875, -3.6314697265625, -3.43218994140625, -3.23291015625, -3.03363037109375, -2.8343505859375, -2.63507080078125, -2.435791015625, -2.23651123046875, -2.0372314453125, -1.83795166015625, -1.638671875, -1.43939208984375, -1.2401123046875, -1.04083251953125, -0.841552734375, -0.64227294921875, -0.4429931640625, -0.24371337890625, -0.04443359375, 0.15484619140625, 0.3541259765625, 0.55340576171875, 0.752685546875, 0.95196533203125, 1.1512451171875, 1.35052490234375, 1.5498046875, 1.74908447265625, 1.9483642578125, 2.14764404296875, 2.346923828125, 2.54620361328125, 2.7454833984375, 2.94476318359375, 3.14404296875, 3.34332275390625, 3.5426025390625, 3.74188232421875, 3.941162109375, 4.14044189453125, 4.3397216796875, 4.53900146484375, 4.73828125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 10.0, 21.0, 15.0, 15.0, 21.0, 30.0, 30.0, 31.0, 29.0, 39.0, 44.0, 56.0, 37.0, 47.0, 41.0, 41.0, 60.0, 45.0, 41.0, 47.0, 41.0, 38.0, 37.0, 27.0, 32.0, 18.0, 21.0, 10.0, 15.0, 15.0, 10.0, 12.0, 6.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.02405548095703, -30.0318546295166, -29.039653778076172, -28.047454833984375, -27.055253982543945, -26.063053131103516, -25.07085418701172, -24.07865333557129, -23.08645248413086, -22.09425163269043, -21.10205078125, -20.109851837158203, -19.117650985717773, -18.125450134277344, -17.133251190185547, -16.141050338745117, -15.148849487304688, -14.156648635864258, -13.164448738098145, -12.172248840332031, -11.180047988891602, -10.187847137451172, -9.195647239685059, -8.203447341918945, -7.211246490478516, -6.219046115875244, -5.226845741271973, -4.234645366668701, -3.2424449920654297, -2.250244617462158, -1.2580442428588867, -0.26584386825561523, 0.7263565063476562, 1.7185568809509277, 2.710757255554199, 3.7029576301574707, 4.695158004760742, 5.687358379364014, 6.679558753967285, 7.671759128570557, 8.663959503173828, 9.656160354614258, 10.648360252380371, 11.640560150146484, 12.632761001586914, 13.624961853027344, 14.617161750793457, 15.60936164855957, 16.6015625, 17.59376335144043, 18.58596420288086, 19.578163146972656, 20.570363998413086, 21.562564849853516, 22.554763793945312, 23.546964645385742, 24.539165496826172, 25.5313663482666, 26.52356719970703, 27.515766143798828, 28.507966995239258, 29.500167846679688, 30.492366790771484, 31.484567642211914, 32.476768493652344]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 4.0, 11.0, 14.0, 13.0, 13.0, 16.0, 32.0, 18.0, 22.0, 22.0, 26.0, 29.0, 32.0, 45.0, 42.0, 43.0, 44.0, 31.0, 40.0, 39.0, 44.0, 44.0, 37.0, 29.0, 36.0, 46.0, 23.0, 33.0, 25.0, 18.0, 18.0, 14.0, 11.0, 15.0, 10.0, 9.0, 9.0, 5.0, 4.0, 8.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.05927276611328, -31.126136779785156, -30.193002700805664, -29.25986671447754, -28.326732635498047, -27.393596649169922, -26.460460662841797, -25.527326583862305, -24.594192504882812, -23.661056518554688, -22.727922439575195, -21.79478645324707, -20.861652374267578, -19.928516387939453, -18.995380401611328, -18.062246322631836, -17.12911033630371, -16.195974349975586, -15.262840270996094, -14.329704284667969, -13.396570205688477, -12.463434219360352, -11.530299186706543, -10.597164154052734, -9.664029121398926, -8.730894088745117, -7.797759056091309, -6.864623546600342, -5.931488513946533, -4.998353481292725, -4.065217971801758, -3.132082939147949, -2.1989479064941406, -1.2658127546310425, -0.33267760276794434, 0.6004576683044434, 1.533592700958252, 2.4667277336120605, 3.3998632431030273, 4.332998275756836, 5.2661333084106445, 6.199268341064453, 7.132403373718262, 8.06553840637207, 8.998674392700195, 9.931808471679688, 10.864944458007812, 11.798079490661621, 12.73121452331543, 13.664349555969238, 14.597484588623047, 15.530620574951172, 16.463754653930664, 17.39689064025879, 18.33002471923828, 19.263160705566406, 20.19629669189453, 21.129432678222656, 22.06256675720215, 22.995702743530273, 23.928836822509766, 24.86197280883789, 25.795108795166016, 26.728242874145508, 27.661376953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 19.0, 22.0, 35.0, 64.0, 86.0, 133.0, 211.0, 333.0, 494.0, 886.0, 1379.0, 2119.0, 3444.0, 5245.0, 7960.0, 11976.0, 17436.0, 25465.0, 35153.0, 47023.0, 60169.0, 73561.0, 85950.0, 94194.0, 96629.0, 94190.0, 86228.0, 74175.0, 61007.0, 47767.0, 35878.0, 25623.0, 18297.0, 12277.0, 8304.0, 5297.0, 3444.0, 2217.0, 1424.0, 900.0, 572.0, 359.0, 218.0, 154.0, 74.0, 67.0, 27.0, 23.0, 14.0, 13.0, 3.0, 2.0, 2.0, 2.0], "bins": [-19.40625, -18.84423828125, -18.2822265625, -17.72021484375, -17.158203125, -16.59619140625, -16.0341796875, -15.47216796875, -14.91015625, -14.34814453125, -13.7861328125, -13.22412109375, -12.662109375, -12.10009765625, -11.5380859375, -10.97607421875, -10.4140625, -9.85205078125, -9.2900390625, -8.72802734375, -8.166015625, -7.60400390625, -7.0419921875, -6.47998046875, -5.91796875, -5.35595703125, -4.7939453125, -4.23193359375, -3.669921875, -3.10791015625, -2.5458984375, -1.98388671875, -1.421875, -0.85986328125, -0.2978515625, 0.26416015625, 0.826171875, 1.38818359375, 1.9501953125, 2.51220703125, 3.07421875, 3.63623046875, 4.1982421875, 4.76025390625, 5.322265625, 5.88427734375, 6.4462890625, 7.00830078125, 7.5703125, 8.13232421875, 8.6943359375, 9.25634765625, 9.818359375, 10.38037109375, 10.9423828125, 11.50439453125, 12.06640625, 12.62841796875, 13.1904296875, 13.75244140625, 14.314453125, 14.87646484375, 15.4384765625, 16.00048828125, 16.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 6.0, 10.0, 15.0, 13.0, 12.0, 20.0, 30.0, 16.0, 25.0, 20.0, 26.0, 32.0, 32.0, 46.0, 37.0, 42.0, 43.0, 35.0, 41.0, 38.0, 39.0, 43.0, 43.0, 28.0, 38.0, 38.0, 27.0, 33.0, 23.0, 24.0, 18.0, 10.0, 15.0, 14.0, 9.0, 10.0, 8.0, 4.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.140625, -30.2333984375, -29.326171875, -28.4189453125, -27.51171875, -26.6044921875, -25.697265625, -24.7900390625, -23.8828125, -22.9755859375, -22.068359375, -21.1611328125, -20.25390625, -19.3466796875, -18.439453125, -17.5322265625, -16.625, -15.7177734375, -14.810546875, -13.9033203125, -12.99609375, -12.0888671875, -11.181640625, -10.2744140625, -9.3671875, -8.4599609375, -7.552734375, -6.6455078125, -5.73828125, -4.8310546875, -3.923828125, -3.0166015625, -2.109375, -1.2021484375, -0.294921875, 0.6123046875, 1.51953125, 2.4267578125, 3.333984375, 4.2412109375, 5.1484375, 6.0556640625, 6.962890625, 7.8701171875, 8.77734375, 9.6845703125, 10.591796875, 11.4990234375, 12.40625, 13.3134765625, 14.220703125, 15.1279296875, 16.03515625, 16.9423828125, 17.849609375, 18.7568359375, 19.6640625, 20.5712890625, 21.478515625, 22.3857421875, 23.29296875, 24.2001953125, 25.107421875, 26.0146484375, 26.921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 7.0, 9.0, 11.0, 34.0, 41.0, 85.0, 107.0, 175.0, 261.0, 464.0, 676.0, 1224.0, 1888.0, 3096.0, 5073.0, 8119.0, 12829.0, 19772.0, 29826.0, 43772.0, 60545.0, 80324.0, 97941.0, 110806.0, 114377.0, 109277.0, 95053.0, 76410.0, 57757.0, 40983.0, 27832.0, 18386.0, 11972.0, 7440.0, 4528.0, 2884.0, 1724.0, 1052.0, 677.0, 385.0, 262.0, 165.0, 103.0, 66.0, 45.0, 27.0, 24.0, 13.0, 7.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.798828125, -21.08203125, -20.365234375, -19.6484375, -18.931640625, -18.21484375, -17.498046875, -16.78125, -16.064453125, -15.34765625, -14.630859375, -13.9140625, -13.197265625, -12.48046875, -11.763671875, -11.046875, -10.330078125, -9.61328125, -8.896484375, -8.1796875, -7.462890625, -6.74609375, -6.029296875, -5.3125, -4.595703125, -3.87890625, -3.162109375, -2.4453125, -1.728515625, -1.01171875, -0.294921875, 0.421875, 1.138671875, 1.85546875, 2.572265625, 3.2890625, 4.005859375, 4.72265625, 5.439453125, 6.15625, 6.873046875, 7.58984375, 8.306640625, 9.0234375, 9.740234375, 10.45703125, 11.173828125, 11.890625, 12.607421875, 13.32421875, 14.041015625, 14.7578125, 15.474609375, 16.19140625, 16.908203125, 17.625, 18.341796875, 19.05859375, 19.775390625, 20.4921875, 21.208984375, 21.92578125, 22.642578125, 23.359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 1.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 14.0, 8.0, 15.0, 9.0, 19.0, 16.0, 23.0, 20.0, 29.0, 32.0, 31.0, 32.0, 31.0, 27.0, 35.0, 46.0, 42.0, 46.0, 34.0, 53.0, 33.0, 49.0, 41.0, 31.0, 29.0, 33.0, 32.0, 19.0, 20.0, 22.0, 19.0, 15.0, 7.0, 8.0, 8.0, 7.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-19.796875, -19.2080078125, -18.619140625, -18.0302734375, -17.44140625, -16.8525390625, -16.263671875, -15.6748046875, -15.0859375, -14.4970703125, -13.908203125, -13.3193359375, -12.73046875, -12.1416015625, -11.552734375, -10.9638671875, -10.375, -9.7861328125, -9.197265625, -8.6083984375, -8.01953125, -7.4306640625, -6.841796875, -6.2529296875, -5.6640625, -5.0751953125, -4.486328125, -3.8974609375, -3.30859375, -2.7197265625, -2.130859375, -1.5419921875, -0.953125, -0.3642578125, 0.224609375, 0.8134765625, 1.40234375, 1.9912109375, 2.580078125, 3.1689453125, 3.7578125, 4.3466796875, 4.935546875, 5.5244140625, 6.11328125, 6.7021484375, 7.291015625, 7.8798828125, 8.46875, 9.0576171875, 9.646484375, 10.2353515625, 10.82421875, 11.4130859375, 12.001953125, 12.5908203125, 13.1796875, 13.7685546875, 14.357421875, 14.9462890625, 15.53515625, 16.1240234375, 16.712890625, 17.3017578125, 17.890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 20.0, 28.0, 45.0, 55.0, 89.0, 131.0, 171.0, 269.0, 396.0, 655.0, 1007.0, 1557.0, 2368.0, 3517.0, 5201.0, 7879.0, 11564.0, 16819.0, 23806.0, 33451.0, 44492.0, 57865.0, 71588.0, 83015.0, 92657.0, 96831.0, 94337.0, 87673.0, 76162.0, 62197.0, 49281.0, 37058.0, 27111.0, 19159.0, 13198.0, 8956.0, 6118.0, 4121.0, 2633.0, 1749.0, 1173.0, 722.0, 499.0, 329.0, 190.0, 142.0, 95.0, 51.0, 52.0, 28.0, 9.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-6.125, -5.93756103515625, -5.7501220703125, -5.56268310546875, -5.375244140625, -5.18780517578125, -5.0003662109375, -4.81292724609375, -4.62548828125, -4.43804931640625, -4.2506103515625, -4.06317138671875, -3.875732421875, -3.68829345703125, -3.5008544921875, -3.31341552734375, -3.1259765625, -2.93853759765625, -2.7510986328125, -2.56365966796875, -2.376220703125, -2.18878173828125, -2.0013427734375, -1.81390380859375, -1.62646484375, -1.43902587890625, -1.2515869140625, -1.06414794921875, -0.876708984375, -0.68927001953125, -0.5018310546875, -0.31439208984375, -0.126953125, 0.06048583984375, 0.2479248046875, 0.43536376953125, 0.622802734375, 0.81024169921875, 0.9976806640625, 1.18511962890625, 1.37255859375, 1.55999755859375, 1.7474365234375, 1.93487548828125, 2.122314453125, 2.30975341796875, 2.4971923828125, 2.68463134765625, 2.8720703125, 3.05950927734375, 3.2469482421875, 3.43438720703125, 3.621826171875, 3.80926513671875, 3.9967041015625, 4.18414306640625, 4.37158203125, 4.55902099609375, 4.7464599609375, 4.93389892578125, 5.121337890625, 5.30877685546875, 5.4962158203125, 5.68365478515625, 5.87109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 6.0, 14.0, 5.0, 11.0, 14.0, 16.0, 23.0, 27.0, 27.0, 21.0, 30.0, 34.0, 42.0, 36.0, 44.0, 49.0, 42.0, 53.0, 50.0, 53.0, 36.0, 36.0, 36.0, 30.0, 31.0, 36.0, 31.0, 20.0, 21.0, 17.0, 14.0, 18.0, 12.0, 11.0, 9.0, 6.0, 7.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007643699645996094, -0.0007395818829536438, -0.0007147938013076782, -0.0006900057196617126, -0.0006652176380157471, -0.0006404295563697815, -0.0006156414747238159, -0.0005908533930778503, -0.0005660653114318848, -0.0005412772297859192, -0.0005164891481399536, -0.000491701066493988, -0.00046691298484802246, -0.0004421249032020569, -0.0004173368215560913, -0.00039254873991012573, -0.00036776065826416016, -0.0003429725766181946, -0.000318184494972229, -0.00029339641332626343, -0.00026860833168029785, -0.00024382025003433228, -0.0002190321683883667, -0.00019424408674240112, -0.00016945600509643555, -0.00014466792345046997, -0.0001198798418045044, -9.509176015853882e-05, -7.030367851257324e-05, -4.5515596866607666e-05, -2.072751522064209e-05, 4.060566425323486e-06, 2.8848648071289062e-05, 5.363672971725464e-05, 7.842481136322021e-05, 0.00010321289300918579, 0.00012800097465515137, 0.00015278905630111694, 0.00017757713794708252, 0.0002023652195930481, 0.00022715330123901367, 0.00025194138288497925, 0.0002767294645309448, 0.0003015175461769104, 0.000326305627822876, 0.00035109370946884155, 0.00037588179111480713, 0.0004006698727607727, 0.0004254579544067383, 0.00045024603605270386, 0.00047503411769866943, 0.000499822199344635, 0.0005246102809906006, 0.0005493983626365662, 0.0005741864442825317, 0.0005989745259284973, 0.0006237626075744629, 0.0006485506892204285, 0.000673338770866394, 0.0006981268525123596, 0.0007229149341583252, 0.0007477030158042908, 0.0007724910974502563, 0.0007972791790962219, 0.0008220672607421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 9.0, 19.0, 20.0, 31.0, 56.0, 87.0, 170.0, 242.0, 379.0, 656.0, 1043.0, 1690.0, 2578.0, 4326.0, 6763.0, 10494.0, 15962.0, 23950.0, 34718.0, 48289.0, 64183.0, 80696.0, 94946.0, 104122.0, 106168.0, 100359.0, 88745.0, 73026.0, 57045.0, 41802.0, 29389.0, 20129.0, 13182.0, 8662.0, 5481.0, 3406.0, 2198.0, 1299.0, 868.0, 515.0, 309.0, 209.0, 119.0, 86.0, 41.0, 28.0, 22.0, 12.0, 11.0, 4.0, 0.0, 4.0, 0.0, 2.0], "bins": [-6.8046875, -6.60614013671875, -6.4075927734375, -6.20904541015625, -6.010498046875, -5.81195068359375, -5.6134033203125, -5.41485595703125, -5.21630859375, -5.01776123046875, -4.8192138671875, -4.62066650390625, -4.422119140625, -4.22357177734375, -4.0250244140625, -3.82647705078125, -3.6279296875, -3.42938232421875, -3.2308349609375, -3.03228759765625, -2.833740234375, -2.63519287109375, -2.4366455078125, -2.23809814453125, -2.03955078125, -1.84100341796875, -1.6424560546875, -1.44390869140625, -1.245361328125, -1.04681396484375, -0.8482666015625, -0.64971923828125, -0.451171875, -0.25262451171875, -0.0540771484375, 0.14447021484375, 0.343017578125, 0.54156494140625, 0.7401123046875, 0.93865966796875, 1.13720703125, 1.33575439453125, 1.5343017578125, 1.73284912109375, 1.931396484375, 2.12994384765625, 2.3284912109375, 2.52703857421875, 2.7255859375, 2.92413330078125, 3.1226806640625, 3.32122802734375, 3.519775390625, 3.71832275390625, 3.9168701171875, 4.11541748046875, 4.31396484375, 4.51251220703125, 4.7110595703125, 4.90960693359375, 5.108154296875, 5.30670166015625, 5.5052490234375, 5.70379638671875, 5.90234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 7.0, 9.0, 14.0, 15.0, 22.0, 17.0, 13.0, 19.0, 19.0, 20.0, 26.0, 28.0, 36.0, 33.0, 45.0, 50.0, 41.0, 46.0, 65.0, 36.0, 46.0, 33.0, 38.0, 32.0, 29.0, 37.0, 25.0, 26.0, 11.0, 21.0, 20.0, 10.0, 15.0, 16.0, 16.0, 10.0, 12.0, 6.0, 2.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.6912841796875, -2.605224609375, -2.5191650390625, -2.43310546875, -2.3470458984375, -2.260986328125, -2.1749267578125, -2.0888671875, -2.0028076171875, -1.916748046875, -1.8306884765625, -1.74462890625, -1.6585693359375, -1.572509765625, -1.4864501953125, -1.400390625, -1.3143310546875, -1.228271484375, -1.1422119140625, -1.05615234375, -0.9700927734375, -0.884033203125, -0.7979736328125, -0.7119140625, -0.6258544921875, -0.539794921875, -0.4537353515625, -0.36767578125, -0.2816162109375, -0.195556640625, -0.1094970703125, -0.0234375, 0.0626220703125, 0.148681640625, 0.2347412109375, 0.32080078125, 0.4068603515625, 0.492919921875, 0.5789794921875, 0.6650390625, 0.7510986328125, 0.837158203125, 0.9232177734375, 1.00927734375, 1.0953369140625, 1.181396484375, 1.2674560546875, 1.353515625, 1.4395751953125, 1.525634765625, 1.6116943359375, 1.69775390625, 1.7838134765625, 1.869873046875, 1.9559326171875, 2.0419921875, 2.1280517578125, 2.214111328125, 2.3001708984375, 2.38623046875, 2.4722900390625, 2.558349609375, 2.6444091796875, 2.73046875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 6.0, 6.0, 8.0, 21.0, 27.0, 21.0, 26.0, 25.0, 31.0, 38.0, 26.0, 37.0, 40.0, 43.0, 53.0, 49.0, 48.0, 36.0, 53.0, 48.0, 50.0, 46.0, 40.0, 40.0, 30.0, 21.0, 22.0, 17.0, 19.0, 18.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.00973892211914, -33.00271987915039, -31.99570083618164, -30.98868179321289, -29.98166275024414, -28.97464370727539, -27.96762466430664, -26.96060562133789, -25.95358657836914, -24.94656753540039, -23.93954849243164, -22.93252944946289, -21.92551040649414, -20.91849136352539, -19.91147232055664, -18.90445327758789, -17.89743423461914, -16.89041519165039, -15.88339614868164, -14.87637710571289, -13.86935806274414, -12.86233901977539, -11.85531997680664, -10.84830093383789, -9.84128189086914, -8.83426284790039, -7.827243804931641, -6.820224761962891, -5.813205718994141, -4.806186676025391, -3.7991676330566406, -2.7921485900878906, -1.7851276397705078, -0.7781085968017578, 0.2289104461669922, 1.2359294891357422, 2.242948532104492, 3.249967575073242, 4.256986618041992, 5.264005661010742, 6.271024703979492, 7.278043746948242, 8.285062789916992, 9.292081832885742, 10.299100875854492, 11.306119918823242, 12.313138961791992, 13.320158004760742, 14.327177047729492, 15.334196090698242, 16.341215133666992, 17.348234176635742, 18.355253219604492, 19.362272262573242, 20.369291305541992, 21.376310348510742, 22.383329391479492, 23.390348434448242, 24.397367477416992, 25.404386520385742, 26.411405563354492, 27.418424606323242, 28.425443649291992, 29.432462692260742, 30.439481735229492]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 3.0, 12.0, 5.0, 15.0, 15.0, 13.0, 19.0, 20.0, 27.0, 27.0, 29.0, 26.0, 36.0, 38.0, 38.0, 44.0, 47.0, 36.0, 49.0, 41.0, 49.0, 51.0, 42.0, 38.0, 38.0, 31.0, 33.0, 25.0, 27.0, 18.0, 15.0, 14.0, 15.0, 12.0, 16.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.078758239746094, -33.99924087524414, -32.91972351074219, -31.84020233154297, -30.760684967041016, -29.681167602539062, -28.601648330688477, -27.52212905883789, -26.442611694335938, -25.363094329833984, -24.2835750579834, -23.204055786132812, -22.12453842163086, -21.045021057128906, -19.96550178527832, -18.885982513427734, -17.80646514892578, -16.726947784423828, -15.647428512573242, -14.567910194396973, -13.488391876220703, -12.408873558044434, -11.329355239868164, -10.249836921691895, -9.170318603515625, -8.090800285339355, -7.011281967163086, -5.931763648986816, -4.852245330810547, -3.7727270126342773, -2.693208694458008, -1.6136903762817383, -0.5341758728027344, 0.5453424453735352, 1.6248607635498047, 2.704379081726074, 3.7838973999023438, 4.863415718078613, 5.942934036254883, 7.022452354431152, 8.101970672607422, 9.181488990783691, 10.261007308959961, 11.34052562713623, 12.4200439453125, 13.49956226348877, 14.579080581665039, 15.658598899841309, 16.738117218017578, 17.81763458251953, 18.897153854370117, 19.976673126220703, 21.056190490722656, 22.13570785522461, 23.215227127075195, 24.29474639892578, 25.374263763427734, 26.453781127929688, 27.533300399780273, 28.61281967163086, 29.692337036132812, 30.771854400634766, 31.85137367248535, 32.93089294433594, 34.01041030883789]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 6.0, 9.0, 13.0, 32.0, 54.0, 60.0, 110.0, 174.0, 307.0, 497.0, 725.0, 1202.0, 1936.0, 3138.0, 4779.0, 7441.0, 11435.0, 17490.0, 27008.0, 40591.0, 60231.0, 88018.0, 125173.0, 172733.0, 229529.0, 291424.0, 348141.0, 393263.0, 412416.0, 403051.0, 365763.0, 310372.0, 248143.0, 189923.0, 139491.0, 98387.0, 68084.0, 46121.0, 30528.0, 20287.0, 13202.0, 8476.0, 5397.0, 3470.0, 2126.0, 1303.0, 852.0, 517.0, 337.0, 201.0, 119.0, 82.0, 47.0, 31.0, 16.0, 15.0, 3.0, 5.0, 1.0, 4.0, 3.0], "bins": [-18.6875, -18.09716796875, -17.5068359375, -16.91650390625, -16.326171875, -15.73583984375, -15.1455078125, -14.55517578125, -13.96484375, -13.37451171875, -12.7841796875, -12.19384765625, -11.603515625, -11.01318359375, -10.4228515625, -9.83251953125, -9.2421875, -8.65185546875, -8.0615234375, -7.47119140625, -6.880859375, -6.29052734375, -5.7001953125, -5.10986328125, -4.51953125, -3.92919921875, -3.3388671875, -2.74853515625, -2.158203125, -1.56787109375, -0.9775390625, -0.38720703125, 0.203125, 0.79345703125, 1.3837890625, 1.97412109375, 2.564453125, 3.15478515625, 3.7451171875, 4.33544921875, 4.92578125, 5.51611328125, 6.1064453125, 6.69677734375, 7.287109375, 7.87744140625, 8.4677734375, 9.05810546875, 9.6484375, 10.23876953125, 10.8291015625, 11.41943359375, 12.009765625, 12.60009765625, 13.1904296875, 13.78076171875, 14.37109375, 14.96142578125, 15.5517578125, 16.14208984375, 16.732421875, 17.32275390625, 17.9130859375, 18.50341796875, 19.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 8.0, 2.0, 11.0, 7.0, 14.0, 16.0, 14.0, 17.0, 19.0, 26.0, 29.0, 26.0, 30.0, 32.0, 40.0, 35.0, 48.0, 38.0, 46.0, 40.0, 43.0, 50.0, 57.0, 37.0, 33.0, 40.0, 35.0, 33.0, 29.0, 29.0, 13.0, 16.0, 17.0, 12.0, 15.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.96875, -28.0791015625, -27.189453125, -26.2998046875, -25.41015625, -24.5205078125, -23.630859375, -22.7412109375, -21.8515625, -20.9619140625, -20.072265625, -19.1826171875, -18.29296875, -17.4033203125, -16.513671875, -15.6240234375, -14.734375, -13.8447265625, -12.955078125, -12.0654296875, -11.17578125, -10.2861328125, -9.396484375, -8.5068359375, -7.6171875, -6.7275390625, -5.837890625, -4.9482421875, -4.05859375, -3.1689453125, -2.279296875, -1.3896484375, -0.5, 0.3896484375, 1.279296875, 2.1689453125, 3.05859375, 3.9482421875, 4.837890625, 5.7275390625, 6.6171875, 7.5068359375, 8.396484375, 9.2861328125, 10.17578125, 11.0654296875, 11.955078125, 12.8447265625, 13.734375, 14.6240234375, 15.513671875, 16.4033203125, 17.29296875, 18.1826171875, 19.072265625, 19.9619140625, 20.8515625, 21.7412109375, 22.630859375, 23.5205078125, 24.41015625, 25.2998046875, 26.189453125, 27.0791015625, 27.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 12.0, 11.0, 20.0, 38.0, 59.0, 106.0, 187.0, 284.0, 441.0, 785.0, 1274.0, 2100.0, 3513.0, 5644.0, 9132.0, 14367.0, 22137.0, 33526.0, 50264.0, 73135.0, 103312.0, 140963.0, 184990.0, 234650.0, 283578.0, 328631.0, 358362.0, 371410.0, 364286.0, 339574.0, 299538.0, 250954.0, 201603.0, 154409.0, 113955.0, 81890.0, 57109.0, 38622.0, 25347.0, 16558.0, 10502.0, 6654.0, 4069.0, 2478.0, 1467.0, 912.0, 576.0, 333.0, 200.0, 135.0, 70.0, 51.0, 27.0, 22.0, 7.0, 3.0, 4.0, 0.0, 3.0], "bins": [-18.890625, -18.312255859375, -17.73388671875, -17.155517578125, -16.5771484375, -15.998779296875, -15.42041015625, -14.842041015625, -14.263671875, -13.685302734375, -13.10693359375, -12.528564453125, -11.9501953125, -11.371826171875, -10.79345703125, -10.215087890625, -9.63671875, -9.058349609375, -8.47998046875, -7.901611328125, -7.3232421875, -6.744873046875, -6.16650390625, -5.588134765625, -5.009765625, -4.431396484375, -3.85302734375, -3.274658203125, -2.6962890625, -2.117919921875, -1.53955078125, -0.961181640625, -0.3828125, 0.195556640625, 0.77392578125, 1.352294921875, 1.9306640625, 2.509033203125, 3.08740234375, 3.665771484375, 4.244140625, 4.822509765625, 5.40087890625, 5.979248046875, 6.5576171875, 7.135986328125, 7.71435546875, 8.292724609375, 8.87109375, 9.449462890625, 10.02783203125, 10.606201171875, 11.1845703125, 11.762939453125, 12.34130859375, 12.919677734375, 13.498046875, 14.076416015625, 14.65478515625, 15.233154296875, 15.8115234375, 16.389892578125, 16.96826171875, 17.546630859375, 18.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 11.0, 8.0, 12.0, 15.0, 20.0, 27.0, 30.0, 47.0, 52.0, 71.0, 65.0, 85.0, 95.0, 103.0, 122.0, 139.0, 162.0, 170.0, 183.0, 188.0, 189.0, 186.0, 203.0, 222.0, 201.0, 174.0, 169.0, 162.0, 127.0, 129.0, 118.0, 95.0, 86.0, 70.0, 75.0, 49.0, 44.0, 40.0, 20.0, 25.0, 17.0, 14.0, 11.0, 4.0, 7.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.21875, -10.8544921875, -10.490234375, -10.1259765625, -9.76171875, -9.3974609375, -9.033203125, -8.6689453125, -8.3046875, -7.9404296875, -7.576171875, -7.2119140625, -6.84765625, -6.4833984375, -6.119140625, -5.7548828125, -5.390625, -5.0263671875, -4.662109375, -4.2978515625, -3.93359375, -3.5693359375, -3.205078125, -2.8408203125, -2.4765625, -2.1123046875, -1.748046875, -1.3837890625, -1.01953125, -0.6552734375, -0.291015625, 0.0732421875, 0.4375, 0.8017578125, 1.166015625, 1.5302734375, 1.89453125, 2.2587890625, 2.623046875, 2.9873046875, 3.3515625, 3.7158203125, 4.080078125, 4.4443359375, 4.80859375, 5.1728515625, 5.537109375, 5.9013671875, 6.265625, 6.6298828125, 6.994140625, 7.3583984375, 7.72265625, 8.0869140625, 8.451171875, 8.8154296875, 9.1796875, 9.5439453125, 9.908203125, 10.2724609375, 10.63671875, 11.0009765625, 11.365234375, 11.7294921875, 12.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 9.0, 11.0, 10.0, 9.0, 14.0, 21.0, 21.0, 33.0, 22.0, 28.0, 20.0, 42.0, 36.0, 35.0, 45.0, 49.0, 45.0, 53.0, 52.0, 45.0, 51.0, 33.0, 46.0, 45.0, 33.0, 31.0, 35.0, 13.0, 20.0, 13.0, 19.0, 14.0, 13.0, 6.0, 7.0, 3.0, 2.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.720937728881836, -26.782974243164062, -25.845012664794922, -24.90704917907715, -23.969085693359375, -23.031124114990234, -22.09316062927246, -21.155197143554688, -20.217235565185547, -19.279272079467773, -18.341310501098633, -17.40334701538086, -16.465383529663086, -15.527420997619629, -14.589458465576172, -13.651494979858398, -12.713531494140625, -11.775568962097168, -10.837605476379395, -9.899642944335938, -8.961679458618164, -8.023716926574707, -7.08575439453125, -6.147791385650635, -5.2098283767700195, -4.271865367889404, -3.333902597427368, -2.395939826965332, -1.4579768180847168, -0.5200138092041016, 0.41794872283935547, 1.3559117317199707, 2.293872833251953, 3.2318358421325684, 4.169798851013184, 5.107761383056641, 6.045724391937256, 6.983687400817871, 7.921649932861328, 8.859613418579102, 9.797575950622559, 10.735538482666016, 11.673501968383789, 12.611464500427246, 13.549427032470703, 14.487390518188477, 15.425353050231934, 16.36331558227539, 17.301279067993164, 18.239242553710938, 19.177204132080078, 20.11516761779785, 21.053131103515625, 21.991092681884766, 22.92905616760254, 23.867019653320312, 24.804981231689453, 25.742944717407227, 26.680906295776367, 27.61886978149414, 28.556833267211914, 29.494796752929688, 30.432758331298828, 31.3707218170166, 32.308685302734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 6.0, 12.0, 20.0, 14.0, 16.0, 21.0, 18.0, 23.0, 21.0, 25.0, 18.0, 36.0, 50.0, 35.0, 37.0, 39.0, 40.0, 35.0, 50.0, 60.0, 45.0, 40.0, 39.0, 30.0, 29.0, 35.0, 33.0, 28.0, 23.0, 15.0, 15.0, 16.0, 18.0, 9.0, 9.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.87775802612305, -34.811649322509766, -33.74553680419922, -32.67942810058594, -31.613317489624023, -30.54720687866211, -29.481098175048828, -28.414987564086914, -27.348876953125, -26.282766342163086, -25.216655731201172, -24.15054702758789, -23.084436416625977, -22.018325805664062, -20.95221710205078, -19.886106491088867, -18.819995880126953, -17.75388526916504, -16.687774658203125, -15.621665954589844, -14.55555534362793, -13.489444732666016, -12.423335075378418, -11.35722541809082, -10.291114807128906, -9.225004196166992, -8.158894538879395, -7.092784404754639, -6.026674270629883, -4.960564136505127, -3.894454002380371, -2.8283438682556152, -1.762237548828125, -0.6961274147033691, 0.3699827194213867, 1.4360928535461426, 2.5022029876708984, 3.5683131217956543, 4.63442325592041, 5.700533390045166, 6.766643524169922, 7.832753658294678, 8.898863792419434, 9.964973449707031, 11.031084060668945, 12.09719467163086, 13.163304328918457, 14.229413986206055, 15.295524597167969, 16.361635208129883, 17.427745819091797, 18.493854522705078, 19.559965133666992, 20.626075744628906, 21.692184448242188, 22.7582950592041, 23.824405670166016, 24.89051628112793, 25.956626892089844, 27.022735595703125, 28.08884620666504, 29.154956817626953, 30.221065521240234, 31.28717613220215, 32.35328674316406]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 18.0, 23.0, 29.0, 49.0, 71.0, 117.0, 130.0, 152.0, 247.0, 345.0, 485.0, 743.0, 1067.0, 1503.0, 2293.0, 3380.0, 5297.0, 8345.0, 13388.0, 22767.0, 40809.0, 73486.0, 134892.0, 218203.0, 216293.0, 133081.0, 72052.0, 39352.0, 22818.0, 13222.0, 8186.0, 5216.0, 3399.0, 2174.0, 1507.0, 1023.0, 700.0, 489.0, 347.0, 230.0, 206.0, 125.0, 86.0, 61.0, 60.0, 31.0, 15.0, 17.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.71875, -15.227294921875, -14.73583984375, -14.244384765625, -13.7529296875, -13.261474609375, -12.77001953125, -12.278564453125, -11.787109375, -11.295654296875, -10.80419921875, -10.312744140625, -9.8212890625, -9.329833984375, -8.83837890625, -8.346923828125, -7.85546875, -7.364013671875, -6.87255859375, -6.381103515625, -5.8896484375, -5.398193359375, -4.90673828125, -4.415283203125, -3.923828125, -3.432373046875, -2.94091796875, -2.449462890625, -1.9580078125, -1.466552734375, -0.97509765625, -0.483642578125, 0.0078125, 0.499267578125, 0.99072265625, 1.482177734375, 1.9736328125, 2.465087890625, 2.95654296875, 3.447998046875, 3.939453125, 4.430908203125, 4.92236328125, 5.413818359375, 5.9052734375, 6.396728515625, 6.88818359375, 7.379638671875, 7.87109375, 8.362548828125, 8.85400390625, 9.345458984375, 9.8369140625, 10.328369140625, 10.81982421875, 11.311279296875, 11.802734375, 12.294189453125, 12.78564453125, 13.277099609375, 13.7685546875, 14.260009765625, 14.75146484375, 15.242919921875, 15.734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 3.0, 5.0, 9.0, 13.0, 16.0, 13.0, 19.0, 20.0, 18.0, 25.0, 19.0, 26.0, 17.0, 38.0, 48.0, 37.0, 33.0, 44.0, 38.0, 33.0, 49.0, 64.0, 42.0, 41.0, 39.0, 28.0, 34.0, 33.0, 29.0, 32.0, 23.0, 13.0, 18.0, 16.0, 16.0, 9.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.90625, -34.84375, -33.78125, -32.71875, -31.65625, -30.59375, -29.53125, -28.46875, -27.40625, -26.34375, -25.28125, -24.21875, -23.15625, -22.09375, -21.03125, -19.96875, -18.90625, -17.84375, -16.78125, -15.71875, -14.65625, -13.59375, -12.53125, -11.46875, -10.40625, -9.34375, -8.28125, -7.21875, -6.15625, -5.09375, -4.03125, -2.96875, -1.90625, -0.84375, 0.21875, 1.28125, 2.34375, 3.40625, 4.46875, 5.53125, 6.59375, 7.65625, 8.71875, 9.78125, 10.84375, 11.90625, 12.96875, 14.03125, 15.09375, 16.15625, 17.21875, 18.28125, 19.34375, 20.40625, 21.46875, 22.53125, 23.59375, 24.65625, 25.71875, 26.78125, 27.84375, 28.90625, 29.96875, 31.03125, 32.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 10.0, 17.0, 21.0, 36.0, 48.0, 63.0, 94.0, 88.0, 155.0, 210.0, 267.0, 410.0, 566.0, 925.0, 1494.0, 2458.0, 4293.0, 7998.0, 16067.0, 37714.0, 109062.0, 357736.0, 337165.0, 101517.0, 35869.0, 15605.0, 7679.0, 4109.0, 2366.0, 1459.0, 899.0, 632.0, 422.0, 319.0, 233.0, 155.0, 104.0, 86.0, 57.0, 44.0, 25.0, 26.0, 13.0, 10.0, 5.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.65625, -19.06005859375, -18.4638671875, -17.86767578125, -17.271484375, -16.67529296875, -16.0791015625, -15.48291015625, -14.88671875, -14.29052734375, -13.6943359375, -13.09814453125, -12.501953125, -11.90576171875, -11.3095703125, -10.71337890625, -10.1171875, -9.52099609375, -8.9248046875, -8.32861328125, -7.732421875, -7.13623046875, -6.5400390625, -5.94384765625, -5.34765625, -4.75146484375, -4.1552734375, -3.55908203125, -2.962890625, -2.36669921875, -1.7705078125, -1.17431640625, -0.578125, 0.01806640625, 0.6142578125, 1.21044921875, 1.806640625, 2.40283203125, 2.9990234375, 3.59521484375, 4.19140625, 4.78759765625, 5.3837890625, 5.97998046875, 6.576171875, 7.17236328125, 7.7685546875, 8.36474609375, 8.9609375, 9.55712890625, 10.1533203125, 10.74951171875, 11.345703125, 11.94189453125, 12.5380859375, 13.13427734375, 13.73046875, 14.32666015625, 14.9228515625, 15.51904296875, 16.115234375, 16.71142578125, 17.3076171875, 17.90380859375, 18.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 10.0, 17.0, 19.0, 11.0, 15.0, 22.0, 22.0, 28.0, 26.0, 30.0, 36.0, 30.0, 39.0, 31.0, 27.0, 45.0, 56.0, 44.0, 36.0, 33.0, 33.0, 28.0, 44.0, 33.0, 27.0, 25.0, 25.0, 18.0, 24.0, 22.0, 22.0, 15.0, 14.0, 10.0, 9.0, 9.0, 5.0, 4.0, 3.0, 7.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-21.109375, -20.427001953125, -19.74462890625, -19.062255859375, -18.3798828125, -17.697509765625, -17.01513671875, -16.332763671875, -15.650390625, -14.968017578125, -14.28564453125, -13.603271484375, -12.9208984375, -12.238525390625, -11.55615234375, -10.873779296875, -10.19140625, -9.509033203125, -8.82666015625, -8.144287109375, -7.4619140625, -6.779541015625, -6.09716796875, -5.414794921875, -4.732421875, -4.050048828125, -3.36767578125, -2.685302734375, -2.0029296875, -1.320556640625, -0.63818359375, 0.044189453125, 0.7265625, 1.408935546875, 2.09130859375, 2.773681640625, 3.4560546875, 4.138427734375, 4.82080078125, 5.503173828125, 6.185546875, 6.867919921875, 7.55029296875, 8.232666015625, 8.9150390625, 9.597412109375, 10.27978515625, 10.962158203125, 11.64453125, 12.326904296875, 13.00927734375, 13.691650390625, 14.3740234375, 15.056396484375, 15.73876953125, 16.421142578125, 17.103515625, 17.785888671875, 18.46826171875, 19.150634765625, 19.8330078125, 20.515380859375, 21.19775390625, 21.880126953125, 22.5625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 11.0, 13.0, 9.0, 29.0, 37.0, 58.0, 92.0, 125.0, 181.0, 328.0, 555.0, 1099.0, 2369.0, 5645.0, 17061.0, 81225.0, 774723.0, 129503.0, 22472.0, 7021.0, 2911.0, 1395.0, 710.0, 359.0, 196.0, 124.0, 91.0, 56.0, 39.0, 31.0, 14.0, 12.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.34375, -26.420166015625, -25.49658203125, -24.572998046875, -23.6494140625, -22.725830078125, -21.80224609375, -20.878662109375, -19.955078125, -19.031494140625, -18.10791015625, -17.184326171875, -16.2607421875, -15.337158203125, -14.41357421875, -13.489990234375, -12.56640625, -11.642822265625, -10.71923828125, -9.795654296875, -8.8720703125, -7.948486328125, -7.02490234375, -6.101318359375, -5.177734375, -4.254150390625, -3.33056640625, -2.406982421875, -1.4833984375, -0.559814453125, 0.36376953125, 1.287353515625, 2.2109375, 3.134521484375, 4.05810546875, 4.981689453125, 5.9052734375, 6.828857421875, 7.75244140625, 8.676025390625, 9.599609375, 10.523193359375, 11.44677734375, 12.370361328125, 13.2939453125, 14.217529296875, 15.14111328125, 16.064697265625, 16.98828125, 17.911865234375, 18.83544921875, 19.759033203125, 20.6826171875, 21.606201171875, 22.52978515625, 23.453369140625, 24.376953125, 25.300537109375, 26.22412109375, 27.147705078125, 28.0712890625, 28.994873046875, 29.91845703125, 30.842041015625, 31.765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 2.0, 7.0, 3.0, 8.0, 10.0, 19.0, 13.0, 20.0, 21.0, 37.0, 44.0, 84.0, 89.0, 114.0, 106.0, 79.0, 78.0, 54.0, 31.0, 32.0, 27.0, 16.0, 7.0, 9.0, 14.0, 13.0, 12.0, 8.0, 4.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014438629150390625, -0.0013903379440307617, -0.001336812973022461, -0.0012832880020141602, -0.0012297630310058594, -0.0011762380599975586, -0.0011227130889892578, -0.001069188117980957, -0.0010156631469726562, -0.0009621381759643555, -0.0009086132049560547, -0.0008550882339477539, -0.0008015632629394531, -0.0007480382919311523, -0.0006945133209228516, -0.0006409883499145508, -0.00058746337890625, -0.0005339384078979492, -0.00048041343688964844, -0.00042688846588134766, -0.0003733634948730469, -0.0003198385238647461, -0.0002663135528564453, -0.00021278858184814453, -0.00015926361083984375, -0.00010573863983154297, -5.221366882324219e-05, 1.3113021850585938e-06, 5.4836273193359375e-05, 0.00010836124420166016, 0.00016188621520996094, 0.00021541118621826172, 0.0002689361572265625, 0.0003224611282348633, 0.00037598609924316406, 0.00042951107025146484, 0.0004830360412597656, 0.0005365610122680664, 0.0005900859832763672, 0.000643610954284668, 0.0006971359252929688, 0.0007506608963012695, 0.0008041858673095703, 0.0008577108383178711, 0.0009112358093261719, 0.0009647607803344727, 0.0010182857513427734, 0.0010718107223510742, 0.001125335693359375, 0.0011788606643676758, 0.0012323856353759766, 0.0012859106063842773, 0.0013394355773925781, 0.001392960548400879, 0.0014464855194091797, 0.0015000104904174805, 0.0015535354614257812, 0.001607060432434082, 0.0016605854034423828, 0.0017141103744506836, 0.0017676353454589844, 0.0018211603164672852, 0.001874685287475586, 0.0019282102584838867, 0.0019817352294921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 8.0, 12.0, 14.0, 14.0, 14.0, 31.0, 36.0, 52.0, 74.0, 97.0, 144.0, 202.0, 258.0, 384.0, 583.0, 836.0, 1296.0, 1825.0, 2645.0, 4300.0, 6866.0, 11932.0, 21765.0, 45192.0, 111620.0, 307512.0, 314733.0, 115521.0, 45858.0, 22455.0, 12209.0, 7032.0, 4282.0, 2744.0, 1879.0, 1218.0, 855.0, 586.0, 422.0, 306.0, 181.0, 169.0, 102.0, 76.0, 60.0, 43.0, 38.0, 16.0, 12.0, 13.0, 2.0, 8.0, 5.0, 4.0, 0.0, 2.0], "bins": [-16.28125, -15.8026123046875, -15.323974609375, -14.8453369140625, -14.36669921875, -13.8880615234375, -13.409423828125, -12.9307861328125, -12.4521484375, -11.9735107421875, -11.494873046875, -11.0162353515625, -10.53759765625, -10.0589599609375, -9.580322265625, -9.1016845703125, -8.623046875, -8.1444091796875, -7.665771484375, -7.1871337890625, -6.70849609375, -6.2298583984375, -5.751220703125, -5.2725830078125, -4.7939453125, -4.3153076171875, -3.836669921875, -3.3580322265625, -2.87939453125, -2.4007568359375, -1.922119140625, -1.4434814453125, -0.96484375, -0.4862060546875, -0.007568359375, 0.4710693359375, 0.94970703125, 1.4283447265625, 1.906982421875, 2.3856201171875, 2.8642578125, 3.3428955078125, 3.821533203125, 4.3001708984375, 4.77880859375, 5.2574462890625, 5.736083984375, 6.2147216796875, 6.693359375, 7.1719970703125, 7.650634765625, 8.1292724609375, 8.60791015625, 9.0865478515625, 9.565185546875, 10.0438232421875, 10.5224609375, 11.0010986328125, 11.479736328125, 11.9583740234375, 12.43701171875, 12.9156494140625, 13.394287109375, 13.8729248046875, 14.3515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 8.0, 5.0, 13.0, 8.0, 11.0, 17.0, 44.0, 39.0, 84.0, 94.0, 116.0, 117.0, 115.0, 104.0, 60.0, 44.0, 38.0, 25.0, 17.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.82904052734375, -4.6151123046875, -4.40118408203125, -4.187255859375, -3.97332763671875, -3.7593994140625, -3.54547119140625, -3.33154296875, -3.11761474609375, -2.9036865234375, -2.68975830078125, -2.475830078125, -2.26190185546875, -2.0479736328125, -1.83404541015625, -1.6201171875, -1.40618896484375, -1.1922607421875, -0.97833251953125, -0.764404296875, -0.55047607421875, -0.3365478515625, -0.12261962890625, 0.09130859375, 0.30523681640625, 0.5191650390625, 0.73309326171875, 0.947021484375, 1.16094970703125, 1.3748779296875, 1.58880615234375, 1.802734375, 2.01666259765625, 2.2305908203125, 2.44451904296875, 2.658447265625, 2.87237548828125, 3.0863037109375, 3.30023193359375, 3.51416015625, 3.72808837890625, 3.9420166015625, 4.15594482421875, 4.369873046875, 4.58380126953125, 4.7977294921875, 5.01165771484375, 5.2255859375, 5.43951416015625, 5.6534423828125, 5.86737060546875, 6.081298828125, 6.29522705078125, 6.5091552734375, 6.72308349609375, 6.93701171875, 7.15093994140625, 7.3648681640625, 7.57879638671875, 7.792724609375, 8.00665283203125, 8.2205810546875, 8.43450927734375, 8.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 3.0, 9.0, 7.0, 16.0, 10.0, 19.0, 19.0, 18.0, 26.0, 28.0, 29.0, 29.0, 33.0, 32.0, 39.0, 46.0, 51.0, 51.0, 51.0, 48.0, 36.0, 51.0, 44.0, 48.0, 44.0, 28.0, 30.0, 21.0, 14.0, 23.0, 19.0, 10.0, 13.0, 15.0, 2.0, 12.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.0669002532959, -25.13973617553711, -24.21257209777832, -23.28540802001953, -22.358243942260742, -21.431079864501953, -20.503915786743164, -19.576751708984375, -18.649587631225586, -17.722423553466797, -16.795259475708008, -15.868095397949219, -14.94093132019043, -14.01376724243164, -13.086603164672852, -12.159439086914062, -11.232275009155273, -10.305110931396484, -9.377946853637695, -8.450782775878906, -7.523618698120117, -6.596454620361328, -5.669290542602539, -4.74212646484375, -3.814962387084961, -2.887798309326172, -1.9606342315673828, -1.0334701538085938, -0.10630607604980469, 0.8208580017089844, 1.7480220794677734, 2.6751861572265625, 3.6023483276367188, 4.529512405395508, 5.456676483154297, 6.383840560913086, 7.311004638671875, 8.238168716430664, 9.165332794189453, 10.092496871948242, 11.019660949707031, 11.94682502746582, 12.87398910522461, 13.801153182983398, 14.728317260742188, 15.655481338500977, 16.582645416259766, 17.509809494018555, 18.436973571777344, 19.364137649536133, 20.291301727294922, 21.21846580505371, 22.1456298828125, 23.07279396057129, 23.999958038330078, 24.927122116088867, 25.854286193847656, 26.781450271606445, 27.708614349365234, 28.635778427124023, 29.562942504882812, 30.4901065826416, 31.41727066040039, 32.34443664550781, 33.27159881591797]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 3.0, 10.0, 16.0, 17.0, 18.0, 15.0, 16.0, 25.0, 21.0, 19.0, 31.0, 21.0, 37.0, 48.0, 40.0, 40.0, 39.0, 32.0, 35.0, 54.0, 58.0, 41.0, 39.0, 39.0, 39.0, 22.0, 32.0, 31.0, 21.0, 22.0, 19.0, 13.0, 17.0, 15.0, 9.0, 10.0, 4.0, 5.0, 10.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.96949005126953, -34.92582321166992, -33.88215637207031, -32.8384895324707, -31.794822692871094, -30.751155853271484, -29.707489013671875, -28.663822174072266, -27.620155334472656, -26.576488494873047, -25.532821655273438, -24.489154815673828, -23.44548797607422, -22.40182113647461, -21.358154296875, -20.31448745727539, -19.27082061767578, -18.227153778076172, -17.183486938476562, -16.139820098876953, -15.096153259277344, -14.052486419677734, -13.008819580078125, -11.965152740478516, -10.921485900878906, -9.877819061279297, -8.834152221679688, -7.790485382080078, -6.746818542480469, -5.703151702880859, -4.65948486328125, -3.6158180236816406, -2.572154998779297, -1.5284881591796875, -0.4848213195800781, 0.5588455200195312, 1.6025123596191406, 2.64617919921875, 3.6898460388183594, 4.733512878417969, 5.777179718017578, 6.8208465576171875, 7.864513397216797, 8.908180236816406, 9.951847076416016, 10.995513916015625, 12.039180755615234, 13.082847595214844, 14.126514434814453, 15.170181274414062, 16.213848114013672, 17.25751495361328, 18.30118179321289, 19.3448486328125, 20.38851547241211, 21.43218231201172, 22.475849151611328, 23.519515991210938, 24.563182830810547, 25.606849670410156, 26.650516510009766, 27.694183349609375, 28.737850189208984, 29.781517028808594, 30.825183868408203]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 16.0, 9.0, 32.0, 36.0, 84.0, 125.0, 213.0, 360.0, 547.0, 822.0, 1378.0, 2191.0, 3355.0, 5320.0, 8102.0, 12024.0, 18077.0, 25895.0, 35914.0, 48836.0, 62687.0, 77572.0, 89858.0, 98392.0, 99691.0, 95926.0, 85968.0, 72783.0, 57897.0, 43957.0, 32266.0, 22760.0, 15821.0, 10293.0, 7033.0, 4512.0, 2895.0, 1787.0, 1176.0, 712.0, 482.0, 302.0, 176.0, 122.0, 68.0, 40.0, 21.0, 11.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.515625, -17.905029296875, -17.29443359375, -16.683837890625, -16.0732421875, -15.462646484375, -14.85205078125, -14.241455078125, -13.630859375, -13.020263671875, -12.40966796875, -11.799072265625, -11.1884765625, -10.577880859375, -9.96728515625, -9.356689453125, -8.74609375, -8.135498046875, -7.52490234375, -6.914306640625, -6.3037109375, -5.693115234375, -5.08251953125, -4.471923828125, -3.861328125, -3.250732421875, -2.64013671875, -2.029541015625, -1.4189453125, -0.808349609375, -0.19775390625, 0.412841796875, 1.0234375, 1.634033203125, 2.24462890625, 2.855224609375, 3.4658203125, 4.076416015625, 4.68701171875, 5.297607421875, 5.908203125, 6.518798828125, 7.12939453125, 7.739990234375, 8.3505859375, 8.961181640625, 9.57177734375, 10.182373046875, 10.79296875, 11.403564453125, 12.01416015625, 12.624755859375, 13.2353515625, 13.845947265625, 14.45654296875, 15.067138671875, 15.677734375, 16.288330078125, 16.89892578125, 17.509521484375, 18.1201171875, 18.730712890625, 19.34130859375, 19.951904296875, 20.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 11.0, 17.0, 18.0, 15.0, 15.0, 16.0, 27.0, 20.0, 23.0, 28.0, 26.0, 38.0, 45.0, 37.0, 43.0, 39.0, 29.0, 44.0, 53.0, 54.0, 40.0, 37.0, 41.0, 38.0, 14.0, 39.0, 28.0, 23.0, 23.0, 15.0, 13.0, 18.0, 12.0, 11.0, 8.0, 5.0, 5.0, 9.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.4375, -33.4296875, -32.421875, -31.4140625, -30.40625, -29.3984375, -28.390625, -27.3828125, -26.375, -25.3671875, -24.359375, -23.3515625, -22.34375, -21.3359375, -20.328125, -19.3203125, -18.3125, -17.3046875, -16.296875, -15.2890625, -14.28125, -13.2734375, -12.265625, -11.2578125, -10.25, -9.2421875, -8.234375, -7.2265625, -6.21875, -5.2109375, -4.203125, -3.1953125, -2.1875, -1.1796875, -0.171875, 0.8359375, 1.84375, 2.8515625, 3.859375, 4.8671875, 5.875, 6.8828125, 7.890625, 8.8984375, 9.90625, 10.9140625, 11.921875, 12.9296875, 13.9375, 14.9453125, 15.953125, 16.9609375, 17.96875, 18.9765625, 19.984375, 20.9921875, 22.0, 23.0078125, 24.015625, 25.0234375, 26.03125, 27.0390625, 28.046875, 29.0546875, 30.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 10.0, 14.0, 21.0, 31.0, 54.0, 77.0, 137.0, 217.0, 328.0, 489.0, 804.0, 1284.0, 1916.0, 3066.0, 4594.0, 7357.0, 10789.0, 16323.0, 24186.0, 34338.0, 47484.0, 63155.0, 79886.0, 94340.0, 104237.0, 106012.0, 100631.0, 88551.0, 72129.0, 56391.0, 41399.0, 29089.0, 20339.0, 13477.0, 8972.0, 5836.0, 3771.0, 2443.0, 1598.0, 997.0, 650.0, 417.0, 273.0, 163.0, 98.0, 65.0, 35.0, 29.0, 13.0, 9.0, 10.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.078125, -21.3720703125, -20.666015625, -19.9599609375, -19.25390625, -18.5478515625, -17.841796875, -17.1357421875, -16.4296875, -15.7236328125, -15.017578125, -14.3115234375, -13.60546875, -12.8994140625, -12.193359375, -11.4873046875, -10.78125, -10.0751953125, -9.369140625, -8.6630859375, -7.95703125, -7.2509765625, -6.544921875, -5.8388671875, -5.1328125, -4.4267578125, -3.720703125, -3.0146484375, -2.30859375, -1.6025390625, -0.896484375, -0.1904296875, 0.515625, 1.2216796875, 1.927734375, 2.6337890625, 3.33984375, 4.0458984375, 4.751953125, 5.4580078125, 6.1640625, 6.8701171875, 7.576171875, 8.2822265625, 8.98828125, 9.6943359375, 10.400390625, 11.1064453125, 11.8125, 12.5185546875, 13.224609375, 13.9306640625, 14.63671875, 15.3427734375, 16.048828125, 16.7548828125, 17.4609375, 18.1669921875, 18.873046875, 19.5791015625, 20.28515625, 20.9912109375, 21.697265625, 22.4033203125, 23.109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 9.0, 7.0, 12.0, 16.0, 14.0, 20.0, 21.0, 23.0, 28.0, 27.0, 41.0, 39.0, 30.0, 35.0, 41.0, 39.0, 43.0, 47.0, 37.0, 40.0, 41.0, 34.0, 38.0, 50.0, 27.0, 31.0, 32.0, 21.0, 17.0, 22.0, 16.0, 10.0, 15.0, 15.0, 5.0, 7.0, 9.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-23.71875, -23.041748046875, -22.36474609375, -21.687744140625, -21.0107421875, -20.333740234375, -19.65673828125, -18.979736328125, -18.302734375, -17.625732421875, -16.94873046875, -16.271728515625, -15.5947265625, -14.917724609375, -14.24072265625, -13.563720703125, -12.88671875, -12.209716796875, -11.53271484375, -10.855712890625, -10.1787109375, -9.501708984375, -8.82470703125, -8.147705078125, -7.470703125, -6.793701171875, -6.11669921875, -5.439697265625, -4.7626953125, -4.085693359375, -3.40869140625, -2.731689453125, -2.0546875, -1.377685546875, -0.70068359375, -0.023681640625, 0.6533203125, 1.330322265625, 2.00732421875, 2.684326171875, 3.361328125, 4.038330078125, 4.71533203125, 5.392333984375, 6.0693359375, 6.746337890625, 7.42333984375, 8.100341796875, 8.77734375, 9.454345703125, 10.13134765625, 10.808349609375, 11.4853515625, 12.162353515625, 12.83935546875, 13.516357421875, 14.193359375, 14.870361328125, 15.54736328125, 16.224365234375, 16.9013671875, 17.578369140625, 18.25537109375, 18.932373046875, 19.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 15.0, 14.0, 20.0, 30.0, 34.0, 78.0, 102.0, 167.0, 220.0, 355.0, 527.0, 882.0, 1517.0, 2416.0, 4035.0, 6786.0, 12517.0, 22800.0, 43154.0, 81357.0, 136573.0, 186757.0, 192970.0, 150532.0, 92975.0, 50793.0, 26834.0, 14409.0, 7917.0, 4769.0, 2649.0, 1602.0, 1004.0, 598.0, 411.0, 254.0, 163.0, 109.0, 67.0, 37.0, 39.0, 21.0, 12.0, 7.0, 11.0, 1.0, 2.0, 6.0, 2.0, 3.0, 1.0], "bins": [-16.703125, -16.2275390625, -15.751953125, -15.2763671875, -14.80078125, -14.3251953125, -13.849609375, -13.3740234375, -12.8984375, -12.4228515625, -11.947265625, -11.4716796875, -10.99609375, -10.5205078125, -10.044921875, -9.5693359375, -9.09375, -8.6181640625, -8.142578125, -7.6669921875, -7.19140625, -6.7158203125, -6.240234375, -5.7646484375, -5.2890625, -4.8134765625, -4.337890625, -3.8623046875, -3.38671875, -2.9111328125, -2.435546875, -1.9599609375, -1.484375, -1.0087890625, -0.533203125, -0.0576171875, 0.41796875, 0.8935546875, 1.369140625, 1.8447265625, 2.3203125, 2.7958984375, 3.271484375, 3.7470703125, 4.22265625, 4.6982421875, 5.173828125, 5.6494140625, 6.125, 6.6005859375, 7.076171875, 7.5517578125, 8.02734375, 8.5029296875, 8.978515625, 9.4541015625, 9.9296875, 10.4052734375, 10.880859375, 11.3564453125, 11.83203125, 12.3076171875, 12.783203125, 13.2587890625, 13.734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 3.0, 2.0, 9.0, 11.0, 11.0, 21.0, 40.0, 40.0, 53.0, 47.0, 75.0, 84.0, 75.0, 83.0, 86.0, 61.0, 63.0, 44.0, 50.0, 26.0, 32.0, 12.0, 20.0, 12.0, 8.0, 4.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018233805894851685, -0.0017632544040679932, -0.0017031282186508179, -0.0016430020332336426, -0.0015828758478164673, -0.001522749662399292, -0.0014626234769821167, -0.0014024972915649414, -0.0013423711061477661, -0.0012822449207305908, -0.0012221187353134155, -0.0011619925498962402, -0.001101866364479065, -0.0010417401790618896, -0.0009816139936447144, -0.0009214878082275391, -0.0008613616228103638, -0.0008012354373931885, -0.0007411092519760132, -0.0006809830665588379, -0.0006208568811416626, -0.0005607306957244873, -0.000500604510307312, -0.0004404783248901367, -0.0003803521394729614, -0.00032022595405578613, -0.00026009976863861084, -0.00019997358322143555, -0.00013984739780426025, -7.972121238708496e-05, -1.9595026969909668e-05, 4.0531158447265625e-05, 0.00010065734386444092, 0.0001607835292816162, 0.0002209097146987915, 0.0002810359001159668, 0.0003411620855331421, 0.0004012882709503174, 0.0004614144563674927, 0.000521540641784668, 0.0005816668272018433, 0.0006417930126190186, 0.0007019191980361938, 0.0007620453834533691, 0.0008221715688705444, 0.0008822977542877197, 0.000942423939704895, 0.0010025501251220703, 0.0010626763105392456, 0.001122802495956421, 0.0011829286813735962, 0.0012430548667907715, 0.0013031810522079468, 0.001363307237625122, 0.0014234334230422974, 0.0014835596084594727, 0.001543685793876648, 0.0016038119792938232, 0.0016639381647109985, 0.0017240643501281738, 0.0017841905355453491, 0.0018443167209625244, 0.0019044429063796997, 0.001964569091796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 8.0, 8.0, 10.0, 25.0, 29.0, 38.0, 48.0, 54.0, 100.0, 108.0, 138.0, 240.0, 318.0, 447.0, 625.0, 1007.0, 1615.0, 2629.0, 4664.0, 8482.0, 15914.0, 30758.0, 59860.0, 105678.0, 161799.0, 193671.0, 177134.0, 125069.0, 73883.0, 39259.0, 19915.0, 10539.0, 5703.0, 3205.0, 1917.0, 1163.0, 780.0, 497.0, 352.0, 203.0, 168.0, 118.0, 97.0, 71.0, 55.0, 44.0, 28.0, 30.0, 15.0, 8.0, 7.0, 12.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0], "bins": [-14.421875, -13.966552734375, -13.51123046875, -13.055908203125, -12.6005859375, -12.145263671875, -11.68994140625, -11.234619140625, -10.779296875, -10.323974609375, -9.86865234375, -9.413330078125, -8.9580078125, -8.502685546875, -8.04736328125, -7.592041015625, -7.13671875, -6.681396484375, -6.22607421875, -5.770751953125, -5.3154296875, -4.860107421875, -4.40478515625, -3.949462890625, -3.494140625, -3.038818359375, -2.58349609375, -2.128173828125, -1.6728515625, -1.217529296875, -0.76220703125, -0.306884765625, 0.1484375, 0.603759765625, 1.05908203125, 1.514404296875, 1.9697265625, 2.425048828125, 2.88037109375, 3.335693359375, 3.791015625, 4.246337890625, 4.70166015625, 5.156982421875, 5.6123046875, 6.067626953125, 6.52294921875, 6.978271484375, 7.43359375, 7.888916015625, 8.34423828125, 8.799560546875, 9.2548828125, 9.710205078125, 10.16552734375, 10.620849609375, 11.076171875, 11.531494140625, 11.98681640625, 12.442138671875, 12.8974609375, 13.352783203125, 13.80810546875, 14.263427734375, 14.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 15.0, 20.0, 26.0, 25.0, 33.0, 37.0, 50.0, 48.0, 57.0, 58.0, 66.0, 66.0, 69.0, 51.0, 59.0, 61.0, 41.0, 35.0, 41.0, 23.0, 30.0, 25.0, 6.0, 7.0, 13.0, 2.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.19158935546875, -5.0277099609375, -4.86383056640625, -4.699951171875, -4.53607177734375, -4.3721923828125, -4.20831298828125, -4.04443359375, -3.88055419921875, -3.7166748046875, -3.55279541015625, -3.388916015625, -3.22503662109375, -3.0611572265625, -2.89727783203125, -2.7333984375, -2.56951904296875, -2.4056396484375, -2.24176025390625, -2.077880859375, -1.91400146484375, -1.7501220703125, -1.58624267578125, -1.42236328125, -1.25848388671875, -1.0946044921875, -0.93072509765625, -0.766845703125, -0.60296630859375, -0.4390869140625, -0.27520751953125, -0.111328125, 0.05255126953125, 0.2164306640625, 0.38031005859375, 0.544189453125, 0.70806884765625, 0.8719482421875, 1.03582763671875, 1.19970703125, 1.36358642578125, 1.5274658203125, 1.69134521484375, 1.855224609375, 2.01910400390625, 2.1829833984375, 2.34686279296875, 2.5107421875, 2.67462158203125, 2.8385009765625, 3.00238037109375, 3.166259765625, 3.33013916015625, 3.4940185546875, 3.65789794921875, 3.82177734375, 3.98565673828125, 4.1495361328125, 4.31341552734375, 4.477294921875, 4.64117431640625, 4.8050537109375, 4.96893310546875, 5.1328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 9.0, 11.0, 10.0, 23.0, 27.0, 17.0, 18.0, 21.0, 21.0, 34.0, 31.0, 34.0, 35.0, 55.0, 40.0, 50.0, 33.0, 44.0, 49.0, 46.0, 44.0, 41.0, 41.0, 30.0, 27.0, 33.0, 27.0, 22.0, 19.0, 21.0, 15.0, 7.0, 13.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.40153694152832, -25.504350662231445, -24.607166290283203, -23.709980010986328, -22.812793731689453, -21.91560935974121, -21.018423080444336, -20.121238708496094, -19.22405242919922, -18.326866149902344, -17.4296817779541, -16.532495498657227, -15.635310173034668, -14.73812484741211, -13.840938568115234, -12.943753242492676, -12.0465669631958, -11.149381637573242, -10.252195358276367, -9.355010032653809, -8.45782470703125, -7.560638904571533, -6.663453102111816, -5.766267776489258, -4.869081974029541, -3.9718964099884033, -3.0747108459472656, -2.177525043487549, -1.2803394794464111, -0.38315391540527344, 0.5140318870544434, 1.411217212677002, 2.3084030151367188, 3.2055885791778564, 4.102774143218994, 4.999959945678711, 5.8971452713012695, 6.794331073760986, 7.691516876220703, 8.588702201843262, 9.48588752746582, 10.383072853088379, 11.280259132385254, 12.177444458007812, 13.074629783630371, 13.97181510925293, 14.869001388549805, 15.766186714172363, 16.663372039794922, 17.560558319091797, 18.45774269104004, 19.354928970336914, 20.25211524963379, 21.14929962158203, 22.046485900878906, 22.94367218017578, 23.840858459472656, 24.73804473876953, 25.635229110717773, 26.53241539001465, 27.429601669311523, 28.326786041259766, 29.22397232055664, 30.121158599853516, 31.018342971801758]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 5.0, 6.0, 13.0, 10.0, 11.0, 11.0, 14.0, 22.0, 21.0, 21.0, 17.0, 22.0, 36.0, 25.0, 39.0, 25.0, 28.0, 39.0, 44.0, 34.0, 32.0, 33.0, 39.0, 41.0, 44.0, 40.0, 30.0, 24.0, 37.0, 17.0, 26.0, 28.0, 25.0, 17.0, 15.0, 19.0, 18.0, 11.0, 11.0, 13.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-34.50358963012695, -33.491119384765625, -32.47864532470703, -31.466175079345703, -30.453704833984375, -29.441232681274414, -28.428760528564453, -27.416290283203125, -26.403818130493164, -25.391345977783203, -24.378875732421875, -23.366403579711914, -22.353931427001953, -21.341461181640625, -20.328989028930664, -19.316516876220703, -18.304046630859375, -17.291574478149414, -16.279104232788086, -15.266632080078125, -14.25416088104248, -13.241689682006836, -12.229217529296875, -11.21674633026123, -10.204275131225586, -9.191803932189941, -8.179332733154297, -7.166860580444336, -6.154389381408691, -5.141918182373047, -4.129446506500244, -3.1169748306274414, -2.1045055389404297, -1.092034101486206, -0.07956266403198242, 0.9329087734222412, 1.9453802108764648, 2.9578514099121094, 3.970323085784912, 4.982794761657715, 5.995265960693359, 7.007737159729004, 8.020208358764648, 9.03268051147461, 10.045151710510254, 11.057622909545898, 12.07009506225586, 13.082566261291504, 14.095037460327148, 15.107508659362793, 16.119979858398438, 17.1324520111084, 18.14492416381836, 19.157394409179688, 20.16986656188965, 21.18233871459961, 22.194808959960938, 23.2072811126709, 24.219751358032227, 25.232223510742188, 26.244693756103516, 27.257165908813477, 28.269638061523438, 29.282108306884766, 30.294580459594727]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 14.0, 16.0, 38.0, 57.0, 84.0, 166.0, 294.0, 484.0, 815.0, 1371.0, 2323.0, 3772.0, 6365.0, 10268.0, 17325.0, 27574.0, 44424.0, 69763.0, 105849.0, 156601.0, 220681.0, 294707.0, 369235.0, 430508.0, 457799.0, 447563.0, 400792.0, 330665.0, 254637.0, 183811.0, 127947.0, 84498.0, 54695.0, 34708.0, 21475.0, 13036.0, 8079.0, 4806.0, 2891.0, 1657.0, 1013.0, 618.0, 354.0, 206.0, 118.0, 62.0, 48.0, 38.0, 12.0, 9.0, 9.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.03125, -21.358154296875, -20.68505859375, -20.011962890625, -19.3388671875, -18.665771484375, -17.99267578125, -17.319580078125, -16.646484375, -15.973388671875, -15.30029296875, -14.627197265625, -13.9541015625, -13.281005859375, -12.60791015625, -11.934814453125, -11.26171875, -10.588623046875, -9.91552734375, -9.242431640625, -8.5693359375, -7.896240234375, -7.22314453125, -6.550048828125, -5.876953125, -5.203857421875, -4.53076171875, -3.857666015625, -3.1845703125, -2.511474609375, -1.83837890625, -1.165283203125, -0.4921875, 0.180908203125, 0.85400390625, 1.527099609375, 2.2001953125, 2.873291015625, 3.54638671875, 4.219482421875, 4.892578125, 5.565673828125, 6.23876953125, 6.911865234375, 7.5849609375, 8.258056640625, 8.93115234375, 9.604248046875, 10.27734375, 10.950439453125, 11.62353515625, 12.296630859375, 12.9697265625, 13.642822265625, 14.31591796875, 14.989013671875, 15.662109375, 16.335205078125, 17.00830078125, 17.681396484375, 18.3544921875, 19.027587890625, 19.70068359375, 20.373779296875, 21.046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 9.0, 14.0, 7.0, 13.0, 20.0, 22.0, 16.0, 26.0, 15.0, 33.0, 31.0, 33.0, 35.0, 24.0, 37.0, 43.0, 41.0, 33.0, 27.0, 32.0, 45.0, 48.0, 47.0, 25.0, 26.0, 34.0, 25.0, 21.0, 29.0, 27.0, 16.0, 19.0, 16.0, 10.0, 19.0, 13.0, 13.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-29.703125, -28.838134765625, -27.97314453125, -27.108154296875, -26.2431640625, -25.378173828125, -24.51318359375, -23.648193359375, -22.783203125, -21.918212890625, -21.05322265625, -20.188232421875, -19.3232421875, -18.458251953125, -17.59326171875, -16.728271484375, -15.86328125, -14.998291015625, -14.13330078125, -13.268310546875, -12.4033203125, -11.538330078125, -10.67333984375, -9.808349609375, -8.943359375, -8.078369140625, -7.21337890625, -6.348388671875, -5.4833984375, -4.618408203125, -3.75341796875, -2.888427734375, -2.0234375, -1.158447265625, -0.29345703125, 0.571533203125, 1.4365234375, 2.301513671875, 3.16650390625, 4.031494140625, 4.896484375, 5.761474609375, 6.62646484375, 7.491455078125, 8.3564453125, 9.221435546875, 10.08642578125, 10.951416015625, 11.81640625, 12.681396484375, 13.54638671875, 14.411376953125, 15.2763671875, 16.141357421875, 17.00634765625, 17.871337890625, 18.736328125, 19.601318359375, 20.46630859375, 21.331298828125, 22.1962890625, 23.061279296875, 23.92626953125, 24.791259765625, 25.65625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 9.0, 12.0, 20.0, 40.0, 77.0, 108.0, 190.0, 354.0, 609.0, 953.0, 1747.0, 2809.0, 4515.0, 7413.0, 11748.0, 18302.0, 27792.0, 42135.0, 61085.0, 88167.0, 121028.0, 162091.0, 207877.0, 256047.0, 301280.0, 338585.0, 361547.0, 364416.0, 351017.0, 319259.0, 276569.0, 229001.0, 181822.0, 138182.0, 102507.0, 72033.0, 49436.0, 33386.0, 22457.0, 14278.0, 8973.0, 5711.0, 3501.0, 2085.0, 1275.0, 773.0, 456.0, 266.0, 150.0, 82.0, 54.0, 24.0, 13.0, 13.0, 7.0, 7.0, 1.0, 1.0], "bins": [-19.34375, -18.761474609375, -18.17919921875, -17.596923828125, -17.0146484375, -16.432373046875, -15.85009765625, -15.267822265625, -14.685546875, -14.103271484375, -13.52099609375, -12.938720703125, -12.3564453125, -11.774169921875, -11.19189453125, -10.609619140625, -10.02734375, -9.445068359375, -8.86279296875, -8.280517578125, -7.6982421875, -7.115966796875, -6.53369140625, -5.951416015625, -5.369140625, -4.786865234375, -4.20458984375, -3.622314453125, -3.0400390625, -2.457763671875, -1.87548828125, -1.293212890625, -0.7109375, -0.128662109375, 0.45361328125, 1.035888671875, 1.6181640625, 2.200439453125, 2.78271484375, 3.364990234375, 3.947265625, 4.529541015625, 5.11181640625, 5.694091796875, 6.2763671875, 6.858642578125, 7.44091796875, 8.023193359375, 8.60546875, 9.187744140625, 9.77001953125, 10.352294921875, 10.9345703125, 11.516845703125, 12.09912109375, 12.681396484375, 13.263671875, 13.845947265625, 14.42822265625, 15.010498046875, 15.5927734375, 16.175048828125, 16.75732421875, 17.339599609375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 10.0, 9.0, 17.0, 16.0, 26.0, 25.0, 37.0, 55.0, 61.0, 57.0, 72.0, 120.0, 116.0, 139.0, 138.0, 153.0, 160.0, 185.0, 203.0, 183.0, 180.0, 197.0, 170.0, 218.0, 184.0, 190.0, 172.0, 157.0, 113.0, 114.0, 100.0, 89.0, 76.0, 68.0, 58.0, 44.0, 31.0, 36.0, 21.0, 17.0, 10.0, 12.0, 8.0, 8.0, 10.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.09375, -10.6961669921875, -10.298583984375, -9.9010009765625, -9.50341796875, -9.1058349609375, -8.708251953125, -8.3106689453125, -7.9130859375, -7.5155029296875, -7.117919921875, -6.7203369140625, -6.32275390625, -5.9251708984375, -5.527587890625, -5.1300048828125, -4.732421875, -4.3348388671875, -3.937255859375, -3.5396728515625, -3.14208984375, -2.7445068359375, -2.346923828125, -1.9493408203125, -1.5517578125, -1.1541748046875, -0.756591796875, -0.3590087890625, 0.03857421875, 0.4361572265625, 0.833740234375, 1.2313232421875, 1.62890625, 2.0264892578125, 2.424072265625, 2.8216552734375, 3.21923828125, 3.6168212890625, 4.014404296875, 4.4119873046875, 4.8095703125, 5.2071533203125, 5.604736328125, 6.0023193359375, 6.39990234375, 6.7974853515625, 7.195068359375, 7.5926513671875, 7.990234375, 8.3878173828125, 8.785400390625, 9.1829833984375, 9.58056640625, 9.9781494140625, 10.375732421875, 10.7733154296875, 11.1708984375, 11.5684814453125, 11.966064453125, 12.3636474609375, 12.76123046875, 13.1588134765625, 13.556396484375, 13.9539794921875, 14.3515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 10.0, 11.0, 14.0, 13.0, 18.0, 27.0, 23.0, 29.0, 24.0, 30.0, 31.0, 43.0, 35.0, 36.0, 39.0, 44.0, 41.0, 41.0, 46.0, 47.0, 42.0, 37.0, 36.0, 35.0, 30.0, 25.0, 31.0, 24.0, 20.0, 14.0, 25.0, 10.0, 15.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.26859474182129, -26.371686935424805, -25.474777221679688, -24.577869415283203, -23.680959701538086, -22.7840518951416, -21.887142181396484, -20.990234375, -20.093326568603516, -19.19641876220703, -18.299509048461914, -17.40260124206543, -16.505691528320312, -15.608783721923828, -14.711874961853027, -13.814966201782227, -12.918057441711426, -12.021148681640625, -11.124239921569824, -10.227331161499023, -9.330423355102539, -8.433514595031738, -7.5366058349609375, -6.639697551727295, -5.742788791656494, -4.845880031585693, -3.948971748352051, -3.05206298828125, -2.1551544666290283, -1.2582459449768066, -0.36133718490600586, 0.5355710983276367, 1.4324798583984375, 2.329388380050659, 3.226296901702881, 4.123205661773682, 5.020113945007324, 5.917022705078125, 6.813931465148926, 7.710839748382568, 8.607748031616211, 9.504656791687012, 10.401565551757812, 11.298473358154297, 12.195382118225098, 13.092290878295898, 13.9891996383667, 14.8861083984375, 15.7830171585083, 16.6799259185791, 17.576833724975586, 18.473743438720703, 19.370651245117188, 20.267559051513672, 21.16446876525879, 22.061376571655273, 22.95828628540039, 23.855194091796875, 24.752103805541992, 25.649011611938477, 26.545921325683594, 27.442829132080078, 28.339736938476562, 29.23664665222168, 30.133554458618164]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 12.0, 15.0, 21.0, 15.0, 20.0, 31.0, 27.0, 35.0, 33.0, 29.0, 37.0, 35.0, 42.0, 37.0, 50.0, 50.0, 29.0, 41.0, 46.0, 41.0, 45.0, 34.0, 24.0, 36.0, 37.0, 23.0, 25.0, 19.0, 15.0, 13.0, 12.0, 18.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.478355407714844, -36.3380241394043, -35.197696685791016, -34.05736541748047, -32.91703414916992, -31.77670669555664, -30.636375427246094, -29.49604606628418, -28.355716705322266, -27.21538734436035, -26.075056076049805, -24.93472671508789, -23.794397354125977, -22.654067993164062, -21.513736724853516, -20.3734073638916, -19.233076095581055, -18.09274673461914, -16.952415466308594, -15.81208610534668, -14.671756744384766, -13.531426429748535, -12.391096115112305, -11.25076675415039, -10.11043643951416, -8.97010612487793, -7.829776763916016, -6.689446449279785, -5.549116611480713, -4.408786773681641, -3.26845645904541, -2.128126621246338, -0.9877967834472656, 0.1525331735610962, 1.292863130569458, 2.4331932067871094, 3.5735230445861816, 4.713852882385254, 5.854183197021484, 6.994513034820557, 8.134842872619629, 9.27517318725586, 10.415502548217773, 11.555832862854004, 12.696163177490234, 13.836492538452148, 14.976822853088379, 16.11715316772461, 17.257482528686523, 18.397811889648438, 19.538143157958984, 20.6784725189209, 21.818801879882812, 22.95913314819336, 24.099462509155273, 25.239791870117188, 26.380123138427734, 27.52045249938965, 28.660783767700195, 29.80111312866211, 30.941442489624023, 32.08177185058594, 33.222103118896484, 34.36243438720703, 35.50276184082031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 11.0, 18.0, 18.0, 22.0, 45.0, 58.0, 80.0, 120.0, 152.0, 257.0, 337.0, 479.0, 757.0, 1222.0, 2213.0, 4052.0, 9352.0, 27548.0, 93404.0, 311827.0, 397540.0, 135087.0, 39462.0, 12887.0, 5011.0, 2444.0, 1385.0, 890.0, 605.0, 374.0, 276.0, 181.0, 125.0, 86.0, 75.0, 43.0, 29.0, 24.0, 16.0, 11.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.473388671875, -25.64990234375, -24.826416015625, -24.0029296875, -23.179443359375, -22.35595703125, -21.532470703125, -20.708984375, -19.885498046875, -19.06201171875, -18.238525390625, -17.4150390625, -16.591552734375, -15.76806640625, -14.944580078125, -14.12109375, -13.297607421875, -12.47412109375, -11.650634765625, -10.8271484375, -10.003662109375, -9.18017578125, -8.356689453125, -7.533203125, -6.709716796875, -5.88623046875, -5.062744140625, -4.2392578125, -3.415771484375, -2.59228515625, -1.768798828125, -0.9453125, -0.121826171875, 0.70166015625, 1.525146484375, 2.3486328125, 3.172119140625, 3.99560546875, 4.819091796875, 5.642578125, 6.466064453125, 7.28955078125, 8.113037109375, 8.9365234375, 9.760009765625, 10.58349609375, 11.406982421875, 12.23046875, 13.053955078125, 13.87744140625, 14.700927734375, 15.5244140625, 16.347900390625, 17.17138671875, 17.994873046875, 18.818359375, 19.641845703125, 20.46533203125, 21.288818359375, 22.1123046875, 22.935791015625, 23.75927734375, 24.582763671875, 25.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 12.0, 13.0, 20.0, 17.0, 19.0, 31.0, 24.0, 37.0, 35.0, 26.0, 34.0, 36.0, 40.0, 41.0, 46.0, 52.0, 32.0, 37.0, 46.0, 44.0, 40.0, 37.0, 30.0, 31.0, 39.0, 25.0, 24.0, 19.0, 15.0, 14.0, 13.0, 18.0, 12.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.36572265625, -35.2314453125, -34.09716796875, -32.962890625, -31.82861328125, -30.6943359375, -29.56005859375, -28.42578125, -27.29150390625, -26.1572265625, -25.02294921875, -23.888671875, -22.75439453125, -21.6201171875, -20.48583984375, -19.3515625, -18.21728515625, -17.0830078125, -15.94873046875, -14.814453125, -13.68017578125, -12.5458984375, -11.41162109375, -10.27734375, -9.14306640625, -8.0087890625, -6.87451171875, -5.740234375, -4.60595703125, -3.4716796875, -2.33740234375, -1.203125, -0.06884765625, 1.0654296875, 2.19970703125, 3.333984375, 4.46826171875, 5.6025390625, 6.73681640625, 7.87109375, 9.00537109375, 10.1396484375, 11.27392578125, 12.408203125, 13.54248046875, 14.6767578125, 15.81103515625, 16.9453125, 18.07958984375, 19.2138671875, 20.34814453125, 21.482421875, 22.61669921875, 23.7509765625, 24.88525390625, 26.01953125, 27.15380859375, 28.2880859375, 29.42236328125, 30.556640625, 31.69091796875, 32.8251953125, 33.95947265625, 35.09375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 7.0, 4.0, 8.0, 6.0, 24.0, 26.0, 35.0, 36.0, 53.0, 76.0, 119.0, 152.0, 226.0, 321.0, 446.0, 581.0, 779.0, 1160.0, 1826.0, 2818.0, 4257.0, 6973.0, 12240.0, 23768.0, 51487.0, 128793.0, 319255.0, 286491.0, 110467.0, 45567.0, 21159.0, 11078.0, 6461.0, 3876.0, 2470.0, 1608.0, 1154.0, 822.0, 542.0, 425.0, 273.0, 183.0, 177.0, 101.0, 51.0, 48.0, 33.0, 24.0, 25.0, 10.0, 13.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-11.7109375, -11.319580078125, -10.92822265625, -10.536865234375, -10.1455078125, -9.754150390625, -9.36279296875, -8.971435546875, -8.580078125, -8.188720703125, -7.79736328125, -7.406005859375, -7.0146484375, -6.623291015625, -6.23193359375, -5.840576171875, -5.44921875, -5.057861328125, -4.66650390625, -4.275146484375, -3.8837890625, -3.492431640625, -3.10107421875, -2.709716796875, -2.318359375, -1.927001953125, -1.53564453125, -1.144287109375, -0.7529296875, -0.361572265625, 0.02978515625, 0.421142578125, 0.8125, 1.203857421875, 1.59521484375, 1.986572265625, 2.3779296875, 2.769287109375, 3.16064453125, 3.552001953125, 3.943359375, 4.334716796875, 4.72607421875, 5.117431640625, 5.5087890625, 5.900146484375, 6.29150390625, 6.682861328125, 7.07421875, 7.465576171875, 7.85693359375, 8.248291015625, 8.6396484375, 9.031005859375, 9.42236328125, 9.813720703125, 10.205078125, 10.596435546875, 10.98779296875, 11.379150390625, 11.7705078125, 12.161865234375, 12.55322265625, 12.944580078125, 13.3359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 7.0, 6.0, 8.0, 11.0, 6.0, 5.0, 9.0, 16.0, 21.0, 17.0, 18.0, 27.0, 21.0, 26.0, 38.0, 28.0, 29.0, 31.0, 37.0, 39.0, 35.0, 50.0, 34.0, 37.0, 37.0, 37.0, 30.0, 32.0, 37.0, 38.0, 36.0, 29.0, 18.0, 25.0, 17.0, 17.0, 15.0, 9.0, 15.0, 15.0, 1.0, 7.0, 6.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.234375, -24.44873046875, -23.6630859375, -22.87744140625, -22.091796875, -21.30615234375, -20.5205078125, -19.73486328125, -18.94921875, -18.16357421875, -17.3779296875, -16.59228515625, -15.806640625, -15.02099609375, -14.2353515625, -13.44970703125, -12.6640625, -11.87841796875, -11.0927734375, -10.30712890625, -9.521484375, -8.73583984375, -7.9501953125, -7.16455078125, -6.37890625, -5.59326171875, -4.8076171875, -4.02197265625, -3.236328125, -2.45068359375, -1.6650390625, -0.87939453125, -0.09375, 0.69189453125, 1.4775390625, 2.26318359375, 3.048828125, 3.83447265625, 4.6201171875, 5.40576171875, 6.19140625, 6.97705078125, 7.7626953125, 8.54833984375, 9.333984375, 10.11962890625, 10.9052734375, 11.69091796875, 12.4765625, 13.26220703125, 14.0478515625, 14.83349609375, 15.619140625, 16.40478515625, 17.1904296875, 17.97607421875, 18.76171875, 19.54736328125, 20.3330078125, 21.11865234375, 21.904296875, 22.68994140625, 23.4755859375, 24.26123046875, 25.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 11.0, 7.0, 14.0, 13.0, 28.0, 42.0, 43.0, 49.0, 86.0, 93.0, 111.0, 165.0, 204.0, 239.0, 365.0, 462.0, 735.0, 1140.0, 1992.0, 3970.0, 11529.0, 75847.0, 859214.0, 71268.0, 11195.0, 4052.0, 1937.0, 1107.0, 705.0, 497.0, 328.0, 232.0, 223.0, 155.0, 117.0, 72.0, 59.0, 65.0, 38.0, 33.0, 33.0, 26.0, 14.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.5625, -33.46484375, -32.3671875, -31.26953125, -30.171875, -29.07421875, -27.9765625, -26.87890625, -25.78125, -24.68359375, -23.5859375, -22.48828125, -21.390625, -20.29296875, -19.1953125, -18.09765625, -17.0, -15.90234375, -14.8046875, -13.70703125, -12.609375, -11.51171875, -10.4140625, -9.31640625, -8.21875, -7.12109375, -6.0234375, -4.92578125, -3.828125, -2.73046875, -1.6328125, -0.53515625, 0.5625, 1.66015625, 2.7578125, 3.85546875, 4.953125, 6.05078125, 7.1484375, 8.24609375, 9.34375, 10.44140625, 11.5390625, 12.63671875, 13.734375, 14.83203125, 15.9296875, 17.02734375, 18.125, 19.22265625, 20.3203125, 21.41796875, 22.515625, 23.61328125, 24.7109375, 25.80859375, 26.90625, 28.00390625, 29.1015625, 30.19921875, 31.296875, 32.39453125, 33.4921875, 34.58984375, 35.6875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 8.0, 16.0, 14.0, 40.0, 55.0, 105.0, 132.0, 175.0, 148.0, 108.0, 75.0, 45.0, 19.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00211334228515625, -0.0020556747913360596, -0.001998007297515869, -0.0019403398036956787, -0.0018826723098754883, -0.0018250048160552979, -0.0017673373222351074, -0.001709669828414917, -0.0016520023345947266, -0.0015943348407745361, -0.0015366673469543457, -0.0014789998531341553, -0.0014213323593139648, -0.0013636648654937744, -0.001305997371673584, -0.0012483298778533936, -0.0011906623840332031, -0.0011329948902130127, -0.0010753273963928223, -0.0010176599025726318, -0.0009599924087524414, -0.000902324914932251, -0.0008446574211120605, -0.0007869899272918701, -0.0007293224334716797, -0.0006716549396514893, -0.0006139874458312988, -0.0005563199520111084, -0.000498652458190918, -0.00044098496437072754, -0.0003833174705505371, -0.0003256499767303467, -0.00026798248291015625, -0.00021031498908996582, -0.0001526474952697754, -9.498000144958496e-05, -3.731250762939453e-05, 2.03549861907959e-05, 7.802248001098633e-05, 0.00013568997383117676, 0.0001933574676513672, 0.0002510249614715576, 0.00030869245529174805, 0.0003663599491119385, 0.0004240274429321289, 0.00048169493675231934, 0.0005393624305725098, 0.0005970299243927002, 0.0006546974182128906, 0.0007123649120330811, 0.0007700324058532715, 0.0008276998996734619, 0.0008853673934936523, 0.0009430348873138428, 0.0010007023811340332, 0.0010583698749542236, 0.001116037368774414, 0.0011737048625946045, 0.001231372356414795, 0.0012890398502349854, 0.0013467073440551758, 0.0014043748378753662, 0.0014620423316955566, 0.001519709825515747, 0.0015773773193359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 9.0, 5.0, 11.0, 27.0, 34.0, 47.0, 62.0, 89.0, 122.0, 174.0, 275.0, 434.0, 698.0, 1046.0, 1768.0, 3225.0, 6769.0, 18212.0, 75054.0, 504355.0, 356931.0, 52204.0, 14060.0, 5725.0, 2786.0, 1618.0, 950.0, 613.0, 370.0, 272.0, 201.0, 120.0, 62.0, 56.0, 47.0, 23.0, 24.0, 13.0, 20.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.125, -25.279296875, -24.43359375, -23.587890625, -22.7421875, -21.896484375, -21.05078125, -20.205078125, -19.359375, -18.513671875, -17.66796875, -16.822265625, -15.9765625, -15.130859375, -14.28515625, -13.439453125, -12.59375, -11.748046875, -10.90234375, -10.056640625, -9.2109375, -8.365234375, -7.51953125, -6.673828125, -5.828125, -4.982421875, -4.13671875, -3.291015625, -2.4453125, -1.599609375, -0.75390625, 0.091796875, 0.9375, 1.783203125, 2.62890625, 3.474609375, 4.3203125, 5.166015625, 6.01171875, 6.857421875, 7.703125, 8.548828125, 9.39453125, 10.240234375, 11.0859375, 11.931640625, 12.77734375, 13.623046875, 14.46875, 15.314453125, 16.16015625, 17.005859375, 17.8515625, 18.697265625, 19.54296875, 20.388671875, 21.234375, 22.080078125, 22.92578125, 23.771484375, 24.6171875, 25.462890625, 26.30859375, 27.154296875, 28.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 12.0, 21.0, 16.0, 25.0, 62.0, 146.0, 219.0, 200.0, 116.0, 45.0, 27.0, 31.0, 12.0, 11.0, 6.0, 7.0, 4.0, 8.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4453125, -13.0802001953125, -12.715087890625, -12.3499755859375, -11.98486328125, -11.6197509765625, -11.254638671875, -10.8895263671875, -10.5244140625, -10.1593017578125, -9.794189453125, -9.4290771484375, -9.06396484375, -8.6988525390625, -8.333740234375, -7.9686279296875, -7.603515625, -7.2384033203125, -6.873291015625, -6.5081787109375, -6.14306640625, -5.7779541015625, -5.412841796875, -5.0477294921875, -4.6826171875, -4.3175048828125, -3.952392578125, -3.5872802734375, -3.22216796875, -2.8570556640625, -2.491943359375, -2.1268310546875, -1.76171875, -1.3966064453125, -1.031494140625, -0.6663818359375, -0.30126953125, 0.0638427734375, 0.428955078125, 0.7940673828125, 1.1591796875, 1.5242919921875, 1.889404296875, 2.2545166015625, 2.61962890625, 2.9847412109375, 3.349853515625, 3.7149658203125, 4.080078125, 4.4451904296875, 4.810302734375, 5.1754150390625, 5.54052734375, 5.9056396484375, 6.270751953125, 6.6358642578125, 7.0009765625, 7.3660888671875, 7.731201171875, 8.0963134765625, 8.46142578125, 8.8265380859375, 9.191650390625, 9.5567626953125, 9.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 16.0, 9.0, 16.0, 17.0, 27.0, 30.0, 26.0, 31.0, 37.0, 33.0, 38.0, 39.0, 35.0, 40.0, 36.0, 42.0, 45.0, 45.0, 49.0, 47.0, 31.0, 39.0, 30.0, 26.0, 29.0, 28.0, 21.0, 14.0, 21.0, 15.0, 14.0, 10.0, 7.0, 5.0, 7.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.927095413208008, -26.02306365966797, -25.11903190612793, -24.21500015258789, -23.31096839904785, -22.406936645507812, -21.502906799316406, -20.598873138427734, -19.694843292236328, -18.79081153869629, -17.88677978515625, -16.98274803161621, -16.078716278076172, -15.174684524536133, -14.27065372467041, -13.366621971130371, -12.462589263916016, -11.558557510375977, -10.654525756835938, -9.750494003295898, -8.84646224975586, -7.9424309730529785, -7.038399696350098, -6.134367942810059, -5.2303361892700195, -4.3263044357299805, -3.4222729206085205, -2.5182414054870605, -1.6142096519470215, -0.7101778984069824, 0.19385337829589844, 1.0978851318359375, 2.0019149780273438, 2.905946731567383, 3.8099782466888428, 4.714009761810303, 5.618041515350342, 6.522073268890381, 7.426104545593262, 8.3301362991333, 9.23416805267334, 10.138199806213379, 11.042231559753418, 11.94626235961914, 12.85029411315918, 13.754325866699219, 14.658357620239258, 15.562389373779297, 16.466421127319336, 17.370452880859375, 18.274484634399414, 19.178516387939453, 20.082548141479492, 20.98657989501953, 21.890609741210938, 22.79464340209961, 23.698673248291016, 24.602705001831055, 25.506736755371094, 26.410768508911133, 27.314800262451172, 28.21883201599121, 29.12286376953125, 30.026893615722656, 30.930927276611328]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 3.0, 2.0, 6.0, 5.0, 6.0, 12.0, 16.0, 16.0, 22.0, 27.0, 22.0, 32.0, 35.0, 31.0, 42.0, 26.0, 34.0, 44.0, 41.0, 42.0, 48.0, 35.0, 37.0, 43.0, 42.0, 29.0, 44.0, 36.0, 37.0, 28.0, 23.0, 23.0, 12.0, 20.0, 14.0, 14.0, 11.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.615440368652344, -36.495338439941406, -35.37523651123047, -34.25513458251953, -33.135032653808594, -32.014930725097656, -30.89483070373535, -29.774728775024414, -28.654626846313477, -27.53452491760254, -26.4144229888916, -25.294321060180664, -24.17422103881836, -23.054119110107422, -21.934017181396484, -20.813915252685547, -19.69381332397461, -18.573711395263672, -17.453609466552734, -16.333507537841797, -15.213406562805176, -14.093304634094238, -12.973203659057617, -11.85310173034668, -10.732999801635742, -9.612897872924805, -8.492795944213867, -7.372694969177246, -6.252593040466309, -5.132491111755371, -4.012389659881592, -2.8922882080078125, -1.772186279296875, -0.6520845890045166, 0.4680171012878418, 1.5881187915802002, 2.7082204818725586, 3.828322410583496, 4.948423862457275, 6.068525314331055, 7.188627243041992, 8.30872917175293, 9.428831100463867, 10.548932075500488, 11.669034004211426, 12.789135932922363, 13.909236907958984, 15.029338836669922, 16.14944076538086, 17.269542694091797, 18.389644622802734, 19.509746551513672, 20.62984848022461, 21.749950408935547, 22.87005043029785, 23.99015235900879, 25.110254287719727, 26.230356216430664, 27.3504581451416, 28.47056007385254, 29.590660095214844, 30.71076202392578, 31.83086395263672, 32.950965881347656, 34.071067810058594]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 17.0, 24.0, 30.0, 75.0, 96.0, 123.0, 223.0, 330.0, 530.0, 806.0, 1346.0, 2075.0, 3259.0, 5140.0, 7590.0, 11785.0, 17591.0, 25611.0, 35728.0, 48575.0, 62859.0, 77701.0, 90715.0, 99134.0, 101318.0, 95822.0, 86704.0, 73027.0, 57656.0, 44023.0, 32056.0, 22375.0, 15305.0, 10136.0, 6808.0, 4381.0, 2775.0, 1757.0, 1131.0, 743.0, 454.0, 224.0, 158.0, 121.0, 81.0, 52.0, 33.0, 16.0, 12.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0], "bins": [-20.8125, -20.18798828125, -19.5634765625, -18.93896484375, -18.314453125, -17.68994140625, -17.0654296875, -16.44091796875, -15.81640625, -15.19189453125, -14.5673828125, -13.94287109375, -13.318359375, -12.69384765625, -12.0693359375, -11.44482421875, -10.8203125, -10.19580078125, -9.5712890625, -8.94677734375, -8.322265625, -7.69775390625, -7.0732421875, -6.44873046875, -5.82421875, -5.19970703125, -4.5751953125, -3.95068359375, -3.326171875, -2.70166015625, -2.0771484375, -1.45263671875, -0.828125, -0.20361328125, 0.4208984375, 1.04541015625, 1.669921875, 2.29443359375, 2.9189453125, 3.54345703125, 4.16796875, 4.79248046875, 5.4169921875, 6.04150390625, 6.666015625, 7.29052734375, 7.9150390625, 8.53955078125, 9.1640625, 9.78857421875, 10.4130859375, 11.03759765625, 11.662109375, 12.28662109375, 12.9111328125, 13.53564453125, 14.16015625, 14.78466796875, 15.4091796875, 16.03369140625, 16.658203125, 17.28271484375, 17.9072265625, 18.53173828125, 19.15625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 5.0, 12.0, 13.0, 20.0, 19.0, 28.0, 22.0, 29.0, 36.0, 29.0, 43.0, 30.0, 31.0, 43.0, 38.0, 47.0, 48.0, 37.0, 33.0, 45.0, 38.0, 41.0, 32.0, 43.0, 37.0, 26.0, 24.0, 21.0, 15.0, 19.0, 12.0, 17.0, 11.0, 10.0, 7.0, 3.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.78125, -35.68896484375, -34.5966796875, -33.50439453125, -32.412109375, -31.31982421875, -30.2275390625, -29.13525390625, -28.04296875, -26.95068359375, -25.8583984375, -24.76611328125, -23.673828125, -22.58154296875, -21.4892578125, -20.39697265625, -19.3046875, -18.21240234375, -17.1201171875, -16.02783203125, -14.935546875, -13.84326171875, -12.7509765625, -11.65869140625, -10.56640625, -9.47412109375, -8.3818359375, -7.28955078125, -6.197265625, -5.10498046875, -4.0126953125, -2.92041015625, -1.828125, -0.73583984375, 0.3564453125, 1.44873046875, 2.541015625, 3.63330078125, 4.7255859375, 5.81787109375, 6.91015625, 8.00244140625, 9.0947265625, 10.18701171875, 11.279296875, 12.37158203125, 13.4638671875, 14.55615234375, 15.6484375, 16.74072265625, 17.8330078125, 18.92529296875, 20.017578125, 21.10986328125, 22.2021484375, 23.29443359375, 24.38671875, 25.47900390625, 26.5712890625, 27.66357421875, 28.755859375, 29.84814453125, 30.9404296875, 32.03271484375, 33.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 16.0, 30.0, 61.0, 82.0, 122.0, 182.0, 259.0, 407.0, 601.0, 910.0, 1312.0, 2069.0, 3164.0, 4642.0, 7025.0, 10514.0, 15387.0, 22772.0, 32191.0, 44423.0, 58744.0, 74013.0, 88219.0, 98326.0, 102356.0, 99225.0, 89657.0, 76025.0, 61103.0, 46437.0, 33920.0, 23937.0, 16589.0, 11363.0, 7607.0, 5058.0, 3281.0, 2232.0, 1433.0, 997.0, 632.0, 400.0, 265.0, 171.0, 130.0, 84.0, 55.0, 43.0, 22.0, 19.0, 15.0, 2.0, 1.0, 5.0, 3.0, 1.0], "bins": [-21.109375, -20.46142578125, -19.8134765625, -19.16552734375, -18.517578125, -17.86962890625, -17.2216796875, -16.57373046875, -15.92578125, -15.27783203125, -14.6298828125, -13.98193359375, -13.333984375, -12.68603515625, -12.0380859375, -11.39013671875, -10.7421875, -10.09423828125, -9.4462890625, -8.79833984375, -8.150390625, -7.50244140625, -6.8544921875, -6.20654296875, -5.55859375, -4.91064453125, -4.2626953125, -3.61474609375, -2.966796875, -2.31884765625, -1.6708984375, -1.02294921875, -0.375, 0.27294921875, 0.9208984375, 1.56884765625, 2.216796875, 2.86474609375, 3.5126953125, 4.16064453125, 4.80859375, 5.45654296875, 6.1044921875, 6.75244140625, 7.400390625, 8.04833984375, 8.6962890625, 9.34423828125, 9.9921875, 10.64013671875, 11.2880859375, 11.93603515625, 12.583984375, 13.23193359375, 13.8798828125, 14.52783203125, 15.17578125, 15.82373046875, 16.4716796875, 17.11962890625, 17.767578125, 18.41552734375, 19.0634765625, 19.71142578125, 20.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 7.0, 10.0, 8.0, 14.0, 15.0, 15.0, 19.0, 27.0, 11.0, 24.0, 28.0, 27.0, 24.0, 27.0, 33.0, 30.0, 30.0, 38.0, 44.0, 48.0, 37.0, 36.0, 39.0, 36.0, 30.0, 35.0, 37.0, 25.0, 35.0, 14.0, 23.0, 24.0, 25.0, 16.0, 14.0, 13.0, 12.0, 10.0, 8.0, 6.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-20.21875, -19.5732421875, -18.927734375, -18.2822265625, -17.63671875, -16.9912109375, -16.345703125, -15.7001953125, -15.0546875, -14.4091796875, -13.763671875, -13.1181640625, -12.47265625, -11.8271484375, -11.181640625, -10.5361328125, -9.890625, -9.2451171875, -8.599609375, -7.9541015625, -7.30859375, -6.6630859375, -6.017578125, -5.3720703125, -4.7265625, -4.0810546875, -3.435546875, -2.7900390625, -2.14453125, -1.4990234375, -0.853515625, -0.2080078125, 0.4375, 1.0830078125, 1.728515625, 2.3740234375, 3.01953125, 3.6650390625, 4.310546875, 4.9560546875, 5.6015625, 6.2470703125, 6.892578125, 7.5380859375, 8.18359375, 8.8291015625, 9.474609375, 10.1201171875, 10.765625, 11.4111328125, 12.056640625, 12.7021484375, 13.34765625, 13.9931640625, 14.638671875, 15.2841796875, 15.9296875, 16.5751953125, 17.220703125, 17.8662109375, 18.51171875, 19.1572265625, 19.802734375, 20.4482421875, 21.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 11.0, 15.0, 28.0, 42.0, 72.0, 110.0, 165.0, 244.0, 425.0, 660.0, 983.0, 1653.0, 2815.0, 4910.0, 8827.0, 15688.0, 29387.0, 52817.0, 88610.0, 131027.0, 164372.0, 168520.0, 141725.0, 98716.0, 60383.0, 33857.0, 18505.0, 10111.0, 5592.0, 3191.0, 1926.0, 1182.0, 722.0, 425.0, 257.0, 192.0, 133.0, 83.0, 64.0, 45.0, 20.0, 8.0, 12.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.2193603515625, -11.813720703125, -11.4080810546875, -11.00244140625, -10.5968017578125, -10.191162109375, -9.7855224609375, -9.3798828125, -8.9742431640625, -8.568603515625, -8.1629638671875, -7.75732421875, -7.3516845703125, -6.946044921875, -6.5404052734375, -6.134765625, -5.7291259765625, -5.323486328125, -4.9178466796875, -4.51220703125, -4.1065673828125, -3.700927734375, -3.2952880859375, -2.8896484375, -2.4840087890625, -2.078369140625, -1.6727294921875, -1.26708984375, -0.8614501953125, -0.455810546875, -0.0501708984375, 0.35546875, 0.7611083984375, 1.166748046875, 1.5723876953125, 1.97802734375, 2.3836669921875, 2.789306640625, 3.1949462890625, 3.6005859375, 4.0062255859375, 4.411865234375, 4.8175048828125, 5.22314453125, 5.6287841796875, 6.034423828125, 6.4400634765625, 6.845703125, 7.2513427734375, 7.656982421875, 8.0626220703125, 8.46826171875, 8.8739013671875, 9.279541015625, 9.6851806640625, 10.0908203125, 10.4964599609375, 10.902099609375, 11.3077392578125, 11.71337890625, 12.1190185546875, 12.524658203125, 12.9302978515625, 13.3359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 11.0, 16.0, 16.0, 18.0, 26.0, 33.0, 38.0, 37.0, 41.0, 49.0, 43.0, 64.0, 55.0, 61.0, 50.0, 58.0, 58.0, 44.0, 36.0, 45.0, 36.0, 32.0, 26.0, 20.0, 15.0, 17.0, 8.0, 5.0, 9.0, 3.0, 7.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011653900146484375, -0.0011249035596847534, -0.0010844171047210693, -0.0010439306497573853, -0.0010034441947937012, -0.0009629577398300171, -0.000922471284866333, -0.0008819848299026489, -0.0008414983749389648, -0.0008010119199752808, -0.0007605254650115967, -0.0007200390100479126, -0.0006795525550842285, -0.0006390661001205444, -0.0005985796451568604, -0.0005580931901931763, -0.0005176067352294922, -0.0004771202802658081, -0.000436633825302124, -0.00039614737033843994, -0.00035566091537475586, -0.0003151744604110718, -0.0002746880054473877, -0.0002342015504837036, -0.00019371509552001953, -0.00015322864055633545, -0.00011274218559265137, -7.225573062896729e-05, -3.17692756652832e-05, 8.717179298400879e-06, 4.920363426208496e-05, 8.969008922576904e-05, 0.00013017654418945312, 0.0001706629991531372, 0.0002111494541168213, 0.00025163590908050537, 0.00029212236404418945, 0.00033260881900787354, 0.0003730952739715576, 0.0004135817289352417, 0.0004540681838989258, 0.0004945546388626099, 0.0005350410938262939, 0.000575527548789978, 0.0006160140037536621, 0.0006565004587173462, 0.0006969869136810303, 0.0007374733686447144, 0.0007779598236083984, 0.0008184462785720825, 0.0008589327335357666, 0.0008994191884994507, 0.0009399056434631348, 0.0009803920984268188, 0.001020878553390503, 0.001061365008354187, 0.001101851463317871, 0.0011423379182815552, 0.0011828243732452393, 0.0012233108282089233, 0.0012637972831726074, 0.0013042837381362915, 0.0013447701930999756, 0.0013852566480636597, 0.0014257431030273438]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 14.0, 16.0, 27.0, 38.0, 66.0, 112.0, 173.0, 312.0, 480.0, 904.0, 1668.0, 2903.0, 5780.0, 11264.0, 22708.0, 45325.0, 85753.0, 140835.0, 187699.0, 192769.0, 150685.0, 95055.0, 51478.0, 25789.0, 12674.0, 6450.0, 3370.0, 1800.0, 984.0, 571.0, 352.0, 200.0, 109.0, 72.0, 42.0, 26.0, 21.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4921875, -13.9940185546875, -13.495849609375, -12.9976806640625, -12.49951171875, -12.0013427734375, -11.503173828125, -11.0050048828125, -10.5068359375, -10.0086669921875, -9.510498046875, -9.0123291015625, -8.51416015625, -8.0159912109375, -7.517822265625, -7.0196533203125, -6.521484375, -6.0233154296875, -5.525146484375, -5.0269775390625, -4.52880859375, -4.0306396484375, -3.532470703125, -3.0343017578125, -2.5361328125, -2.0379638671875, -1.539794921875, -1.0416259765625, -0.54345703125, -0.0452880859375, 0.452880859375, 0.9510498046875, 1.44921875, 1.9473876953125, 2.445556640625, 2.9437255859375, 3.44189453125, 3.9400634765625, 4.438232421875, 4.9364013671875, 5.4345703125, 5.9327392578125, 6.430908203125, 6.9290771484375, 7.42724609375, 7.9254150390625, 8.423583984375, 8.9217529296875, 9.419921875, 9.9180908203125, 10.416259765625, 10.9144287109375, 11.41259765625, 11.9107666015625, 12.408935546875, 12.9071044921875, 13.4052734375, 13.9034423828125, 14.401611328125, 14.8997802734375, 15.39794921875, 15.8961181640625, 16.394287109375, 16.8924560546875, 17.390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 14.0, 26.0, 30.0, 40.0, 50.0, 64.0, 50.0, 53.0, 68.0, 62.0, 57.0, 53.0, 58.0, 60.0, 54.0, 47.0, 37.0, 33.0, 24.0, 17.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.38006591796875, -7.1624755859375, -6.94488525390625, -6.727294921875, -6.50970458984375, -6.2921142578125, -6.07452392578125, -5.85693359375, -5.63934326171875, -5.4217529296875, -5.20416259765625, -4.986572265625, -4.76898193359375, -4.5513916015625, -4.33380126953125, -4.1162109375, -3.89862060546875, -3.6810302734375, -3.46343994140625, -3.245849609375, -3.02825927734375, -2.8106689453125, -2.59307861328125, -2.37548828125, -2.15789794921875, -1.9403076171875, -1.72271728515625, -1.505126953125, -1.28753662109375, -1.0699462890625, -0.85235595703125, -0.634765625, -0.41717529296875, -0.1995849609375, 0.01800537109375, 0.235595703125, 0.45318603515625, 0.6707763671875, 0.88836669921875, 1.10595703125, 1.32354736328125, 1.5411376953125, 1.75872802734375, 1.976318359375, 2.19390869140625, 2.4114990234375, 2.62908935546875, 2.8466796875, 3.06427001953125, 3.2818603515625, 3.49945068359375, 3.717041015625, 3.93463134765625, 4.1522216796875, 4.36981201171875, 4.58740234375, 4.80499267578125, 5.0225830078125, 5.24017333984375, 5.457763671875, 5.67535400390625, 5.8929443359375, 6.11053466796875, 6.328125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 3.0, 11.0, 11.0, 10.0, 28.0, 10.0, 23.0, 23.0, 28.0, 33.0, 41.0, 33.0, 44.0, 45.0, 46.0, 26.0, 46.0, 56.0, 50.0, 37.0, 55.0, 32.0, 36.0, 37.0, 40.0, 34.0, 27.0, 21.0, 17.0, 20.0, 13.0, 14.0, 8.0, 11.0, 6.0, 6.0, 3.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.083648681640625, -32.109161376953125, -31.134672164916992, -30.160184860229492, -29.18569564819336, -28.21120834350586, -27.236719131469727, -26.262231826782227, -25.287742614746094, -24.313255310058594, -23.33876609802246, -22.36427879333496, -21.389789581298828, -20.415302276611328, -19.440813064575195, -18.466325759887695, -17.491836547851562, -16.517349243164062, -15.54286003112793, -14.568371772766113, -13.593883514404297, -12.619396209716797, -11.644906997680664, -10.670419692993164, -9.695932388305664, -8.721444129943848, -7.746955871582031, -6.772467613220215, -5.797979354858398, -4.82349157333374, -3.849003314971924, -2.8745150566101074, -1.9000263214111328, -0.9255381226539612, 0.04895007610321045, 1.0234382152557373, 1.9979264736175537, 2.972414493560791, 3.9469027519226074, 4.921391010284424, 5.89587926864624, 6.870367527008057, 7.844855785369873, 8.819343566894531, 9.793831825256348, 10.768320083618164, 11.74280834197998, 12.717296600341797, 13.691784858703613, 14.66627311706543, 15.640761375427246, 16.615249633789062, 17.589736938476562, 18.564226150512695, 19.538713455200195, 20.513202667236328, 21.487689971923828, 22.462177276611328, 23.43666648864746, 24.41115379333496, 25.385643005371094, 26.360130310058594, 27.334619522094727, 28.309106826782227, 29.28359603881836]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 10.0, 12.0, 9.0, 7.0, 15.0, 13.0, 13.0, 26.0, 25.0, 23.0, 30.0, 49.0, 39.0, 35.0, 31.0, 31.0, 40.0, 43.0, 44.0, 32.0, 40.0, 44.0, 34.0, 28.0, 32.0, 41.0, 38.0, 39.0, 24.0, 31.0, 17.0, 16.0, 15.0, 10.0, 12.0, 5.0, 8.0, 8.0, 5.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.82529830932617, -35.695011138916016, -34.564727783203125, -33.43444061279297, -32.30415344238281, -31.173870086669922, -30.043582916259766, -28.913297653198242, -27.78301239013672, -26.652727127075195, -25.522441864013672, -24.392154693603516, -23.261869430541992, -22.13158416748047, -21.001296997070312, -19.87101173400879, -18.740726470947266, -17.610441207885742, -16.48015594482422, -15.349868774414062, -14.219583511352539, -13.089298248291016, -11.959012031555176, -10.828725814819336, -9.698440551757812, -8.568155288696289, -7.437869071960449, -6.307583332061768, -5.177297592163086, -4.047011852264404, -2.9167261123657227, -1.786440372467041, -0.6561546325683594, 0.47413110733032227, 1.604416847229004, 2.7347025871276855, 3.864988327026367, 4.995274066925049, 6.1255598068237305, 7.255845546722412, 8.386131286621094, 9.516416549682617, 10.646702766418457, 11.776988983154297, 12.90727424621582, 14.037559509277344, 15.167845726013184, 16.298131942749023, 17.428417205810547, 18.55870246887207, 19.688987731933594, 20.81927490234375, 21.949560165405273, 23.079845428466797, 24.210132598876953, 25.340417861938477, 26.470703125, 27.600988388061523, 28.731273651123047, 29.861560821533203, 30.991846084594727, 32.12213134765625, 33.252418518066406, 34.3827018737793, 35.51298904418945]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 8.0, 5.0, 12.0, 16.0, 22.0, 36.0, 43.0, 107.0, 172.0, 355.0, 612.0, 1062.0, 1757.0, 3091.0, 5539.0, 9377.0, 16494.0, 28035.0, 47841.0, 78189.0, 124351.0, 190645.0, 275610.0, 371133.0, 455695.0, 506640.0, 504622.0, 450610.0, 364149.0, 269062.0, 185320.0, 120468.0, 75379.0, 45134.0, 26889.0, 15575.0, 8916.0, 4951.0, 2829.0, 1573.0, 820.0, 509.0, 296.0, 132.0, 84.0, 65.0, 30.0, 22.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.466552734375, -20.69873046875, -19.930908203125, -19.1630859375, -18.395263671875, -17.62744140625, -16.859619140625, -16.091796875, -15.323974609375, -14.55615234375, -13.788330078125, -13.0205078125, -12.252685546875, -11.48486328125, -10.717041015625, -9.94921875, -9.181396484375, -8.41357421875, -7.645751953125, -6.8779296875, -6.110107421875, -5.34228515625, -4.574462890625, -3.806640625, -3.038818359375, -2.27099609375, -1.503173828125, -0.7353515625, 0.032470703125, 0.80029296875, 1.568115234375, 2.3359375, 3.103759765625, 3.87158203125, 4.639404296875, 5.4072265625, 6.175048828125, 6.94287109375, 7.710693359375, 8.478515625, 9.246337890625, 10.01416015625, 10.781982421875, 11.5498046875, 12.317626953125, 13.08544921875, 13.853271484375, 14.62109375, 15.388916015625, 16.15673828125, 16.924560546875, 17.6923828125, 18.460205078125, 19.22802734375, 19.995849609375, 20.763671875, 21.531494140625, 22.29931640625, 23.067138671875, 23.8349609375, 24.602783203125, 25.37060546875, 26.138427734375, 26.90625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 12.0, 11.0, 9.0, 14.0, 15.0, 18.0, 18.0, 28.0, 18.0, 34.0, 46.0, 38.0, 38.0, 31.0, 31.0, 46.0, 36.0, 47.0, 37.0, 37.0, 30.0, 41.0, 31.0, 40.0, 29.0, 45.0, 32.0, 36.0, 21.0, 14.0, 19.0, 14.0, 17.0, 6.0, 7.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.34375, -30.385009765625, -29.42626953125, -28.467529296875, -27.5087890625, -26.550048828125, -25.59130859375, -24.632568359375, -23.673828125, -22.715087890625, -21.75634765625, -20.797607421875, -19.8388671875, -18.880126953125, -17.92138671875, -16.962646484375, -16.00390625, -15.045166015625, -14.08642578125, -13.127685546875, -12.1689453125, -11.210205078125, -10.25146484375, -9.292724609375, -8.333984375, -7.375244140625, -6.41650390625, -5.457763671875, -4.4990234375, -3.540283203125, -2.58154296875, -1.622802734375, -0.6640625, 0.294677734375, 1.25341796875, 2.212158203125, 3.1708984375, 4.129638671875, 5.08837890625, 6.047119140625, 7.005859375, 7.964599609375, 8.92333984375, 9.882080078125, 10.8408203125, 11.799560546875, 12.75830078125, 13.717041015625, 14.67578125, 15.634521484375, 16.59326171875, 17.552001953125, 18.5107421875, 19.469482421875, 20.42822265625, 21.386962890625, 22.345703125, 23.304443359375, 24.26318359375, 25.221923828125, 26.1806640625, 27.139404296875, 28.09814453125, 29.056884765625, 30.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [4.0, 5.0, 9.0, 13.0, 37.0, 33.0, 80.0, 154.0, 279.0, 482.0, 731.0, 1324.0, 2271.0, 3698.0, 6199.0, 10062.0, 16244.0, 25517.0, 39172.0, 58853.0, 85721.0, 120739.0, 163878.0, 212740.0, 266808.0, 314424.0, 354816.0, 375865.0, 379042.0, 359747.0, 323099.0, 274926.0, 224171.0, 173185.0, 128319.0, 91366.0, 63554.0, 42844.0, 27811.0, 17636.0, 11336.0, 6895.0, 4205.0, 2553.0, 1430.0, 878.0, 489.0, 278.0, 162.0, 88.0, 52.0, 33.0, 16.0, 12.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.81689453125, -16.1962890625, -15.57568359375, -14.955078125, -14.33447265625, -13.7138671875, -13.09326171875, -12.47265625, -11.85205078125, -11.2314453125, -10.61083984375, -9.990234375, -9.36962890625, -8.7490234375, -8.12841796875, -7.5078125, -6.88720703125, -6.2666015625, -5.64599609375, -5.025390625, -4.40478515625, -3.7841796875, -3.16357421875, -2.54296875, -1.92236328125, -1.3017578125, -0.68115234375, -0.060546875, 0.56005859375, 1.1806640625, 1.80126953125, 2.421875, 3.04248046875, 3.6630859375, 4.28369140625, 4.904296875, 5.52490234375, 6.1455078125, 6.76611328125, 7.38671875, 8.00732421875, 8.6279296875, 9.24853515625, 9.869140625, 10.48974609375, 11.1103515625, 11.73095703125, 12.3515625, 12.97216796875, 13.5927734375, 14.21337890625, 14.833984375, 15.45458984375, 16.0751953125, 16.69580078125, 17.31640625, 17.93701171875, 18.5576171875, 19.17822265625, 19.798828125, 20.41943359375, 21.0400390625, 21.66064453125, 22.28125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 17.0, 22.0, 24.0, 50.0, 38.0, 51.0, 81.0, 61.0, 94.0, 117.0, 119.0, 137.0, 151.0, 195.0, 191.0, 183.0, 208.0, 208.0, 219.0, 210.0, 187.0, 181.0, 186.0, 186.0, 154.0, 144.0, 123.0, 88.0, 100.0, 63.0, 61.0, 39.0, 34.0, 28.0, 24.0, 24.0, 16.0, 4.0, 12.0, 10.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.52099609375, -11.0966796875, -10.67236328125, -10.248046875, -9.82373046875, -9.3994140625, -8.97509765625, -8.55078125, -8.12646484375, -7.7021484375, -7.27783203125, -6.853515625, -6.42919921875, -6.0048828125, -5.58056640625, -5.15625, -4.73193359375, -4.3076171875, -3.88330078125, -3.458984375, -3.03466796875, -2.6103515625, -2.18603515625, -1.76171875, -1.33740234375, -0.9130859375, -0.48876953125, -0.064453125, 0.35986328125, 0.7841796875, 1.20849609375, 1.6328125, 2.05712890625, 2.4814453125, 2.90576171875, 3.330078125, 3.75439453125, 4.1787109375, 4.60302734375, 5.02734375, 5.45166015625, 5.8759765625, 6.30029296875, 6.724609375, 7.14892578125, 7.5732421875, 7.99755859375, 8.421875, 8.84619140625, 9.2705078125, 9.69482421875, 10.119140625, 10.54345703125, 10.9677734375, 11.39208984375, 11.81640625, 12.24072265625, 12.6650390625, 13.08935546875, 13.513671875, 13.93798828125, 14.3623046875, 14.78662109375, 15.2109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 3.0, 14.0, 4.0, 17.0, 17.0, 16.0, 21.0, 21.0, 19.0, 34.0, 35.0, 48.0, 33.0, 38.0, 40.0, 35.0, 37.0, 42.0, 47.0, 45.0, 40.0, 37.0, 31.0, 33.0, 43.0, 32.0, 33.0, 26.0, 27.0, 18.0, 23.0, 14.0, 14.0, 13.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.96746826171875, -27.012842178344727, -26.058218002319336, -25.103591918945312, -24.148967742919922, -23.1943416595459, -22.239717483520508, -21.285091400146484, -20.330467224121094, -19.37584114074707, -18.42121696472168, -17.466590881347656, -16.511966705322266, -15.557340621948242, -14.602716445922852, -13.648090362548828, -12.693465232849121, -11.738840103149414, -10.784214973449707, -9.82958984375, -8.874964714050293, -7.920339107513428, -6.965713977813721, -6.011088848114014, -5.056463718414307, -4.1018385887146, -3.1472134590148926, -2.1925880908966064, -1.2379629611968994, -0.2833375930786133, 0.6712875366210938, 1.6259126663208008, 2.580537796020508, 3.535162925720215, 4.489788055419922, 5.444413185119629, 6.399038314819336, 7.353663921356201, 8.30828857421875, 9.262914657592773, 10.217538833618164, 11.172163963317871, 12.126789093017578, 13.081414222717285, 14.036039352416992, 14.990665435791016, 15.945289611816406, 16.89991569519043, 17.854541778564453, 18.809167861938477, 19.763792037963867, 20.71841812133789, 21.67304229736328, 22.627668380737305, 23.582292556762695, 24.53691864013672, 25.49154281616211, 26.446168899536133, 27.400793075561523, 28.355419158935547, 29.310043334960938, 30.26466941833496, 31.21929359436035, 32.173919677734375, 33.128543853759766]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 14.0, 7.0, 20.0, 19.0, 13.0, 19.0, 23.0, 23.0, 26.0, 26.0, 37.0, 38.0, 40.0, 43.0, 43.0, 45.0, 43.0, 42.0, 33.0, 34.0, 32.0, 32.0, 43.0, 40.0, 33.0, 41.0, 25.0, 25.0, 20.0, 18.0, 12.0, 19.0, 7.0, 8.0, 5.0, 6.0, 9.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.99674606323242, -36.858551025390625, -35.72035598754883, -34.58216094970703, -33.443965911865234, -32.30577087402344, -31.16757583618164, -30.029380798339844, -28.891185760498047, -27.75299072265625, -26.614795684814453, -25.476600646972656, -24.33840560913086, -23.200210571289062, -22.062015533447266, -20.92382049560547, -19.785627365112305, -18.647432327270508, -17.50923728942871, -16.371042251586914, -15.232847213745117, -14.09465217590332, -12.95645809173584, -11.818263053894043, -10.680068016052246, -9.54187297821045, -8.403677940368652, -7.265483379364014, -6.127288341522217, -4.98909330368042, -3.8508987426757812, -2.7127037048339844, -1.5745086669921875, -0.4363137483596802, 0.7018811702728271, 1.840075969696045, 2.978271007537842, 4.116466045379639, 5.254660606384277, 6.392855644226074, 7.531050682067871, 8.669245719909668, 9.807440757751465, 10.945634841918945, 12.083829879760742, 13.222024917602539, 14.360219955444336, 15.498414993286133, 16.63661003112793, 17.774805068969727, 18.913000106811523, 20.05119514465332, 21.189390182495117, 22.327585220336914, 23.465778350830078, 24.603973388671875, 25.742168426513672, 26.88036346435547, 28.018558502197266, 29.156753540039062, 30.29494857788086, 31.433143615722656, 32.57133865356445, 33.70953369140625, 34.84772872924805]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 8.0, 6.0, 12.0, 26.0, 39.0, 50.0, 82.0, 125.0, 218.0, 338.0, 521.0, 859.0, 1345.0, 2173.0, 3668.0, 6016.0, 10159.0, 17201.0, 28650.0, 49011.0, 80373.0, 127891.0, 178169.0, 184597.0, 137051.0, 88002.0, 53504.0, 31725.0, 18555.0, 10991.0, 6662.0, 4056.0, 2441.0, 1540.0, 939.0, 582.0, 381.0, 225.0, 142.0, 83.0, 71.0, 27.0, 19.0, 10.0, 7.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.4453125, -12.1004638671875, -11.755615234375, -11.4107666015625, -11.06591796875, -10.7210693359375, -10.376220703125, -10.0313720703125, -9.6865234375, -9.3416748046875, -8.996826171875, -8.6519775390625, -8.30712890625, -7.9622802734375, -7.617431640625, -7.2725830078125, -6.927734375, -6.5828857421875, -6.238037109375, -5.8931884765625, -5.54833984375, -5.2034912109375, -4.858642578125, -4.5137939453125, -4.1689453125, -3.8240966796875, -3.479248046875, -3.1343994140625, -2.78955078125, -2.4447021484375, -2.099853515625, -1.7550048828125, -1.41015625, -1.0653076171875, -0.720458984375, -0.3756103515625, -0.03076171875, 0.3140869140625, 0.658935546875, 1.0037841796875, 1.3486328125, 1.6934814453125, 2.038330078125, 2.3831787109375, 2.72802734375, 3.0728759765625, 3.417724609375, 3.7625732421875, 4.107421875, 4.4522705078125, 4.797119140625, 5.1419677734375, 5.48681640625, 5.8316650390625, 6.176513671875, 6.5213623046875, 6.8662109375, 7.2110595703125, 7.555908203125, 7.9007568359375, 8.24560546875, 8.5904541015625, 8.935302734375, 9.2801513671875, 9.625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 18.0, 19.0, 12.0, 19.0, 23.0, 24.0, 26.0, 27.0, 37.0, 38.0, 44.0, 38.0, 43.0, 46.0, 45.0, 39.0, 33.0, 33.0, 33.0, 35.0, 41.0, 40.0, 31.0, 42.0, 25.0, 24.0, 20.0, 20.0, 14.0, 15.0, 6.0, 9.0, 5.0, 6.0, 9.0, 5.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.71875, -36.5830078125, -35.447265625, -34.3115234375, -33.17578125, -32.0400390625, -30.904296875, -29.7685546875, -28.6328125, -27.4970703125, -26.361328125, -25.2255859375, -24.08984375, -22.9541015625, -21.818359375, -20.6826171875, -19.546875, -18.4111328125, -17.275390625, -16.1396484375, -15.00390625, -13.8681640625, -12.732421875, -11.5966796875, -10.4609375, -9.3251953125, -8.189453125, -7.0537109375, -5.91796875, -4.7822265625, -3.646484375, -2.5107421875, -1.375, -0.2392578125, 0.896484375, 2.0322265625, 3.16796875, 4.3037109375, 5.439453125, 6.5751953125, 7.7109375, 8.8466796875, 9.982421875, 11.1181640625, 12.25390625, 13.3896484375, 14.525390625, 15.6611328125, 16.796875, 17.9326171875, 19.068359375, 20.2041015625, 21.33984375, 22.4755859375, 23.611328125, 24.7470703125, 25.8828125, 27.0185546875, 28.154296875, 29.2900390625, 30.42578125, 31.5615234375, 32.697265625, 33.8330078125, 34.96875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 10.0, 10.0, 13.0, 24.0, 24.0, 55.0, 55.0, 79.0, 155.0, 202.0, 270.0, 402.0, 608.0, 916.0, 1355.0, 2095.0, 3314.0, 5433.0, 9402.0, 17747.0, 37571.0, 93795.0, 260952.0, 356733.0, 147267.0, 55339.0, 24336.0, 12281.0, 6751.0, 3952.0, 2457.0, 1585.0, 1094.0, 712.0, 489.0, 356.0, 219.0, 148.0, 105.0, 77.0, 56.0, 30.0, 25.0, 13.0, 12.0, 18.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.36865234375, -12.9404296875, -12.51220703125, -12.083984375, -11.65576171875, -11.2275390625, -10.79931640625, -10.37109375, -9.94287109375, -9.5146484375, -9.08642578125, -8.658203125, -8.22998046875, -7.8017578125, -7.37353515625, -6.9453125, -6.51708984375, -6.0888671875, -5.66064453125, -5.232421875, -4.80419921875, -4.3759765625, -3.94775390625, -3.51953125, -3.09130859375, -2.6630859375, -2.23486328125, -1.806640625, -1.37841796875, -0.9501953125, -0.52197265625, -0.09375, 0.33447265625, 0.7626953125, 1.19091796875, 1.619140625, 2.04736328125, 2.4755859375, 2.90380859375, 3.33203125, 3.76025390625, 4.1884765625, 4.61669921875, 5.044921875, 5.47314453125, 5.9013671875, 6.32958984375, 6.7578125, 7.18603515625, 7.6142578125, 8.04248046875, 8.470703125, 8.89892578125, 9.3271484375, 9.75537109375, 10.18359375, 10.61181640625, 11.0400390625, 11.46826171875, 11.896484375, 12.32470703125, 12.7529296875, 13.18115234375, 13.609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 11.0, 17.0, 17.0, 17.0, 21.0, 15.0, 19.0, 32.0, 33.0, 27.0, 17.0, 55.0, 35.0, 46.0, 54.0, 43.0, 45.0, 54.0, 44.0, 31.0, 43.0, 59.0, 40.0, 28.0, 26.0, 31.0, 26.0, 18.0, 10.0, 16.0, 11.0, 8.0, 12.0, 9.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.8125, -28.83056640625, -27.8486328125, -26.86669921875, -25.884765625, -24.90283203125, -23.9208984375, -22.93896484375, -21.95703125, -20.97509765625, -19.9931640625, -19.01123046875, -18.029296875, -17.04736328125, -16.0654296875, -15.08349609375, -14.1015625, -13.11962890625, -12.1376953125, -11.15576171875, -10.173828125, -9.19189453125, -8.2099609375, -7.22802734375, -6.24609375, -5.26416015625, -4.2822265625, -3.30029296875, -2.318359375, -1.33642578125, -0.3544921875, 0.62744140625, 1.609375, 2.59130859375, 3.5732421875, 4.55517578125, 5.537109375, 6.51904296875, 7.5009765625, 8.48291015625, 9.46484375, 10.44677734375, 11.4287109375, 12.41064453125, 13.392578125, 14.37451171875, 15.3564453125, 16.33837890625, 17.3203125, 18.30224609375, 19.2841796875, 20.26611328125, 21.248046875, 22.22998046875, 23.2119140625, 24.19384765625, 25.17578125, 26.15771484375, 27.1396484375, 28.12158203125, 29.103515625, 30.08544921875, 31.0673828125, 32.04931640625, 33.03125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 11.0, 7.0, 12.0, 14.0, 29.0, 29.0, 44.0, 54.0, 67.0, 116.0, 172.0, 218.0, 354.0, 518.0, 889.0, 1415.0, 2447.0, 4769.0, 9889.0, 24461.0, 82446.0, 525674.0, 304192.0, 54565.0, 18298.0, 7878.0, 3973.0, 2210.0, 1344.0, 758.0, 504.0, 351.0, 241.0, 156.0, 119.0, 91.0, 53.0, 47.0, 35.0, 32.0, 21.0, 14.0, 9.0, 6.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.0828857421875, -13.611083984375, -13.1392822265625, -12.66748046875, -12.1956787109375, -11.723876953125, -11.2520751953125, -10.7802734375, -10.3084716796875, -9.836669921875, -9.3648681640625, -8.89306640625, -8.4212646484375, -7.949462890625, -7.4776611328125, -7.005859375, -6.5340576171875, -6.062255859375, -5.5904541015625, -5.11865234375, -4.6468505859375, -4.175048828125, -3.7032470703125, -3.2314453125, -2.7596435546875, -2.287841796875, -1.8160400390625, -1.34423828125, -0.8724365234375, -0.400634765625, 0.0711669921875, 0.54296875, 1.0147705078125, 1.486572265625, 1.9583740234375, 2.43017578125, 2.9019775390625, 3.373779296875, 3.8455810546875, 4.3173828125, 4.7891845703125, 5.260986328125, 5.7327880859375, 6.20458984375, 6.6763916015625, 7.148193359375, 7.6199951171875, 8.091796875, 8.5635986328125, 9.035400390625, 9.5072021484375, 9.97900390625, 10.4508056640625, 10.922607421875, 11.3944091796875, 11.8662109375, 12.3380126953125, 12.809814453125, 13.2816162109375, 13.75341796875, 14.2252197265625, 14.697021484375, 15.1688232421875, 15.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 7.0, 9.0, 9.0, 10.0, 18.0, 27.0, 27.0, 25.0, 36.0, 42.0, 58.0, 55.0, 78.0, 85.0, 70.0, 78.0, 67.0, 57.0, 44.0, 40.0, 24.0, 28.0, 18.0, 17.0, 12.0, 12.0, 3.0, 9.0, 2.0, 4.0, 8.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007748603820800781, -0.0007491409778594971, -0.000723421573638916, -0.000697702169418335, -0.0006719827651977539, -0.0006462633609771729, -0.0006205439567565918, -0.0005948245525360107, -0.0005691051483154297, -0.0005433857440948486, -0.0005176663398742676, -0.0004919469356536865, -0.00046622753143310547, -0.0004405081272125244, -0.00041478872299194336, -0.0003890693187713623, -0.00036334991455078125, -0.0003376305103302002, -0.00031191110610961914, -0.0002861917018890381, -0.00026047229766845703, -0.00023475289344787598, -0.00020903348922729492, -0.00018331408500671387, -0.0001575946807861328, -0.00013187527656555176, -0.0001061558723449707, -8.043646812438965e-05, -5.4717063903808594e-05, -2.899765968322754e-05, -3.2782554626464844e-06, 2.244114875793457e-05, 4.8160552978515625e-05, 7.387995719909668e-05, 9.959936141967773e-05, 0.0001253187656402588, 0.00015103816986083984, 0.0001767575740814209, 0.00020247697830200195, 0.000228196382522583, 0.00025391578674316406, 0.0002796351909637451, 0.00030535459518432617, 0.0003310739994049072, 0.0003567934036254883, 0.00038251280784606934, 0.0004082322120666504, 0.00043395161628723145, 0.0004596710205078125, 0.00048539042472839355, 0.0005111098289489746, 0.0005368292331695557, 0.0005625486373901367, 0.0005882680416107178, 0.0006139874458312988, 0.0006397068500518799, 0.0006654262542724609, 0.000691145658493042, 0.000716865062713623, 0.0007425844669342041, 0.0007683038711547852, 0.0007940232753753662, 0.0008197426795959473, 0.0008454620838165283, 0.0008711814880371094]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 13.0, 21.0, 30.0, 32.0, 52.0, 78.0, 114.0, 160.0, 240.0, 442.0, 672.0, 1086.0, 1753.0, 2801.0, 4976.0, 8596.0, 15882.0, 31029.0, 63160.0, 136204.0, 263089.0, 258200.0, 132286.0, 61273.0, 30226.0, 15510.0, 8464.0, 4799.0, 2767.0, 1702.0, 1023.0, 640.0, 441.0, 235.0, 205.0, 112.0, 75.0, 57.0, 27.0, 24.0, 17.0, 15.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6484375, -10.3255615234375, -10.002685546875, -9.6798095703125, -9.35693359375, -9.0340576171875, -8.711181640625, -8.3883056640625, -8.0654296875, -7.7425537109375, -7.419677734375, -7.0968017578125, -6.77392578125, -6.4510498046875, -6.128173828125, -5.8052978515625, -5.482421875, -5.1595458984375, -4.836669921875, -4.5137939453125, -4.19091796875, -3.8680419921875, -3.545166015625, -3.2222900390625, -2.8994140625, -2.5765380859375, -2.253662109375, -1.9307861328125, -1.60791015625, -1.2850341796875, -0.962158203125, -0.6392822265625, -0.31640625, 0.0064697265625, 0.329345703125, 0.6522216796875, 0.97509765625, 1.2979736328125, 1.620849609375, 1.9437255859375, 2.2666015625, 2.5894775390625, 2.912353515625, 3.2352294921875, 3.55810546875, 3.8809814453125, 4.203857421875, 4.5267333984375, 4.849609375, 5.1724853515625, 5.495361328125, 5.8182373046875, 6.14111328125, 6.4639892578125, 6.786865234375, 7.1097412109375, 7.4326171875, 7.7554931640625, 8.078369140625, 8.4012451171875, 8.72412109375, 9.0469970703125, 9.369873046875, 9.6927490234375, 10.015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 9.0, 15.0, 12.0, 17.0, 25.0, 25.0, 28.0, 48.0, 44.0, 52.0, 64.0, 70.0, 66.0, 69.0, 65.0, 73.0, 44.0, 25.0, 27.0, 26.0, 38.0, 22.0, 15.0, 5.0, 9.0, 11.0, 8.0, 9.0, 10.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.35546875, -5.1971435546875, -5.038818359375, -4.8804931640625, -4.72216796875, -4.5638427734375, -4.405517578125, -4.2471923828125, -4.0888671875, -3.9305419921875, -3.772216796875, -3.6138916015625, -3.45556640625, -3.2972412109375, -3.138916015625, -2.9805908203125, -2.822265625, -2.6639404296875, -2.505615234375, -2.3472900390625, -2.18896484375, -2.0306396484375, -1.872314453125, -1.7139892578125, -1.5556640625, -1.3973388671875, -1.239013671875, -1.0806884765625, -0.92236328125, -0.7640380859375, -0.605712890625, -0.4473876953125, -0.2890625, -0.1307373046875, 0.027587890625, 0.1859130859375, 0.34423828125, 0.5025634765625, 0.660888671875, 0.8192138671875, 0.9775390625, 1.1358642578125, 1.294189453125, 1.4525146484375, 1.61083984375, 1.7691650390625, 1.927490234375, 2.0858154296875, 2.244140625, 2.4024658203125, 2.560791015625, 2.7191162109375, 2.87744140625, 3.0357666015625, 3.194091796875, 3.3524169921875, 3.5107421875, 3.6690673828125, 3.827392578125, 3.9857177734375, 4.14404296875, 4.3023681640625, 4.460693359375, 4.6190185546875, 4.77734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 12.0, 5.0, 5.0, 9.0, 10.0, 14.0, 22.0, 20.0, 16.0, 16.0, 39.0, 25.0, 34.0, 38.0, 39.0, 42.0, 36.0, 39.0, 36.0, 41.0, 40.0, 46.0, 43.0, 35.0, 27.0, 34.0, 29.0, 39.0, 36.0, 31.0, 19.0, 26.0, 12.0, 19.0, 15.0, 9.0, 12.0, 7.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.130355834960938, -26.19639015197754, -25.262422561645508, -24.32845687866211, -23.394489288330078, -22.46052360534668, -21.52655601501465, -20.59259033203125, -19.65862274169922, -18.72465705871582, -17.79068946838379, -16.85672378540039, -15.92275619506836, -14.988790512084961, -14.05482292175293, -13.120857238769531, -12.186890602111816, -11.252923965454102, -10.318957328796387, -9.384990692138672, -8.451024055480957, -7.5170578956604, -6.5830912590026855, -5.649124622344971, -4.715157985687256, -3.781191349029541, -2.847224712371826, -1.9132583141326904, -0.9792916774749756, -0.045325279235839844, 0.888641357421875, 1.8226079940795898, 2.7565746307373047, 3.6905412673950195, 4.624507904052734, 5.558474540710449, 6.492441177368164, 7.426407337188721, 8.360374450683594, 9.294340133666992, 10.228307723999023, 11.162274360656738, 12.096240997314453, 13.030207633972168, 13.964174270629883, 14.898139953613281, 15.832107543945312, 16.76607322692871, 17.70003890991211, 18.634004592895508, 19.56797218322754, 20.501937866210938, 21.43590545654297, 22.369871139526367, 23.3038387298584, 24.237804412841797, 25.171772003173828, 26.105737686157227, 27.039705276489258, 27.973670959472656, 28.907638549804688, 29.841604232788086, 30.775571823120117, 31.709537506103516, 32.64350509643555]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 13.0, 8.0, 18.0, 21.0, 17.0, 19.0, 16.0, 24.0, 22.0, 31.0, 35.0, 43.0, 42.0, 33.0, 52.0, 45.0, 41.0, 35.0, 39.0, 36.0, 35.0, 33.0, 41.0, 34.0, 36.0, 34.0, 25.0, 25.0, 20.0, 17.0, 24.0, 11.0, 8.0, 12.0, 4.0, 5.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.621097564697266, -36.49016189575195, -35.359222412109375, -34.22828674316406, -33.097347259521484, -31.966411590576172, -30.835474014282227, -29.70453643798828, -28.573598861694336, -27.44266128540039, -26.311723709106445, -25.1807861328125, -24.049850463867188, -22.91891098022461, -21.787975311279297, -20.65703773498535, -19.526100158691406, -18.39516258239746, -17.264225006103516, -16.13328742980957, -15.002350807189941, -13.871413230895996, -12.740476608276367, -11.609539031982422, -10.478601455688477, -9.347663879394531, -8.216726303100586, -7.085789680480957, -5.954852104187012, -4.823914527893066, -3.6929774284362793, -2.562040328979492, -1.4310989379882812, -0.30016160011291504, 0.8307757377624512, 1.9617130756378174, 3.0926504135131836, 4.223587989807129, 5.354525089263916, 6.485462188720703, 7.616399765014648, 8.747337341308594, 9.878274917602539, 11.009211540222168, 12.140149116516113, 13.271086692810059, 14.402023315429688, 15.532960891723633, 16.663898468017578, 17.794836044311523, 18.92577362060547, 20.056711196899414, 21.18764877319336, 22.318584442138672, 23.449522018432617, 24.580459594726562, 25.711397171020508, 26.842334747314453, 27.9732723236084, 29.104209899902344, 30.235145568847656, 31.366085052490234, 32.49702072143555, 33.627960205078125, 34.75889587402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 15.0, 45.0, 68.0, 104.0, 169.0, 282.0, 490.0, 766.0, 1211.0, 1967.0, 2961.0, 4677.0, 7216.0, 10561.0, 15787.0, 22565.0, 31629.0, 42777.0, 55448.0, 68776.0, 81891.0, 91611.0, 96003.0, 94813.0, 88911.0, 78452.0, 65461.0, 52493.0, 39785.0, 29020.0, 20952.0, 14106.0, 9667.0, 6571.0, 4179.0, 2573.0, 1740.0, 1074.0, 733.0, 411.0, 232.0, 163.0, 87.0, 42.0, 27.0, 20.0, 15.0, 2.0, 3.0, 0.0, 2.0], "bins": [-21.78125, -21.174072265625, -20.56689453125, -19.959716796875, -19.3525390625, -18.745361328125, -18.13818359375, -17.531005859375, -16.923828125, -16.316650390625, -15.70947265625, -15.102294921875, -14.4951171875, -13.887939453125, -13.28076171875, -12.673583984375, -12.06640625, -11.459228515625, -10.85205078125, -10.244873046875, -9.6376953125, -9.030517578125, -8.42333984375, -7.816162109375, -7.208984375, -6.601806640625, -5.99462890625, -5.387451171875, -4.7802734375, -4.173095703125, -3.56591796875, -2.958740234375, -2.3515625, -1.744384765625, -1.13720703125, -0.530029296875, 0.0771484375, 0.684326171875, 1.29150390625, 1.898681640625, 2.505859375, 3.113037109375, 3.72021484375, 4.327392578125, 4.9345703125, 5.541748046875, 6.14892578125, 6.756103515625, 7.36328125, 7.970458984375, 8.57763671875, 9.184814453125, 9.7919921875, 10.399169921875, 11.00634765625, 11.613525390625, 12.220703125, 12.827880859375, 13.43505859375, 14.042236328125, 14.6494140625, 15.256591796875, 15.86376953125, 16.470947265625, 17.078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 12.0, 7.0, 18.0, 20.0, 16.0, 20.0, 15.0, 24.0, 23.0, 32.0, 34.0, 34.0, 47.0, 33.0, 54.0, 45.0, 36.0, 42.0, 36.0, 36.0, 30.0, 38.0, 39.0, 36.0, 37.0, 33.0, 27.0, 28.0, 18.0, 18.0, 19.0, 14.0, 9.0, 11.0, 6.0, 5.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.625, -35.52783203125, -34.4306640625, -33.33349609375, -32.236328125, -31.13916015625, -30.0419921875, -28.94482421875, -27.84765625, -26.75048828125, -25.6533203125, -24.55615234375, -23.458984375, -22.36181640625, -21.2646484375, -20.16748046875, -19.0703125, -17.97314453125, -16.8759765625, -15.77880859375, -14.681640625, -13.58447265625, -12.4873046875, -11.39013671875, -10.29296875, -9.19580078125, -8.0986328125, -7.00146484375, -5.904296875, -4.80712890625, -3.7099609375, -2.61279296875, -1.515625, -0.41845703125, 0.6787109375, 1.77587890625, 2.873046875, 3.97021484375, 5.0673828125, 6.16455078125, 7.26171875, 8.35888671875, 9.4560546875, 10.55322265625, 11.650390625, 12.74755859375, 13.8447265625, 14.94189453125, 16.0390625, 17.13623046875, 18.2333984375, 19.33056640625, 20.427734375, 21.52490234375, 22.6220703125, 23.71923828125, 24.81640625, 25.91357421875, 27.0107421875, 28.10791015625, 29.205078125, 30.30224609375, 31.3994140625, 32.49658203125, 33.59375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 23.0, 23.0, 50.0, 75.0, 102.0, 218.0, 360.0, 537.0, 904.0, 1571.0, 2699.0, 4302.0, 7323.0, 11502.0, 18747.0, 28823.0, 42824.0, 60643.0, 81537.0, 100675.0, 114781.0, 119316.0, 112369.0, 97198.0, 76498.0, 56670.0, 38830.0, 26300.0, 16699.0, 10392.0, 6581.0, 3950.0, 2461.0, 1373.0, 834.0, 565.0, 278.0, 200.0, 112.0, 64.0, 51.0, 38.0, 17.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.46875, -25.676025390625, -24.88330078125, -24.090576171875, -23.2978515625, -22.505126953125, -21.71240234375, -20.919677734375, -20.126953125, -19.334228515625, -18.54150390625, -17.748779296875, -16.9560546875, -16.163330078125, -15.37060546875, -14.577880859375, -13.78515625, -12.992431640625, -12.19970703125, -11.406982421875, -10.6142578125, -9.821533203125, -9.02880859375, -8.236083984375, -7.443359375, -6.650634765625, -5.85791015625, -5.065185546875, -4.2724609375, -3.479736328125, -2.68701171875, -1.894287109375, -1.1015625, -0.308837890625, 0.48388671875, 1.276611328125, 2.0693359375, 2.862060546875, 3.65478515625, 4.447509765625, 5.240234375, 6.032958984375, 6.82568359375, 7.618408203125, 8.4111328125, 9.203857421875, 9.99658203125, 10.789306640625, 11.58203125, 12.374755859375, 13.16748046875, 13.960205078125, 14.7529296875, 15.545654296875, 16.33837890625, 17.131103515625, 17.923828125, 18.716552734375, 19.50927734375, 20.302001953125, 21.0947265625, 21.887451171875, 22.68017578125, 23.472900390625, 24.265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 8.0, 8.0, 13.0, 14.0, 26.0, 28.0, 24.0, 32.0, 23.0, 36.0, 33.0, 48.0, 36.0, 48.0, 50.0, 44.0, 37.0, 51.0, 50.0, 41.0, 36.0, 44.0, 30.0, 27.0, 32.0, 24.0, 22.0, 21.0, 28.0, 17.0, 10.0, 10.0, 10.0, 2.0, 4.0, 1.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.03125, -28.238525390625, -27.44580078125, -26.653076171875, -25.8603515625, -25.067626953125, -24.27490234375, -23.482177734375, -22.689453125, -21.896728515625, -21.10400390625, -20.311279296875, -19.5185546875, -18.725830078125, -17.93310546875, -17.140380859375, -16.34765625, -15.554931640625, -14.76220703125, -13.969482421875, -13.1767578125, -12.384033203125, -11.59130859375, -10.798583984375, -10.005859375, -9.213134765625, -8.42041015625, -7.627685546875, -6.8349609375, -6.042236328125, -5.24951171875, -4.456787109375, -3.6640625, -2.871337890625, -2.07861328125, -1.285888671875, -0.4931640625, 0.299560546875, 1.09228515625, 1.885009765625, 2.677734375, 3.470458984375, 4.26318359375, 5.055908203125, 5.8486328125, 6.641357421875, 7.43408203125, 8.226806640625, 9.01953125, 9.812255859375, 10.60498046875, 11.397705078125, 12.1904296875, 12.983154296875, 13.77587890625, 14.568603515625, 15.361328125, 16.154052734375, 16.94677734375, 17.739501953125, 18.5322265625, 19.324951171875, 20.11767578125, 20.910400390625, 21.703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 22.0, 13.0, 36.0, 44.0, 84.0, 109.0, 171.0, 244.0, 361.0, 515.0, 816.0, 1320.0, 2136.0, 3462.0, 5980.0, 10384.0, 18234.0, 33083.0, 58975.0, 96333.0, 141214.0, 171696.0, 167459.0, 130541.0, 86635.0, 50928.0, 28631.0, 16064.0, 9121.0, 5304.0, 3255.0, 1960.0, 1184.0, 755.0, 457.0, 336.0, 204.0, 143.0, 107.0, 57.0, 60.0, 36.0, 29.0, 13.0, 9.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.546875, -14.06005859375, -13.5732421875, -13.08642578125, -12.599609375, -12.11279296875, -11.6259765625, -11.13916015625, -10.65234375, -10.16552734375, -9.6787109375, -9.19189453125, -8.705078125, -8.21826171875, -7.7314453125, -7.24462890625, -6.7578125, -6.27099609375, -5.7841796875, -5.29736328125, -4.810546875, -4.32373046875, -3.8369140625, -3.35009765625, -2.86328125, -2.37646484375, -1.8896484375, -1.40283203125, -0.916015625, -0.42919921875, 0.0576171875, 0.54443359375, 1.03125, 1.51806640625, 2.0048828125, 2.49169921875, 2.978515625, 3.46533203125, 3.9521484375, 4.43896484375, 4.92578125, 5.41259765625, 5.8994140625, 6.38623046875, 6.873046875, 7.35986328125, 7.8466796875, 8.33349609375, 8.8203125, 9.30712890625, 9.7939453125, 10.28076171875, 10.767578125, 11.25439453125, 11.7412109375, 12.22802734375, 12.71484375, 13.20166015625, 13.6884765625, 14.17529296875, 14.662109375, 15.14892578125, 15.6357421875, 16.12255859375, 16.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 4.0, 6.0, 9.0, 10.0, 10.0, 9.0, 16.0, 24.0, 18.0, 16.0, 30.0, 21.0, 26.0, 45.0, 45.0, 50.0, 49.0, 45.0, 64.0, 60.0, 45.0, 48.0, 40.0, 25.0, 43.0, 34.0, 40.0, 32.0, 21.0, 19.0, 10.0, 11.0, 14.0, 12.0, 5.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0014524459838867188, -0.0014096498489379883, -0.0013668537139892578, -0.0013240575790405273, -0.0012812614440917969, -0.0012384653091430664, -0.001195669174194336, -0.0011528730392456055, -0.001110076904296875, -0.0010672807693481445, -0.001024484634399414, -0.0009816884994506836, -0.0009388923645019531, -0.0008960962295532227, -0.0008533000946044922, -0.0008105039596557617, -0.0007677078247070312, -0.0007249116897583008, -0.0006821155548095703, -0.0006393194198608398, -0.0005965232849121094, -0.0005537271499633789, -0.0005109310150146484, -0.00046813488006591797, -0.0004253387451171875, -0.00038254261016845703, -0.00033974647521972656, -0.0002969503402709961, -0.0002541542053222656, -0.00021135807037353516, -0.0001685619354248047, -0.00012576580047607422, -8.296966552734375e-05, -4.017353057861328e-05, 2.6226043701171875e-06, 4.5418739318847656e-05, 8.821487426757812e-05, 0.0001310110092163086, 0.00017380714416503906, 0.00021660327911376953, 0.0002593994140625, 0.00030219554901123047, 0.00034499168395996094, 0.0003877878189086914, 0.0004305839538574219, 0.00047338008880615234, 0.0005161762237548828, 0.0005589723587036133, 0.0006017684936523438, 0.0006445646286010742, 0.0006873607635498047, 0.0007301568984985352, 0.0007729530334472656, 0.0008157491683959961, 0.0008585453033447266, 0.000901341438293457, 0.0009441375732421875, 0.000986933708190918, 0.0010297298431396484, 0.001072525978088379, 0.0011153221130371094, 0.0011581182479858398, 0.0012009143829345703, 0.0012437105178833008, 0.0012865066528320312]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 13.0, 13.0, 15.0, 28.0, 24.0, 41.0, 62.0, 100.0, 135.0, 233.0, 312.0, 466.0, 623.0, 1031.0, 1562.0, 2306.0, 3626.0, 5578.0, 9188.0, 14809.0, 23734.0, 38470.0, 59242.0, 86932.0, 116532.0, 138118.0, 140970.0, 123994.0, 96179.0, 66774.0, 43836.0, 27454.0, 17083.0, 10433.0, 6614.0, 4223.0, 2653.0, 1692.0, 1186.0, 727.0, 490.0, 345.0, 219.0, 175.0, 102.0, 75.0, 41.0, 27.0, 19.0, 22.0, 9.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-13.6015625, -13.178466796875, -12.75537109375, -12.332275390625, -11.9091796875, -11.486083984375, -11.06298828125, -10.639892578125, -10.216796875, -9.793701171875, -9.37060546875, -8.947509765625, -8.5244140625, -8.101318359375, -7.67822265625, -7.255126953125, -6.83203125, -6.408935546875, -5.98583984375, -5.562744140625, -5.1396484375, -4.716552734375, -4.29345703125, -3.870361328125, -3.447265625, -3.024169921875, -2.60107421875, -2.177978515625, -1.7548828125, -1.331787109375, -0.90869140625, -0.485595703125, -0.0625, 0.360595703125, 0.78369140625, 1.206787109375, 1.6298828125, 2.052978515625, 2.47607421875, 2.899169921875, 3.322265625, 3.745361328125, 4.16845703125, 4.591552734375, 5.0146484375, 5.437744140625, 5.86083984375, 6.283935546875, 6.70703125, 7.130126953125, 7.55322265625, 7.976318359375, 8.3994140625, 8.822509765625, 9.24560546875, 9.668701171875, 10.091796875, 10.514892578125, 10.93798828125, 11.361083984375, 11.7841796875, 12.207275390625, 12.63037109375, 13.053466796875, 13.4765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 4.0, 13.0, 15.0, 13.0, 12.0, 18.0, 28.0, 22.0, 48.0, 42.0, 56.0, 64.0, 53.0, 69.0, 74.0, 85.0, 63.0, 61.0, 49.0, 46.0, 29.0, 30.0, 31.0, 15.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.25311279296875, -5.0179443359375, -4.78277587890625, -4.547607421875, -4.31243896484375, -4.0772705078125, -3.84210205078125, -3.60693359375, -3.37176513671875, -3.1365966796875, -2.90142822265625, -2.666259765625, -2.43109130859375, -2.1959228515625, -1.96075439453125, -1.7255859375, -1.49041748046875, -1.2552490234375, -1.02008056640625, -0.784912109375, -0.54974365234375, -0.3145751953125, -0.07940673828125, 0.15576171875, 0.39093017578125, 0.6260986328125, 0.86126708984375, 1.096435546875, 1.33160400390625, 1.5667724609375, 1.80194091796875, 2.037109375, 2.27227783203125, 2.5074462890625, 2.74261474609375, 2.977783203125, 3.21295166015625, 3.4481201171875, 3.68328857421875, 3.91845703125, 4.15362548828125, 4.3887939453125, 4.62396240234375, 4.859130859375, 5.09429931640625, 5.3294677734375, 5.56463623046875, 5.7998046875, 6.03497314453125, 6.2701416015625, 6.50531005859375, 6.740478515625, 6.97564697265625, 7.2108154296875, 7.44598388671875, 7.68115234375, 7.91632080078125, 8.1514892578125, 8.38665771484375, 8.621826171875, 8.85699462890625, 9.0921630859375, 9.32733154296875, 9.5625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 9.0, 13.0, 17.0, 17.0, 19.0, 28.0, 30.0, 30.0, 47.0, 28.0, 45.0, 29.0, 33.0, 40.0, 41.0, 41.0, 49.0, 42.0, 39.0, 41.0, 39.0, 34.0, 42.0, 34.0, 30.0, 20.0, 22.0, 17.0, 15.0, 11.0, 15.0, 7.0, 10.0, 8.0, 11.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.053030014038086, -30.091337203979492, -29.1296443939209, -28.167949676513672, -27.206256866455078, -26.244564056396484, -25.28287124633789, -24.321178436279297, -23.359485626220703, -22.39779281616211, -21.436100006103516, -20.474407196044922, -19.512712478637695, -18.5510196685791, -17.589326858520508, -16.627634048461914, -15.665939331054688, -14.704246520996094, -13.742552757263184, -12.78085994720459, -11.81916618347168, -10.857473373413086, -9.895780563354492, -8.934087753295898, -7.972393989562988, -7.010700702667236, -6.049007415771484, -5.087314605712891, -4.125621318817139, -3.1639280319213867, -2.202235221862793, -1.240541934967041, -0.27884674072265625, 0.6828464269638062, 1.6445395946502686, 2.6062326431274414, 3.5679259300231934, 4.529619216918945, 5.491312026977539, 6.453005313873291, 7.414698600769043, 8.376391410827637, 9.338085174560547, 10.29977798461914, 11.261470794677734, 12.223164558410645, 13.184857368469238, 14.146551132202148, 15.108243942260742, 16.069936752319336, 17.03162956237793, 17.993324279785156, 18.95501708984375, 19.916709899902344, 20.878402709960938, 21.84009552001953, 22.801788330078125, 23.76348114013672, 24.725173950195312, 25.686866760253906, 26.648561477661133, 27.610254287719727, 28.57194709777832, 29.533639907836914, 30.49533462524414]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 18.0, 10.0, 15.0, 15.0, 21.0, 32.0, 27.0, 30.0, 30.0, 29.0, 37.0, 34.0, 43.0, 43.0, 43.0, 43.0, 31.0, 44.0, 47.0, 29.0, 46.0, 36.0, 34.0, 24.0, 31.0, 27.0, 31.0, 26.0, 18.0, 20.0, 14.0, 13.0, 4.0, 18.0, 5.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.26028823852539, -42.05245590209961, -40.844627380371094, -39.63679504394531, -38.4289665222168, -37.221134185791016, -36.0133056640625, -34.80547332763672, -33.59764099121094, -32.389808654785156, -31.18198013305664, -29.974149703979492, -28.766319274902344, -27.558486938476562, -26.350656509399414, -25.142826080322266, -23.93499755859375, -22.7271671295166, -21.519336700439453, -20.311506271362305, -19.103675842285156, -17.895843505859375, -16.688013076782227, -15.480182647705078, -14.27235221862793, -13.064521789550781, -11.856691360473633, -10.648859977722168, -9.44102954864502, -8.233199119567871, -7.0253682136535645, -5.817537307739258, -4.609703063964844, -3.401872396469116, -2.1940417289733887, -0.9862110614776611, 0.2216196060180664, 1.4294500350952148, 2.6372809410095215, 3.845111846923828, 5.052942276000977, 6.260772705078125, 7.468603610992432, 8.676434516906738, 9.884264945983887, 11.092095375061035, 12.2999267578125, 13.507757186889648, 14.715587615966797, 15.923418045043945, 17.131248474121094, 18.339078903198242, 19.54690933227539, 20.754741668701172, 21.96257209777832, 23.17040252685547, 24.378232955932617, 25.586063385009766, 26.793893814086914, 28.001724243164062, 29.209556579589844, 30.41738510131836, 31.62521743774414, 32.833045959472656, 34.04087829589844]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 17.0, 28.0, 63.0, 95.0, 140.0, 276.0, 443.0, 752.0, 1280.0, 2092.0, 3471.0, 5726.0, 9546.0, 15471.0, 25116.0, 39791.0, 61101.0, 93259.0, 136488.0, 192828.0, 259412.0, 328742.0, 390402.0, 428681.0, 437050.0, 409938.0, 358612.0, 292087.0, 222666.0, 160705.0, 112356.0, 75213.0, 48748.0, 31253.0, 19797.0, 11964.0, 7562.0, 4512.0, 2683.0, 1632.0, 929.0, 555.0, 339.0, 201.0, 106.0, 62.0, 38.0, 15.0, 15.0, 9.0, 4.0, 3.0, 2.0, 2.0], "bins": [-23.21875, -22.54052734375, -21.8623046875, -21.18408203125, -20.505859375, -19.82763671875, -19.1494140625, -18.47119140625, -17.79296875, -17.11474609375, -16.4365234375, -15.75830078125, -15.080078125, -14.40185546875, -13.7236328125, -13.04541015625, -12.3671875, -11.68896484375, -11.0107421875, -10.33251953125, -9.654296875, -8.97607421875, -8.2978515625, -7.61962890625, -6.94140625, -6.26318359375, -5.5849609375, -4.90673828125, -4.228515625, -3.55029296875, -2.8720703125, -2.19384765625, -1.515625, -0.83740234375, -0.1591796875, 0.51904296875, 1.197265625, 1.87548828125, 2.5537109375, 3.23193359375, 3.91015625, 4.58837890625, 5.2666015625, 5.94482421875, 6.623046875, 7.30126953125, 7.9794921875, 8.65771484375, 9.3359375, 10.01416015625, 10.6923828125, 11.37060546875, 12.048828125, 12.72705078125, 13.4052734375, 14.08349609375, 14.76171875, 15.43994140625, 16.1181640625, 16.79638671875, 17.474609375, 18.15283203125, 18.8310546875, 19.50927734375, 20.1875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 8.0, 16.0, 10.0, 15.0, 20.0, 24.0, 32.0, 25.0, 31.0, 29.0, 38.0, 29.0, 45.0, 40.0, 41.0, 43.0, 39.0, 39.0, 41.0, 39.0, 34.0, 50.0, 36.0, 22.0, 26.0, 36.0, 26.0, 28.0, 25.0, 16.0, 18.0, 14.0, 5.0, 9.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.0, -35.9765625, -34.953125, -33.9296875, -32.90625, -31.8828125, -30.859375, -29.8359375, -28.8125, -27.7890625, -26.765625, -25.7421875, -24.71875, -23.6953125, -22.671875, -21.6484375, -20.625, -19.6015625, -18.578125, -17.5546875, -16.53125, -15.5078125, -14.484375, -13.4609375, -12.4375, -11.4140625, -10.390625, -9.3671875, -8.34375, -7.3203125, -6.296875, -5.2734375, -4.25, -3.2265625, -2.203125, -1.1796875, -0.15625, 0.8671875, 1.890625, 2.9140625, 3.9375, 4.9609375, 5.984375, 7.0078125, 8.03125, 9.0546875, 10.078125, 11.1015625, 12.125, 13.1484375, 14.171875, 15.1953125, 16.21875, 17.2421875, 18.265625, 19.2890625, 20.3125, 21.3359375, 22.359375, 23.3828125, 24.40625, 25.4296875, 26.453125, 27.4765625, 28.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 13.0, 22.0, 24.0, 60.0, 67.0, 144.0, 224.0, 351.0, 624.0, 1253.0, 1968.0, 3274.0, 5392.0, 8858.0, 14000.0, 21752.0, 33935.0, 50841.0, 74152.0, 104245.0, 143658.0, 188994.0, 239821.0, 287337.0, 332175.0, 362686.0, 374090.0, 366841.0, 338533.0, 296597.0, 248793.0, 197517.0, 151720.0, 111183.0, 79250.0, 54125.0, 36791.0, 23662.0, 15162.0, 9607.0, 5834.0, 3652.0, 2087.0, 1250.0, 734.0, 450.0, 247.0, 128.0, 59.0, 40.0, 30.0, 16.0, 11.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.6962890625, -18.064453125, -17.4326171875, -16.80078125, -16.1689453125, -15.537109375, -14.9052734375, -14.2734375, -13.6416015625, -13.009765625, -12.3779296875, -11.74609375, -11.1142578125, -10.482421875, -9.8505859375, -9.21875, -8.5869140625, -7.955078125, -7.3232421875, -6.69140625, -6.0595703125, -5.427734375, -4.7958984375, -4.1640625, -3.5322265625, -2.900390625, -2.2685546875, -1.63671875, -1.0048828125, -0.373046875, 0.2587890625, 0.890625, 1.5224609375, 2.154296875, 2.7861328125, 3.41796875, 4.0498046875, 4.681640625, 5.3134765625, 5.9453125, 6.5771484375, 7.208984375, 7.8408203125, 8.47265625, 9.1044921875, 9.736328125, 10.3681640625, 11.0, 11.6318359375, 12.263671875, 12.8955078125, 13.52734375, 14.1591796875, 14.791015625, 15.4228515625, 16.0546875, 16.6865234375, 17.318359375, 17.9501953125, 18.58203125, 19.2138671875, 19.845703125, 20.4775390625, 21.109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 8.0, 15.0, 14.0, 23.0, 18.0, 38.0, 42.0, 58.0, 55.0, 69.0, 95.0, 119.0, 109.0, 141.0, 159.0, 200.0, 207.0, 227.0, 210.0, 185.0, 235.0, 217.0, 199.0, 189.0, 193.0, 148.0, 135.0, 128.0, 120.0, 98.0, 86.0, 57.0, 58.0, 62.0, 35.0, 29.0, 22.0, 22.0, 9.0, 5.0, 4.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1209716796875, -11.671630859375, -11.2222900390625, -10.77294921875, -10.3236083984375, -9.874267578125, -9.4249267578125, -8.9755859375, -8.5262451171875, -8.076904296875, -7.6275634765625, -7.17822265625, -6.7288818359375, -6.279541015625, -5.8302001953125, -5.380859375, -4.9315185546875, -4.482177734375, -4.0328369140625, -3.58349609375, -3.1341552734375, -2.684814453125, -2.2354736328125, -1.7861328125, -1.3367919921875, -0.887451171875, -0.4381103515625, 0.01123046875, 0.4605712890625, 0.909912109375, 1.3592529296875, 1.80859375, 2.2579345703125, 2.707275390625, 3.1566162109375, 3.60595703125, 4.0552978515625, 4.504638671875, 4.9539794921875, 5.4033203125, 5.8526611328125, 6.302001953125, 6.7513427734375, 7.20068359375, 7.6500244140625, 8.099365234375, 8.5487060546875, 8.998046875, 9.4473876953125, 9.896728515625, 10.3460693359375, 10.79541015625, 11.2447509765625, 11.694091796875, 12.1434326171875, 12.5927734375, 13.0421142578125, 13.491455078125, 13.9407958984375, 14.39013671875, 14.8394775390625, 15.288818359375, 15.7381591796875, 16.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 9.0, 7.0, 24.0, 17.0, 22.0, 24.0, 27.0, 27.0, 26.0, 37.0, 39.0, 39.0, 44.0, 47.0, 42.0, 49.0, 47.0, 53.0, 46.0, 34.0, 36.0, 33.0, 39.0, 33.0, 28.0, 34.0, 17.0, 26.0, 19.0, 15.0, 9.0, 11.0, 13.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.84752655029297, -29.82241439819336, -28.79730224609375, -27.77219009399414, -26.74707794189453, -25.721965789794922, -24.696855545043945, -23.671743392944336, -22.646631240844727, -21.621519088745117, -20.596406936645508, -19.5712947845459, -18.546184539794922, -17.521072387695312, -16.495960235595703, -15.470848083496094, -14.445735931396484, -13.420623779296875, -12.395511627197266, -11.370400428771973, -10.345288276672363, -9.320176124572754, -8.295064926147461, -7.269952774047852, -6.244840621948242, -5.219728469848633, -4.194616794586182, -3.1695048809051514, -2.144392967224121, -1.1192808151245117, -0.09416913986206055, 0.9309425354003906, 1.9560508728027344, 2.9811627864837646, 4.006274700164795, 5.031386375427246, 6.0564985275268555, 7.081610679626465, 8.106721878051758, 9.131834030151367, 10.156946182250977, 11.182058334350586, 12.207170486450195, 13.232281684875488, 14.257393836975098, 15.282505989074707, 16.3076171875, 17.33272933959961, 18.35784149169922, 19.382953643798828, 20.408065795898438, 21.433177947998047, 22.458290100097656, 23.483402252197266, 24.508512496948242, 25.53362464904785, 26.55873680114746, 27.58384895324707, 28.60896110534668, 29.63407325744629, 30.659183502197266, 31.684295654296875, 32.709407806396484, 33.734519958496094, 34.7596321105957]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 10.0, 15.0, 14.0, 23.0, 14.0, 22.0, 30.0, 19.0, 34.0, 40.0, 30.0, 32.0, 29.0, 40.0, 57.0, 34.0, 42.0, 26.0, 35.0, 46.0, 37.0, 37.0, 37.0, 43.0, 22.0, 32.0, 27.0, 22.0, 26.0, 18.0, 13.0, 19.0, 13.0, 8.0, 11.0, 4.0, 5.0, 8.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-37.08695983886719, -35.967811584472656, -34.84865951538086, -33.72951126098633, -32.61035919189453, -31.4912109375, -30.372060775756836, -29.252910614013672, -28.133760452270508, -27.014610290527344, -25.89546012878418, -24.776309967041016, -23.657161712646484, -22.538009643554688, -21.418861389160156, -20.299711227416992, -19.180561065673828, -18.061410903930664, -16.9422607421875, -15.823111534118652, -14.703961372375488, -13.584811210632324, -12.465662002563477, -11.346511840820312, -10.227361679077148, -9.108211517333984, -7.9890618324279785, -6.869912147521973, -5.750761985778809, -4.6316118240356445, -3.5124621391296387, -2.393312454223633, -1.2741661071777344, -0.15501618385314941, 0.9641337394714355, 2.0832836627960205, 3.2024335861206055, 4.3215837478637695, 5.440733432769775, 6.559883117675781, 7.679033279418945, 8.79818344116211, 9.917333602905273, 11.036482810974121, 12.155632972717285, 13.27478313446045, 14.393932342529297, 15.513082504272461, 16.632232666015625, 17.75138282775879, 18.870532989501953, 19.989683151245117, 21.10883331298828, 22.227981567382812, 23.347131729125977, 24.46628189086914, 25.585432052612305, 26.70458221435547, 27.823732376098633, 28.942882537841797, 30.062030792236328, 31.181182861328125, 32.300331115722656, 33.41947937011719, 34.538631439208984]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 7.0, 15.0, 27.0, 38.0, 53.0, 67.0, 111.0, 168.0, 227.0, 405.0, 581.0, 908.0, 1382.0, 2196.0, 3347.0, 5167.0, 8252.0, 12689.0, 20254.0, 32196.0, 51602.0, 83330.0, 132750.0, 183088.0, 177026.0, 125193.0, 77510.0, 47668.0, 30017.0, 18817.0, 12029.0, 7764.0, 4792.0, 3127.0, 1996.0, 1312.0, 854.0, 552.0, 352.0, 227.0, 133.0, 94.0, 86.0, 38.0, 36.0, 26.0, 21.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.6328125, -7.385986328125, -7.13916015625, -6.892333984375, -6.6455078125, -6.398681640625, -6.15185546875, -5.905029296875, -5.658203125, -5.411376953125, -5.16455078125, -4.917724609375, -4.6708984375, -4.424072265625, -4.17724609375, -3.930419921875, -3.68359375, -3.436767578125, -3.18994140625, -2.943115234375, -2.6962890625, -2.449462890625, -2.20263671875, -1.955810546875, -1.708984375, -1.462158203125, -1.21533203125, -0.968505859375, -0.7216796875, -0.474853515625, -0.22802734375, 0.018798828125, 0.265625, 0.512451171875, 0.75927734375, 1.006103515625, 1.2529296875, 1.499755859375, 1.74658203125, 1.993408203125, 2.240234375, 2.487060546875, 2.73388671875, 2.980712890625, 3.2275390625, 3.474365234375, 3.72119140625, 3.968017578125, 4.21484375, 4.461669921875, 4.70849609375, 4.955322265625, 5.2021484375, 5.448974609375, 5.69580078125, 5.942626953125, 6.189453125, 6.436279296875, 6.68310546875, 6.929931640625, 7.1767578125, 7.423583984375, 7.67041015625, 7.917236328125, 8.1640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 11.0, 16.0, 13.0, 22.0, 17.0, 22.0, 30.0, 20.0, 31.0, 41.0, 32.0, 32.0, 33.0, 38.0, 56.0, 31.0, 42.0, 25.0, 39.0, 41.0, 40.0, 37.0, 37.0, 39.0, 28.0, 28.0, 28.0, 23.0, 24.0, 18.0, 13.0, 18.0, 12.0, 9.0, 10.0, 5.0, 5.0, 8.0, 6.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-36.90625, -35.79150390625, -34.6767578125, -33.56201171875, -32.447265625, -31.33251953125, -30.2177734375, -29.10302734375, -27.98828125, -26.87353515625, -25.7587890625, -24.64404296875, -23.529296875, -22.41455078125, -21.2998046875, -20.18505859375, -19.0703125, -17.95556640625, -16.8408203125, -15.72607421875, -14.611328125, -13.49658203125, -12.3818359375, -11.26708984375, -10.15234375, -9.03759765625, -7.9228515625, -6.80810546875, -5.693359375, -4.57861328125, -3.4638671875, -2.34912109375, -1.234375, -0.11962890625, 0.9951171875, 2.10986328125, 3.224609375, 4.33935546875, 5.4541015625, 6.56884765625, 7.68359375, 8.79833984375, 9.9130859375, 11.02783203125, 12.142578125, 13.25732421875, 14.3720703125, 15.48681640625, 16.6015625, 17.71630859375, 18.8310546875, 19.94580078125, 21.060546875, 22.17529296875, 23.2900390625, 24.40478515625, 25.51953125, 26.63427734375, 27.7490234375, 28.86376953125, 29.978515625, 31.09326171875, 32.2080078125, 33.32275390625, 34.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 14.0, 10.0, 18.0, 27.0, 37.0, 52.0, 67.0, 81.0, 103.0, 178.0, 266.0, 290.0, 414.0, 631.0, 957.0, 1435.0, 2320.0, 3738.0, 6822.0, 13898.0, 35092.0, 118197.0, 437367.0, 300933.0, 75140.0, 25047.0, 10697.0, 5361.0, 3200.0, 1974.0, 1289.0, 831.0, 599.0, 429.0, 271.0, 209.0, 133.0, 113.0, 65.0, 52.0, 51.0, 34.0, 31.0, 15.0, 16.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-15.65625, -15.1793212890625, -14.702392578125, -14.2254638671875, -13.74853515625, -13.2716064453125, -12.794677734375, -12.3177490234375, -11.8408203125, -11.3638916015625, -10.886962890625, -10.4100341796875, -9.93310546875, -9.4561767578125, -8.979248046875, -8.5023193359375, -8.025390625, -7.5484619140625, -7.071533203125, -6.5946044921875, -6.11767578125, -5.6407470703125, -5.163818359375, -4.6868896484375, -4.2099609375, -3.7330322265625, -3.256103515625, -2.7791748046875, -2.30224609375, -1.8253173828125, -1.348388671875, -0.8714599609375, -0.39453125, 0.0823974609375, 0.559326171875, 1.0362548828125, 1.51318359375, 1.9901123046875, 2.467041015625, 2.9439697265625, 3.4208984375, 3.8978271484375, 4.374755859375, 4.8516845703125, 5.32861328125, 5.8055419921875, 6.282470703125, 6.7593994140625, 7.236328125, 7.7132568359375, 8.190185546875, 8.6671142578125, 9.14404296875, 9.6209716796875, 10.097900390625, 10.5748291015625, 11.0517578125, 11.5286865234375, 12.005615234375, 12.4825439453125, 12.95947265625, 13.4364013671875, 13.913330078125, 14.3902587890625, 14.8671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 13.0, 15.0, 15.0, 23.0, 17.0, 27.0, 31.0, 29.0, 30.0, 40.0, 32.0, 41.0, 35.0, 30.0, 32.0, 43.0, 44.0, 55.0, 40.0, 40.0, 24.0, 41.0, 36.0, 34.0, 32.0, 16.0, 24.0, 16.0, 23.0, 22.0, 12.0, 9.0, 8.0, 8.0, 9.0, 6.0, 4.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0], "bins": [-29.109375, -28.2900390625, -27.470703125, -26.6513671875, -25.83203125, -25.0126953125, -24.193359375, -23.3740234375, -22.5546875, -21.7353515625, -20.916015625, -20.0966796875, -19.27734375, -18.4580078125, -17.638671875, -16.8193359375, -16.0, -15.1806640625, -14.361328125, -13.5419921875, -12.72265625, -11.9033203125, -11.083984375, -10.2646484375, -9.4453125, -8.6259765625, -7.806640625, -6.9873046875, -6.16796875, -5.3486328125, -4.529296875, -3.7099609375, -2.890625, -2.0712890625, -1.251953125, -0.4326171875, 0.38671875, 1.2060546875, 2.025390625, 2.8447265625, 3.6640625, 4.4833984375, 5.302734375, 6.1220703125, 6.94140625, 7.7607421875, 8.580078125, 9.3994140625, 10.21875, 11.0380859375, 11.857421875, 12.6767578125, 13.49609375, 14.3154296875, 15.134765625, 15.9541015625, 16.7734375, 17.5927734375, 18.412109375, 19.2314453125, 20.05078125, 20.8701171875, 21.689453125, 22.5087890625, 23.328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 8.0, 8.0, 17.0, 28.0, 40.0, 61.0, 91.0, 118.0, 227.0, 323.0, 527.0, 841.0, 1546.0, 2912.0, 5967.0, 14515.0, 40272.0, 214013.0, 640836.0, 83112.0, 23817.0, 9547.0, 4316.0, 2255.0, 1172.0, 689.0, 434.0, 277.0, 182.0, 138.0, 84.0, 52.0, 38.0, 26.0, 19.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.5108642578125, -13.092041015625, -12.6732177734375, -12.25439453125, -11.8355712890625, -11.416748046875, -10.9979248046875, -10.5791015625, -10.1602783203125, -9.741455078125, -9.3226318359375, -8.90380859375, -8.4849853515625, -8.066162109375, -7.6473388671875, -7.228515625, -6.8096923828125, -6.390869140625, -5.9720458984375, -5.55322265625, -5.1343994140625, -4.715576171875, -4.2967529296875, -3.8779296875, -3.4591064453125, -3.040283203125, -2.6214599609375, -2.20263671875, -1.7838134765625, -1.364990234375, -0.9461669921875, -0.52734375, -0.1085205078125, 0.310302734375, 0.7291259765625, 1.14794921875, 1.5667724609375, 1.985595703125, 2.4044189453125, 2.8232421875, 3.2420654296875, 3.660888671875, 4.0797119140625, 4.49853515625, 4.9173583984375, 5.336181640625, 5.7550048828125, 6.173828125, 6.5926513671875, 7.011474609375, 7.4302978515625, 7.84912109375, 8.2679443359375, 8.686767578125, 9.1055908203125, 9.5244140625, 9.9432373046875, 10.362060546875, 10.7808837890625, 11.19970703125, 11.6185302734375, 12.037353515625, 12.4561767578125, 12.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 8.0, 14.0, 28.0, 33.0, 60.0, 127.0, 195.0, 161.0, 134.0, 65.0, 37.0, 23.0, 11.0, 15.0, 8.0, 11.0, 6.0, 2.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014047622680664062, -0.00136469304561615, -0.0013246238231658936, -0.0012845546007156372, -0.0012444853782653809, -0.0012044161558151245, -0.0011643469333648682, -0.0011242777109146118, -0.0010842084884643555, -0.0010441392660140991, -0.0010040700435638428, -0.0009640008211135864, -0.0009239315986633301, -0.0008838623762130737, -0.0008437931537628174, -0.000803723931312561, -0.0007636547088623047, -0.0007235854864120483, -0.000683516263961792, -0.0006434470415115356, -0.0006033778190612793, -0.000563308596611023, -0.0005232393741607666, -0.00048317015171051025, -0.0004431009292602539, -0.00040303170680999756, -0.0003629624843597412, -0.00032289326190948486, -0.0002828240394592285, -0.00024275481700897217, -0.00020268559455871582, -0.00016261637210845947, -0.00012254714965820312, -8.247792720794678e-05, -4.240870475769043e-05, -2.339482307434082e-06, 3.7729740142822266e-05, 7.779896259307861e-05, 0.00011786818504333496, 0.0001579374074935913, 0.00019800662994384766, 0.000238075852394104, 0.00027814507484436035, 0.0003182142972946167, 0.00035828351974487305, 0.0003983527421951294, 0.00043842196464538574, 0.0004784911870956421, 0.0005185604095458984, 0.0005586296319961548, 0.0005986988544464111, 0.0006387680768966675, 0.0006788372993469238, 0.0007189065217971802, 0.0007589757442474365, 0.0007990449666976929, 0.0008391141891479492, 0.0008791834115982056, 0.0009192526340484619, 0.0009593218564987183, 0.0009993910789489746, 0.001039460301399231, 0.0010795295238494873, 0.0011195987462997437, 0.00115966796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 18.0, 12.0, 26.0, 41.0, 50.0, 61.0, 121.0, 165.0, 250.0, 399.0, 693.0, 1170.0, 2149.0, 4031.0, 7431.0, 14124.0, 29954.0, 66507.0, 155203.0, 306899.0, 251208.0, 112386.0, 49093.0, 22376.0, 11016.0, 5742.0, 3030.0, 1775.0, 985.0, 586.0, 398.0, 231.0, 126.0, 74.0, 78.0, 37.0, 29.0, 23.0, 18.0, 12.0, 8.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.90625, -8.6171875, -8.328125, -8.0390625, -7.75, -7.4609375, -7.171875, -6.8828125, -6.59375, -6.3046875, -6.015625, -5.7265625, -5.4375, -5.1484375, -4.859375, -4.5703125, -4.28125, -3.9921875, -3.703125, -3.4140625, -3.125, -2.8359375, -2.546875, -2.2578125, -1.96875, -1.6796875, -1.390625, -1.1015625, -0.8125, -0.5234375, -0.234375, 0.0546875, 0.34375, 0.6328125, 0.921875, 1.2109375, 1.5, 1.7890625, 2.078125, 2.3671875, 2.65625, 2.9453125, 3.234375, 3.5234375, 3.8125, 4.1015625, 4.390625, 4.6796875, 4.96875, 5.2578125, 5.546875, 5.8359375, 6.125, 6.4140625, 6.703125, 6.9921875, 7.28125, 7.5703125, 7.859375, 8.1484375, 8.4375, 8.7265625, 9.015625, 9.3046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 10.0, 10.0, 8.0, 11.0, 15.0, 17.0, 28.0, 25.0, 37.0, 50.0, 45.0, 49.0, 68.0, 75.0, 73.0, 64.0, 71.0, 47.0, 54.0, 42.0, 30.0, 22.0, 13.0, 21.0, 20.0, 13.0, 13.0, 8.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.681640625, -3.57159423828125, -3.4615478515625, -3.35150146484375, -3.241455078125, -3.13140869140625, -3.0213623046875, -2.91131591796875, -2.80126953125, -2.69122314453125, -2.5811767578125, -2.47113037109375, -2.361083984375, -2.25103759765625, -2.1409912109375, -2.03094482421875, -1.9208984375, -1.81085205078125, -1.7008056640625, -1.59075927734375, -1.480712890625, -1.37066650390625, -1.2606201171875, -1.15057373046875, -1.04052734375, -0.93048095703125, -0.8204345703125, -0.71038818359375, -0.600341796875, -0.49029541015625, -0.3802490234375, -0.27020263671875, -0.16015625, -0.05010986328125, 0.0599365234375, 0.16998291015625, 0.280029296875, 0.39007568359375, 0.5001220703125, 0.61016845703125, 0.72021484375, 0.83026123046875, 0.9403076171875, 1.05035400390625, 1.160400390625, 1.27044677734375, 1.3804931640625, 1.49053955078125, 1.6005859375, 1.71063232421875, 1.8206787109375, 1.93072509765625, 2.040771484375, 2.15081787109375, 2.2608642578125, 2.37091064453125, 2.48095703125, 2.59100341796875, 2.7010498046875, 2.81109619140625, 2.921142578125, 3.03118896484375, 3.1412353515625, 3.25128173828125, 3.361328125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 7.0, 6.0, 9.0, 14.0, 12.0, 21.0, 25.0, 29.0, 23.0, 34.0, 25.0, 34.0, 43.0, 43.0, 45.0, 39.0, 47.0, 50.0, 38.0, 58.0, 42.0, 34.0, 43.0, 42.0, 34.0, 31.0, 30.0, 26.0, 26.0, 19.0, 20.0, 13.0, 11.0, 8.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.220537185668945, -30.17650032043457, -29.132461547851562, -28.088424682617188, -27.044387817382812, -26.000350952148438, -24.95631217956543, -23.912275314331055, -22.868236541748047, -21.824199676513672, -20.780160903930664, -19.73612403869629, -18.692087173461914, -17.648048400878906, -16.60401153564453, -15.559974670410156, -14.515937805175781, -13.47189998626709, -12.427863121032715, -11.383825302124023, -10.339788436889648, -9.295750617980957, -8.251712799072266, -7.207675457000732, -6.163638114929199, -5.119600772857666, -4.075563430786133, -3.0315256118774414, -1.9874882698059082, -0.943450927734375, 0.1005868911743164, 1.1446242332458496, 2.18865966796875, 3.232697010040283, 4.276734352111816, 5.320772171020508, 6.364809513092041, 7.408846855163574, 8.452884674072266, 9.49692153930664, 10.540959358215332, 11.584997177124023, 12.629034042358398, 13.67307186126709, 14.717109680175781, 15.761146545410156, 16.80518341064453, 17.84922218322754, 18.893259048461914, 19.93729591369629, 20.981334686279297, 22.025371551513672, 23.069408416748047, 24.113445281982422, 25.15748405456543, 26.201520919799805, 27.245559692382812, 28.289596557617188, 29.333635330200195, 30.37767219543457, 31.421709060668945, 32.46574783325195, 33.50978469848633, 34.5538215637207, 35.59785842895508]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 14.0, 11.0, 18.0, 27.0, 20.0, 21.0, 30.0, 26.0, 41.0, 20.0, 42.0, 43.0, 38.0, 45.0, 40.0, 33.0, 38.0, 34.0, 47.0, 39.0, 32.0, 31.0, 41.0, 24.0, 38.0, 23.0, 28.0, 21.0, 22.0, 23.0, 14.0, 11.0, 9.0, 6.0, 6.0, 7.0, 8.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.48810577392578, -35.36256790161133, -34.237030029296875, -33.111488342285156, -31.985950469970703, -30.86041259765625, -29.734872817993164, -28.609333038330078, -27.483795166015625, -26.358257293701172, -25.232717514038086, -24.107177734375, -22.981639862060547, -21.856101989746094, -20.730562210083008, -19.605022430419922, -18.47948455810547, -17.353946685791016, -16.22840690612793, -15.10286808013916, -13.97732925415039, -12.851790428161621, -11.726251602172852, -10.600712776184082, -9.475173950195312, -8.349635124206543, -7.224096298217773, -6.098557472229004, -4.973018646240234, -3.847479820251465, -2.7219409942626953, -1.5964021682739258, -0.4708671569824219, 0.6546716690063477, 1.7802104949951172, 2.9057493209838867, 4.031288146972656, 5.156826972961426, 6.282365798950195, 7.407904624938965, 8.533443450927734, 9.658982276916504, 10.784521102905273, 11.910059928894043, 13.035598754882812, 14.161137580871582, 15.286676406860352, 16.412216186523438, 17.53775405883789, 18.663291931152344, 19.78883171081543, 20.914371490478516, 22.03990936279297, 23.165447235107422, 24.290987014770508, 25.416526794433594, 26.542064666748047, 27.6676025390625, 28.793142318725586, 29.918682098388672, 31.044219970703125, 32.16975784301758, 33.29529571533203, 34.42083740234375, 35.5463752746582]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 4.0, 9.0, 14.0, 36.0, 51.0, 73.0, 144.0, 197.0, 286.0, 513.0, 804.0, 1275.0, 1976.0, 3022.0, 4779.0, 7312.0, 10481.0, 16014.0, 22710.0, 31626.0, 42832.0, 55120.0, 67682.0, 79661.0, 89057.0, 94130.0, 93701.0, 88241.0, 78430.0, 66441.0, 53199.0, 41284.0, 30523.0, 21824.0, 15456.0, 10212.0, 6826.0, 4515.0, 3042.0, 1855.0, 1221.0, 735.0, 489.0, 261.0, 162.0, 120.0, 95.0, 44.0, 30.0, 19.0, 10.0, 12.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.474365234375, -16.87060546875, -16.266845703125, -15.6630859375, -15.059326171875, -14.45556640625, -13.851806640625, -13.248046875, -12.644287109375, -12.04052734375, -11.436767578125, -10.8330078125, -10.229248046875, -9.62548828125, -9.021728515625, -8.41796875, -7.814208984375, -7.21044921875, -6.606689453125, -6.0029296875, -5.399169921875, -4.79541015625, -4.191650390625, -3.587890625, -2.984130859375, -2.38037109375, -1.776611328125, -1.1728515625, -0.569091796875, 0.03466796875, 0.638427734375, 1.2421875, 1.845947265625, 2.44970703125, 3.053466796875, 3.6572265625, 4.260986328125, 4.86474609375, 5.468505859375, 6.072265625, 6.676025390625, 7.27978515625, 7.883544921875, 8.4873046875, 9.091064453125, 9.69482421875, 10.298583984375, 10.90234375, 11.506103515625, 12.10986328125, 12.713623046875, 13.3173828125, 13.921142578125, 14.52490234375, 15.128662109375, 15.732421875, 16.336181640625, 16.93994140625, 17.543701171875, 18.1474609375, 18.751220703125, 19.35498046875, 19.958740234375, 20.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 5.0, 13.0, 13.0, 19.0, 23.0, 22.0, 20.0, 26.0, 29.0, 38.0, 21.0, 40.0, 42.0, 38.0, 45.0, 41.0, 34.0, 36.0, 39.0, 41.0, 42.0, 34.0, 30.0, 41.0, 25.0, 37.0, 26.0, 27.0, 23.0, 18.0, 26.0, 13.0, 12.0, 8.0, 8.0, 6.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.6875, -34.591796875, -33.49609375, -32.400390625, -31.3046875, -30.208984375, -29.11328125, -28.017578125, -26.921875, -25.826171875, -24.73046875, -23.634765625, -22.5390625, -21.443359375, -20.34765625, -19.251953125, -18.15625, -17.060546875, -15.96484375, -14.869140625, -13.7734375, -12.677734375, -11.58203125, -10.486328125, -9.390625, -8.294921875, -7.19921875, -6.103515625, -5.0078125, -3.912109375, -2.81640625, -1.720703125, -0.625, 0.470703125, 1.56640625, 2.662109375, 3.7578125, 4.853515625, 5.94921875, 7.044921875, 8.140625, 9.236328125, 10.33203125, 11.427734375, 12.5234375, 13.619140625, 14.71484375, 15.810546875, 16.90625, 18.001953125, 19.09765625, 20.193359375, 21.2890625, 22.384765625, 23.48046875, 24.576171875, 25.671875, 26.767578125, 27.86328125, 28.958984375, 30.0546875, 31.150390625, 32.24609375, 33.341796875, 34.4375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 14.0, 40.0, 53.0, 65.0, 107.0, 189.0, 287.0, 466.0, 658.0, 1106.0, 1807.0, 2886.0, 4513.0, 7057.0, 10865.0, 16319.0, 24354.0, 35061.0, 48256.0, 64067.0, 80390.0, 94310.0, 103721.0, 105999.0, 99785.0, 88039.0, 72357.0, 56515.0, 41511.0, 29723.0, 20149.0, 13506.0, 8979.0, 5556.0, 3595.0, 2310.0, 1456.0, 893.0, 622.0, 340.0, 219.0, 147.0, 101.0, 47.0, 37.0, 25.0, 15.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.545166015625, -20.85595703125, -20.166748046875, -19.4775390625, -18.788330078125, -18.09912109375, -17.409912109375, -16.720703125, -16.031494140625, -15.34228515625, -14.653076171875, -13.9638671875, -13.274658203125, -12.58544921875, -11.896240234375, -11.20703125, -10.517822265625, -9.82861328125, -9.139404296875, -8.4501953125, -7.760986328125, -7.07177734375, -6.382568359375, -5.693359375, -5.004150390625, -4.31494140625, -3.625732421875, -2.9365234375, -2.247314453125, -1.55810546875, -0.868896484375, -0.1796875, 0.509521484375, 1.19873046875, 1.887939453125, 2.5771484375, 3.266357421875, 3.95556640625, 4.644775390625, 5.333984375, 6.023193359375, 6.71240234375, 7.401611328125, 8.0908203125, 8.780029296875, 9.46923828125, 10.158447265625, 10.84765625, 11.536865234375, 12.22607421875, 12.915283203125, 13.6044921875, 14.293701171875, 14.98291015625, 15.672119140625, 16.361328125, 17.050537109375, 17.73974609375, 18.428955078125, 19.1181640625, 19.807373046875, 20.49658203125, 21.185791015625, 21.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 9.0, 8.0, 13.0, 6.0, 19.0, 13.0, 24.0, 18.0, 31.0, 21.0, 26.0, 39.0, 26.0, 36.0, 46.0, 34.0, 42.0, 44.0, 48.0, 44.0, 48.0, 45.0, 34.0, 43.0, 35.0, 30.0, 38.0, 24.0, 22.0, 22.0, 14.0, 19.0, 15.0, 11.0, 14.0, 6.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.0625, -26.297119140625, -25.53173828125, -24.766357421875, -24.0009765625, -23.235595703125, -22.47021484375, -21.704833984375, -20.939453125, -20.174072265625, -19.40869140625, -18.643310546875, -17.8779296875, -17.112548828125, -16.34716796875, -15.581787109375, -14.81640625, -14.051025390625, -13.28564453125, -12.520263671875, -11.7548828125, -10.989501953125, -10.22412109375, -9.458740234375, -8.693359375, -7.927978515625, -7.16259765625, -6.397216796875, -5.6318359375, -4.866455078125, -4.10107421875, -3.335693359375, -2.5703125, -1.804931640625, -1.03955078125, -0.274169921875, 0.4912109375, 1.256591796875, 2.02197265625, 2.787353515625, 3.552734375, 4.318115234375, 5.08349609375, 5.848876953125, 6.6142578125, 7.379638671875, 8.14501953125, 8.910400390625, 9.67578125, 10.441162109375, 11.20654296875, 11.971923828125, 12.7373046875, 13.502685546875, 14.26806640625, 15.033447265625, 15.798828125, 16.564208984375, 17.32958984375, 18.094970703125, 18.8603515625, 19.625732421875, 20.39111328125, 21.156494140625, 21.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 7.0, 2.0, 5.0, 9.0, 11.0, 14.0, 41.0, 53.0, 69.0, 110.0, 194.0, 283.0, 464.0, 736.0, 1174.0, 1859.0, 3009.0, 5106.0, 8229.0, 13662.0, 22752.0, 36735.0, 56916.0, 82765.0, 109868.0, 130962.0, 137229.0, 126021.0, 102838.0, 75287.0, 50223.0, 31783.0, 19766.0, 11842.0, 7087.0, 4318.0, 2641.0, 1657.0, 1071.0, 633.0, 391.0, 257.0, 171.0, 103.0, 64.0, 43.0, 31.0, 24.0, 18.0, 11.0, 10.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.225341796875, -9.86474609375, -9.504150390625, -9.1435546875, -8.782958984375, -8.42236328125, -8.061767578125, -7.701171875, -7.340576171875, -6.97998046875, -6.619384765625, -6.2587890625, -5.898193359375, -5.53759765625, -5.177001953125, -4.81640625, -4.455810546875, -4.09521484375, -3.734619140625, -3.3740234375, -3.013427734375, -2.65283203125, -2.292236328125, -1.931640625, -1.571044921875, -1.21044921875, -0.849853515625, -0.4892578125, -0.128662109375, 0.23193359375, 0.592529296875, 0.953125, 1.313720703125, 1.67431640625, 2.034912109375, 2.3955078125, 2.756103515625, 3.11669921875, 3.477294921875, 3.837890625, 4.198486328125, 4.55908203125, 4.919677734375, 5.2802734375, 5.640869140625, 6.00146484375, 6.362060546875, 6.72265625, 7.083251953125, 7.44384765625, 7.804443359375, 8.1650390625, 8.525634765625, 8.88623046875, 9.246826171875, 9.607421875, 9.968017578125, 10.32861328125, 10.689208984375, 11.0498046875, 11.410400390625, 11.77099609375, 12.131591796875, 12.4921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 12.0, 15.0, 24.0, 15.0, 18.0, 27.0, 30.0, 22.0, 30.0, 33.0, 42.0, 38.0, 52.0, 45.0, 41.0, 46.0, 38.0, 37.0, 31.0, 38.0, 44.0, 37.0, 29.0, 28.0, 19.0, 31.0, 16.0, 19.0, 21.0, 11.0, 9.0, 14.0, 16.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00106048583984375, -0.0010278522968292236, -0.0009952187538146973, -0.0009625852108001709, -0.0009299516677856445, -0.0008973181247711182, -0.0008646845817565918, -0.0008320510387420654, -0.0007994174957275391, -0.0007667839527130127, -0.0007341504096984863, -0.00070151686668396, -0.0006688833236694336, -0.0006362497806549072, -0.0006036162376403809, -0.0005709826946258545, -0.0005383491516113281, -0.0005057156085968018, -0.0004730820655822754, -0.000440448522567749, -0.00040781497955322266, -0.0003751814365386963, -0.0003425478935241699, -0.00030991435050964355, -0.0002772808074951172, -0.0002446472644805908, -0.00021201372146606445, -0.00017938017845153809, -0.00014674663543701172, -0.00011411309242248535, -8.147954940795898e-05, -4.884600639343262e-05, -1.621246337890625e-05, 1.6421079635620117e-05, 4.9054622650146484e-05, 8.168816566467285e-05, 0.00011432170867919922, 0.00014695525169372559, 0.00017958879470825195, 0.00021222233772277832, 0.0002448558807373047, 0.00027748942375183105, 0.0003101229667663574, 0.0003427565097808838, 0.00037539005279541016, 0.0004080235958099365, 0.0004406571388244629, 0.00047329068183898926, 0.0005059242248535156, 0.000538557767868042, 0.0005711913108825684, 0.0006038248538970947, 0.0006364583969116211, 0.0006690919399261475, 0.0007017254829406738, 0.0007343590259552002, 0.0007669925689697266, 0.0007996261119842529, 0.0008322596549987793, 0.0008648931980133057, 0.000897526741027832, 0.0009301602840423584, 0.0009627938270568848, 0.0009954273700714111, 0.0010280609130859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 16.0, 22.0, 30.0, 43.0, 63.0, 80.0, 169.0, 239.0, 407.0, 723.0, 1217.0, 2258.0, 3994.0, 7449.0, 14008.0, 26347.0, 46875.0, 79317.0, 119245.0, 154922.0, 167833.0, 148694.0, 110735.0, 71652.0, 41930.0, 23056.0, 12308.0, 6555.0, 3594.0, 1979.0, 1125.0, 632.0, 365.0, 208.0, 162.0, 98.0, 48.0, 30.0, 26.0, 24.0, 21.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8984375, -13.4256591796875, -12.952880859375, -12.4801025390625, -12.00732421875, -11.5345458984375, -11.061767578125, -10.5889892578125, -10.1162109375, -9.6434326171875, -9.170654296875, -8.6978759765625, -8.22509765625, -7.7523193359375, -7.279541015625, -6.8067626953125, -6.333984375, -5.8612060546875, -5.388427734375, -4.9156494140625, -4.44287109375, -3.9700927734375, -3.497314453125, -3.0245361328125, -2.5517578125, -2.0789794921875, -1.606201171875, -1.1334228515625, -0.66064453125, -0.1878662109375, 0.284912109375, 0.7576904296875, 1.23046875, 1.7032470703125, 2.176025390625, 2.6488037109375, 3.12158203125, 3.5943603515625, 4.067138671875, 4.5399169921875, 5.0126953125, 5.4854736328125, 5.958251953125, 6.4310302734375, 6.90380859375, 7.3765869140625, 7.849365234375, 8.3221435546875, 8.794921875, 9.2677001953125, 9.740478515625, 10.2132568359375, 10.68603515625, 11.1588134765625, 11.631591796875, 12.1043701171875, 12.5771484375, 13.0499267578125, 13.522705078125, 13.9954833984375, 14.46826171875, 14.9410400390625, 15.413818359375, 15.8865966796875, 16.359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 9.0, 3.0, 8.0, 3.0, 4.0, 7.0, 16.0, 10.0, 19.0, 24.0, 31.0, 29.0, 25.0, 43.0, 46.0, 48.0, 47.0, 41.0, 53.0, 45.0, 74.0, 57.0, 49.0, 48.0, 44.0, 28.0, 30.0, 36.0, 26.0, 18.0, 19.0, 13.0, 8.0, 9.0, 10.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.40625, -6.21484375, -6.0234375, -5.83203125, -5.640625, -5.44921875, -5.2578125, -5.06640625, -4.875, -4.68359375, -4.4921875, -4.30078125, -4.109375, -3.91796875, -3.7265625, -3.53515625, -3.34375, -3.15234375, -2.9609375, -2.76953125, -2.578125, -2.38671875, -2.1953125, -2.00390625, -1.8125, -1.62109375, -1.4296875, -1.23828125, -1.046875, -0.85546875, -0.6640625, -0.47265625, -0.28125, -0.08984375, 0.1015625, 0.29296875, 0.484375, 0.67578125, 0.8671875, 1.05859375, 1.25, 1.44140625, 1.6328125, 1.82421875, 2.015625, 2.20703125, 2.3984375, 2.58984375, 2.78125, 2.97265625, 3.1640625, 3.35546875, 3.546875, 3.73828125, 3.9296875, 4.12109375, 4.3125, 4.50390625, 4.6953125, 4.88671875, 5.078125, 5.26953125, 5.4609375, 5.65234375, 5.84375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 14.0, 12.0, 19.0, 17.0, 24.0, 28.0, 29.0, 32.0, 37.0, 44.0, 62.0, 41.0, 39.0, 47.0, 46.0, 44.0, 47.0, 48.0, 44.0, 32.0, 30.0, 41.0, 43.0, 32.0, 23.0, 19.0, 19.0, 15.0, 11.0, 11.0, 13.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.589250564575195, -28.527496337890625, -27.465742111206055, -26.403987884521484, -25.342233657836914, -24.280479431152344, -23.218727111816406, -22.156970977783203, -21.095218658447266, -20.033464431762695, -18.971710205078125, -17.909955978393555, -16.848201751708984, -15.786447525024414, -14.72469425201416, -13.66294002532959, -12.601184844970703, -11.539430618286133, -10.477676391601562, -9.415922164916992, -8.354167938232422, -7.29241418838501, -6.230660438537598, -5.168906211853027, -4.107151985168457, -3.0453977584838867, -1.9836437702178955, -0.9218897819519043, 0.13986444473266602, 1.2016186714172363, 2.2633724212646484, 3.3251266479492188, 4.386878967285156, 5.448633193969727, 6.510387420654297, 7.572141170501709, 8.633895874023438, 9.695650100708008, 10.757403373718262, 11.819157600402832, 12.880911827087402, 13.942666053771973, 15.004420280456543, 16.066173553466797, 17.127927780151367, 18.189682006835938, 19.251436233520508, 20.313190460205078, 21.37494468688965, 22.43669891357422, 23.49845314025879, 24.56020736694336, 25.62196159362793, 26.6837158203125, 27.745468139648438, 28.80722427368164, 29.868976593017578, 30.93073081970215, 31.99248504638672, 33.054237365722656, 34.11599349975586, 35.1777458190918, 36.239501953125, 37.30125427246094, 38.36301040649414]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 13.0, 16.0, 22.0, 18.0, 21.0, 35.0, 43.0, 35.0, 42.0, 38.0, 34.0, 36.0, 44.0, 53.0, 49.0, 51.0, 51.0, 43.0, 48.0, 39.0, 36.0, 29.0, 28.0, 20.0, 24.0, 23.0, 16.0, 11.0, 11.0, 14.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.754581451416016, -46.424312591552734, -45.09404373168945, -43.76377487182617, -42.433502197265625, -41.103233337402344, -39.77296447753906, -38.44269561767578, -37.1124267578125, -35.78215789794922, -34.45188903808594, -33.121620178222656, -31.791349411010742, -30.46108055114746, -29.130809783935547, -27.800540924072266, -26.470272064208984, -25.140003204345703, -23.809734344482422, -22.479463577270508, -21.149194717407227, -19.818925857543945, -18.48865509033203, -17.15838623046875, -15.828117370605469, -14.497848510742188, -13.16757869720459, -11.837308883666992, -10.507040023803711, -9.17677116394043, -7.846501350402832, -6.516231536865234, -5.1859588623046875, -3.855689525604248, -2.5254201889038086, -1.1951508522033691, 0.1351184844970703, 1.4653878211975098, 2.795657157897949, 4.125926971435547, 5.456195831298828, 6.786465167999268, 8.116734504699707, 9.447004318237305, 10.777273178100586, 12.107542037963867, 13.437811851501465, 14.768081665039062, 16.098350524902344, 17.428619384765625, 18.758888244628906, 20.08915901184082, 21.4194278717041, 22.749696731567383, 24.079967498779297, 25.410236358642578, 26.74050521850586, 28.07077407836914, 29.401042938232422, 30.731313705444336, 32.06158447265625, 33.39185333251953, 34.72212219238281, 36.052391052246094, 37.382659912109375]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 16.0, 22.0, 36.0, 60.0, 108.0, 176.0, 288.0, 495.0, 838.0, 1225.0, 2135.0, 3420.0, 5597.0, 9207.0, 14734.0, 23686.0, 37308.0, 57882.0, 87196.0, 127264.0, 179276.0, 241164.0, 307986.0, 368958.0, 413128.0, 428317.0, 412362.0, 368871.0, 307473.0, 241890.0, 179876.0, 128276.0, 87265.0, 57948.0, 37517.0, 24051.0, 14866.0, 9250.0, 5550.0, 3423.0, 2094.0, 1294.0, 705.0, 431.0, 264.0, 148.0, 89.0, 52.0, 28.0, 13.0, 7.0, 6.0, 3.0, 4.0, 2.0], "bins": [-23.265625, -22.59130859375, -21.9169921875, -21.24267578125, -20.568359375, -19.89404296875, -19.2197265625, -18.54541015625, -17.87109375, -17.19677734375, -16.5224609375, -15.84814453125, -15.173828125, -14.49951171875, -13.8251953125, -13.15087890625, -12.4765625, -11.80224609375, -11.1279296875, -10.45361328125, -9.779296875, -9.10498046875, -8.4306640625, -7.75634765625, -7.08203125, -6.40771484375, -5.7333984375, -5.05908203125, -4.384765625, -3.71044921875, -3.0361328125, -2.36181640625, -1.6875, -1.01318359375, -0.3388671875, 0.33544921875, 1.009765625, 1.68408203125, 2.3583984375, 3.03271484375, 3.70703125, 4.38134765625, 5.0556640625, 5.72998046875, 6.404296875, 7.07861328125, 7.7529296875, 8.42724609375, 9.1015625, 9.77587890625, 10.4501953125, 11.12451171875, 11.798828125, 12.47314453125, 13.1474609375, 13.82177734375, 14.49609375, 15.17041015625, 15.8447265625, 16.51904296875, 17.193359375, 17.86767578125, 18.5419921875, 19.21630859375, 19.890625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 2.0, 8.0, 2.0, 11.0, 8.0, 14.0, 14.0, 17.0, 23.0, 22.0, 36.0, 39.0, 35.0, 38.0, 41.0, 30.0, 38.0, 42.0, 51.0, 50.0, 55.0, 48.0, 36.0, 55.0, 48.0, 34.0, 27.0, 27.0, 21.0, 28.0, 21.0, 16.0, 10.0, 14.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.21875, -40.083251953125, -38.94775390625, -37.812255859375, -36.6767578125, -35.541259765625, -34.40576171875, -33.270263671875, -32.134765625, -30.999267578125, -29.86376953125, -28.728271484375, -27.5927734375, -26.457275390625, -25.32177734375, -24.186279296875, -23.05078125, -21.915283203125, -20.77978515625, -19.644287109375, -18.5087890625, -17.373291015625, -16.23779296875, -15.102294921875, -13.966796875, -12.831298828125, -11.69580078125, -10.560302734375, -9.4248046875, -8.289306640625, -7.15380859375, -6.018310546875, -4.8828125, -3.747314453125, -2.61181640625, -1.476318359375, -0.3408203125, 0.794677734375, 1.93017578125, 3.065673828125, 4.201171875, 5.336669921875, 6.47216796875, 7.607666015625, 8.7431640625, 9.878662109375, 11.01416015625, 12.149658203125, 13.28515625, 14.420654296875, 15.55615234375, 16.691650390625, 17.8271484375, 18.962646484375, 20.09814453125, 21.233642578125, 22.369140625, 23.504638671875, 24.64013671875, 25.775634765625, 26.9111328125, 28.046630859375, 29.18212890625, 30.317626953125, 31.453125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 5.0, 12.0, 16.0, 19.0, 51.0, 74.0, 139.0, 255.0, 361.0, 613.0, 1042.0, 1680.0, 2818.0, 4466.0, 7043.0, 11308.0, 17089.0, 26159.0, 38851.0, 56725.0, 80220.0, 109626.0, 145421.0, 187978.0, 232273.0, 274289.0, 310978.0, 337015.0, 347707.0, 344481.0, 324428.0, 290703.0, 251013.0, 206104.0, 163533.0, 125435.0, 92873.0, 66214.0, 46195.0, 31440.0, 21149.0, 13412.0, 8858.0, 5475.0, 3413.0, 2156.0, 1231.0, 782.0, 460.0, 274.0, 196.0, 99.0, 58.0, 38.0, 23.0, 10.0, 3.0, 3.0, 1.0, 2.0], "bins": [-19.828125, -19.22216796875, -18.6162109375, -18.01025390625, -17.404296875, -16.79833984375, -16.1923828125, -15.58642578125, -14.98046875, -14.37451171875, -13.7685546875, -13.16259765625, -12.556640625, -11.95068359375, -11.3447265625, -10.73876953125, -10.1328125, -9.52685546875, -8.9208984375, -8.31494140625, -7.708984375, -7.10302734375, -6.4970703125, -5.89111328125, -5.28515625, -4.67919921875, -4.0732421875, -3.46728515625, -2.861328125, -2.25537109375, -1.6494140625, -1.04345703125, -0.4375, 0.16845703125, 0.7744140625, 1.38037109375, 1.986328125, 2.59228515625, 3.1982421875, 3.80419921875, 4.41015625, 5.01611328125, 5.6220703125, 6.22802734375, 6.833984375, 7.43994140625, 8.0458984375, 8.65185546875, 9.2578125, 9.86376953125, 10.4697265625, 11.07568359375, 11.681640625, 12.28759765625, 12.8935546875, 13.49951171875, 14.10546875, 14.71142578125, 15.3173828125, 15.92333984375, 16.529296875, 17.13525390625, 17.7412109375, 18.34716796875, 18.953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 12.0, 13.0, 22.0, 37.0, 37.0, 48.0, 53.0, 61.0, 71.0, 85.0, 88.0, 119.0, 114.0, 145.0, 133.0, 158.0, 156.0, 186.0, 182.0, 192.0, 206.0, 184.0, 183.0, 195.0, 183.0, 167.0, 125.0, 122.0, 116.0, 109.0, 99.0, 80.0, 77.0, 59.0, 46.0, 45.0, 37.0, 28.0, 16.0, 21.0, 16.0, 8.0, 6.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-12.34375, -11.936767578125, -11.52978515625, -11.122802734375, -10.7158203125, -10.308837890625, -9.90185546875, -9.494873046875, -9.087890625, -8.680908203125, -8.27392578125, -7.866943359375, -7.4599609375, -7.052978515625, -6.64599609375, -6.239013671875, -5.83203125, -5.425048828125, -5.01806640625, -4.611083984375, -4.2041015625, -3.797119140625, -3.39013671875, -2.983154296875, -2.576171875, -2.169189453125, -1.76220703125, -1.355224609375, -0.9482421875, -0.541259765625, -0.13427734375, 0.272705078125, 0.6796875, 1.086669921875, 1.49365234375, 1.900634765625, 2.3076171875, 2.714599609375, 3.12158203125, 3.528564453125, 3.935546875, 4.342529296875, 4.74951171875, 5.156494140625, 5.5634765625, 5.970458984375, 6.37744140625, 6.784423828125, 7.19140625, 7.598388671875, 8.00537109375, 8.412353515625, 8.8193359375, 9.226318359375, 9.63330078125, 10.040283203125, 10.447265625, 10.854248046875, 11.26123046875, 11.668212890625, 12.0751953125, 12.482177734375, 12.88916015625, 13.296142578125, 13.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 9.0, 7.0, 12.0, 15.0, 19.0, 18.0, 22.0, 21.0, 33.0, 37.0, 39.0, 34.0, 55.0, 44.0, 58.0, 60.0, 43.0, 49.0, 51.0, 39.0, 44.0, 46.0, 30.0, 29.0, 31.0, 21.0, 27.0, 20.0, 13.0, 13.0, 7.0, 10.0, 7.0, 13.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.40149688720703, -32.34184646606445, -31.28219223022461, -30.2225399017334, -29.162887573242188, -28.103235244750977, -27.043582916259766, -25.983932495117188, -24.924278259277344, -23.864625930786133, -22.804973602294922, -21.74532127380371, -20.6856689453125, -19.62601661682129, -18.566364288330078, -17.5067138671875, -16.44706153869629, -15.387409210205078, -14.327756881713867, -13.268104553222656, -12.208452224731445, -11.148799896240234, -10.08914852142334, -9.029496192932129, -7.969843864440918, -6.910191535949707, -5.850539207458496, -4.790887355804443, -3.7312350273132324, -2.6715826988220215, -1.6119308471679688, -0.5522785186767578, 0.5073738098144531, 1.5670260190963745, 2.626678228378296, 3.6863303184509277, 4.745982646942139, 5.80563497543335, 6.865286827087402, 7.924939155578613, 8.984591484069824, 10.044243812561035, 11.103896141052246, 12.16354751586914, 13.223199844360352, 14.282852172851562, 15.342504501342773, 16.402156829833984, 17.461809158325195, 18.521461486816406, 19.581113815307617, 20.640766143798828, 21.70041847229004, 22.76007080078125, 23.819721221923828, 24.879375457763672, 25.93902587890625, 26.99867820739746, 28.058330535888672, 29.117982864379883, 30.177635192871094, 31.237287521362305, 32.296939849853516, 33.356590270996094, 34.41624450683594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 12.0, 10.0, 12.0, 13.0, 22.0, 30.0, 15.0, 38.0, 45.0, 33.0, 42.0, 43.0, 40.0, 48.0, 39.0, 43.0, 46.0, 44.0, 44.0, 46.0, 49.0, 37.0, 36.0, 42.0, 22.0, 25.0, 14.0, 22.0, 15.0, 14.0, 12.0, 4.0, 7.0, 4.0, 9.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.51961898803711, -42.22698211669922, -40.93434143066406, -39.64170455932617, -38.349063873291016, -37.056427001953125, -35.76378631591797, -34.47114944458008, -33.17851257324219, -31.885873794555664, -30.59323501586914, -29.300596237182617, -28.007957458496094, -26.715320587158203, -25.42268180847168, -24.130043029785156, -22.83740234375, -21.544763565063477, -20.252124786376953, -18.95948600769043, -17.666847229003906, -16.374210357666016, -15.081571578979492, -13.788932800292969, -12.496294021606445, -11.203655242919922, -9.911016464233398, -8.618378639221191, -7.325739860534668, -6.0331010818481445, -4.740462779998779, -3.447824478149414, -2.155181884765625, -0.8625433444976807, 0.43009519577026367, 1.722733736038208, 3.0153722763061523, 4.308011054992676, 5.600649356842041, 6.893287658691406, 8.18592643737793, 9.478565216064453, 10.771203994750977, 12.063841819763184, 13.356480598449707, 14.64911937713623, 15.941757202148438, 17.23439598083496, 18.527034759521484, 19.819673538208008, 21.11231231689453, 22.404951095581055, 23.697589874267578, 24.99022674560547, 26.282865524291992, 27.575504302978516, 28.86814308166504, 30.160781860351562, 31.453420639038086, 32.74605941772461, 34.0386962890625, 35.331336975097656, 36.62397384643555, 37.91661071777344, 39.209251403808594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 8.0, 15.0, 19.0, 22.0, 36.0, 46.0, 64.0, 97.0, 144.0, 166.0, 240.0, 338.0, 489.0, 677.0, 1003.0, 1510.0, 2622.0, 4421.0, 8797.0, 21597.0, 63132.0, 219035.0, 445126.0, 186020.0, 54377.0, 19228.0, 8051.0, 4048.0, 2470.0, 1497.0, 976.0, 693.0, 435.0, 335.0, 189.0, 186.0, 130.0, 81.0, 68.0, 39.0, 31.0, 39.0, 13.0, 11.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.8291015625, -18.189453125, -17.5498046875, -16.91015625, -16.2705078125, -15.630859375, -14.9912109375, -14.3515625, -13.7119140625, -13.072265625, -12.4326171875, -11.79296875, -11.1533203125, -10.513671875, -9.8740234375, -9.234375, -8.5947265625, -7.955078125, -7.3154296875, -6.67578125, -6.0361328125, -5.396484375, -4.7568359375, -4.1171875, -3.4775390625, -2.837890625, -2.1982421875, -1.55859375, -0.9189453125, -0.279296875, 0.3603515625, 1.0, 1.6396484375, 2.279296875, 2.9189453125, 3.55859375, 4.1982421875, 4.837890625, 5.4775390625, 6.1171875, 6.7568359375, 7.396484375, 8.0361328125, 8.67578125, 9.3154296875, 9.955078125, 10.5947265625, 11.234375, 11.8740234375, 12.513671875, 13.1533203125, 13.79296875, 14.4326171875, 15.072265625, 15.7119140625, 16.3515625, 16.9912109375, 17.630859375, 18.2705078125, 18.91015625, 19.5498046875, 20.189453125, 20.8291015625, 21.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 10.0, 11.0, 13.0, 23.0, 30.0, 17.0, 35.0, 46.0, 35.0, 40.0, 43.0, 43.0, 45.0, 38.0, 48.0, 43.0, 43.0, 43.0, 46.0, 50.0, 38.0, 36.0, 40.0, 24.0, 24.0, 14.0, 21.0, 15.0, 14.0, 12.0, 4.0, 7.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.53125, -42.240234375, -40.94921875, -39.658203125, -38.3671875, -37.076171875, -35.78515625, -34.494140625, -33.203125, -31.912109375, -30.62109375, -29.330078125, -28.0390625, -26.748046875, -25.45703125, -24.166015625, -22.875, -21.583984375, -20.29296875, -19.001953125, -17.7109375, -16.419921875, -15.12890625, -13.837890625, -12.546875, -11.255859375, -9.96484375, -8.673828125, -7.3828125, -6.091796875, -4.80078125, -3.509765625, -2.21875, -0.927734375, 0.36328125, 1.654296875, 2.9453125, 4.236328125, 5.52734375, 6.818359375, 8.109375, 9.400390625, 10.69140625, 11.982421875, 13.2734375, 14.564453125, 15.85546875, 17.146484375, 18.4375, 19.728515625, 21.01953125, 22.310546875, 23.6015625, 24.892578125, 26.18359375, 27.474609375, 28.765625, 30.056640625, 31.34765625, 32.638671875, 33.9296875, 35.220703125, 36.51171875, 37.802734375, 39.09375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 14.0, 15.0, 18.0, 31.0, 37.0, 39.0, 62.0, 89.0, 107.0, 151.0, 233.0, 348.0, 581.0, 935.0, 1702.0, 3449.0, 9174.0, 34371.0, 307696.0, 603326.0, 62802.0, 13496.0, 4556.0, 2164.0, 1116.0, 667.0, 425.0, 286.0, 187.0, 131.0, 93.0, 64.0, 59.0, 27.0, 21.0, 22.0, 17.0, 13.0, 5.0, 10.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.890625, -27.0234375, -26.15625, -25.2890625, -24.421875, -23.5546875, -22.6875, -21.8203125, -20.953125, -20.0859375, -19.21875, -18.3515625, -17.484375, -16.6171875, -15.75, -14.8828125, -14.015625, -13.1484375, -12.28125, -11.4140625, -10.546875, -9.6796875, -8.8125, -7.9453125, -7.078125, -6.2109375, -5.34375, -4.4765625, -3.609375, -2.7421875, -1.875, -1.0078125, -0.140625, 0.7265625, 1.59375, 2.4609375, 3.328125, 4.1953125, 5.0625, 5.9296875, 6.796875, 7.6640625, 8.53125, 9.3984375, 10.265625, 11.1328125, 12.0, 12.8671875, 13.734375, 14.6015625, 15.46875, 16.3359375, 17.203125, 18.0703125, 18.9375, 19.8046875, 20.671875, 21.5390625, 22.40625, 23.2734375, 24.140625, 25.0078125, 25.875, 26.7421875, 27.609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 10.0, 13.0, 4.0, 9.0, 18.0, 18.0, 19.0, 26.0, 22.0, 25.0, 29.0, 30.0, 32.0, 41.0, 48.0, 49.0, 43.0, 42.0, 49.0, 47.0, 50.0, 40.0, 38.0, 37.0, 28.0, 23.0, 32.0, 28.0, 25.0, 20.0, 18.0, 8.0, 18.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.90625, -24.0078125, -23.109375, -22.2109375, -21.3125, -20.4140625, -19.515625, -18.6171875, -17.71875, -16.8203125, -15.921875, -15.0234375, -14.125, -13.2265625, -12.328125, -11.4296875, -10.53125, -9.6328125, -8.734375, -7.8359375, -6.9375, -6.0390625, -5.140625, -4.2421875, -3.34375, -2.4453125, -1.546875, -0.6484375, 0.25, 1.1484375, 2.046875, 2.9453125, 3.84375, 4.7421875, 5.640625, 6.5390625, 7.4375, 8.3359375, 9.234375, 10.1328125, 11.03125, 11.9296875, 12.828125, 13.7265625, 14.625, 15.5234375, 16.421875, 17.3203125, 18.21875, 19.1171875, 20.015625, 20.9140625, 21.8125, 22.7109375, 23.609375, 24.5078125, 25.40625, 26.3046875, 27.203125, 28.1015625, 29.0, 29.8984375, 30.796875, 31.6953125, 32.59375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 4.0, 9.0, 10.0, 14.0, 9.0, 27.0, 40.0, 39.0, 56.0, 61.0, 82.0, 114.0, 126.0, 189.0, 265.0, 329.0, 497.0, 686.0, 1165.0, 1895.0, 4017.0, 10024.0, 40240.0, 558164.0, 379810.0, 32852.0, 8826.0, 3624.0, 1866.0, 1040.0, 645.0, 480.0, 314.0, 233.0, 189.0, 154.0, 104.0, 87.0, 59.0, 47.0, 37.0, 28.0, 28.0, 24.0, 13.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.2918701171875, -14.763427734375, -14.2349853515625, -13.70654296875, -13.1781005859375, -12.649658203125, -12.1212158203125, -11.5927734375, -11.0643310546875, -10.535888671875, -10.0074462890625, -9.47900390625, -8.9505615234375, -8.422119140625, -7.8936767578125, -7.365234375, -6.8367919921875, -6.308349609375, -5.7799072265625, -5.25146484375, -4.7230224609375, -4.194580078125, -3.6661376953125, -3.1376953125, -2.6092529296875, -2.080810546875, -1.5523681640625, -1.02392578125, -0.4954833984375, 0.032958984375, 0.5614013671875, 1.08984375, 1.6182861328125, 2.146728515625, 2.6751708984375, 3.20361328125, 3.7320556640625, 4.260498046875, 4.7889404296875, 5.3173828125, 5.8458251953125, 6.374267578125, 6.9027099609375, 7.43115234375, 7.9595947265625, 8.488037109375, 9.0164794921875, 9.544921875, 10.0733642578125, 10.601806640625, 11.1302490234375, 11.65869140625, 12.1871337890625, 12.715576171875, 13.2440185546875, 13.7724609375, 14.3009033203125, 14.829345703125, 15.3577880859375, 15.88623046875, 16.4146728515625, 16.943115234375, 17.4715576171875, 18.0]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 12.0, 20.0, 37.0, 51.0, 73.0, 105.0, 151.0, 134.0, 135.0, 90.0, 53.0, 39.0, 30.0, 21.0, 9.0, 6.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008521080017089844, -0.0008221343159675598, -0.0007921606302261353, -0.0007621869444847107, -0.0007322132587432861, -0.0007022395730018616, -0.000672265887260437, -0.0006422922015190125, -0.0006123185157775879, -0.0005823448300361633, -0.0005523711442947388, -0.0005223974585533142, -0.0004924237728118896, -0.0004624500870704651, -0.00043247640132904053, -0.00040250271558761597, -0.0003725290298461914, -0.00034255534410476685, -0.0003125816583633423, -0.0002826079726219177, -0.00025263428688049316, -0.0002226606011390686, -0.00019268691539764404, -0.00016271322965621948, -0.00013273954391479492, -0.00010276585817337036, -7.27921724319458e-05, -4.281848669052124e-05, -1.284480094909668e-05, 1.712888479232788e-05, 4.710257053375244e-05, 7.7076256275177e-05, 0.00010704994201660156, 0.00013702362775802612, 0.00016699731349945068, 0.00019697099924087524, 0.0002269446849822998, 0.00025691837072372437, 0.0002868920564651489, 0.0003168657422065735, 0.00034683942794799805, 0.0003768131136894226, 0.00040678679943084717, 0.00043676048517227173, 0.0004667341709136963, 0.0004967078566551208, 0.0005266815423965454, 0.00055665522813797, 0.0005866289138793945, 0.0006166025996208191, 0.0006465762853622437, 0.0006765499711036682, 0.0007065236568450928, 0.0007364973425865173, 0.0007664710283279419, 0.0007964447140693665, 0.000826418399810791, 0.0008563920855522156, 0.0008863657712936401, 0.0009163394570350647, 0.0009463131427764893, 0.0009762868285179138, 0.0010062605142593384, 0.001036234200000763, 0.0010662078857421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 10.0, 6.0, 11.0, 19.0, 21.0, 18.0, 39.0, 62.0, 79.0, 92.0, 151.0, 183.0, 256.0, 359.0, 476.0, 674.0, 841.0, 1193.0, 1773.0, 2612.0, 3942.0, 6594.0, 12129.0, 24370.0, 54769.0, 131246.0, 293908.0, 283574.0, 123946.0, 51831.0, 23147.0, 11498.0, 6431.0, 3730.0, 2474.0, 1660.0, 1168.0, 868.0, 603.0, 486.0, 343.0, 289.0, 195.0, 129.0, 110.0, 66.0, 61.0, 37.0, 30.0, 11.0, 14.0, 15.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.890625, -8.603515625, -8.31640625, -8.029296875, -7.7421875, -7.455078125, -7.16796875, -6.880859375, -6.59375, -6.306640625, -6.01953125, -5.732421875, -5.4453125, -5.158203125, -4.87109375, -4.583984375, -4.296875, -4.009765625, -3.72265625, -3.435546875, -3.1484375, -2.861328125, -2.57421875, -2.287109375, -2.0, -1.712890625, -1.42578125, -1.138671875, -0.8515625, -0.564453125, -0.27734375, 0.009765625, 0.296875, 0.583984375, 0.87109375, 1.158203125, 1.4453125, 1.732421875, 2.01953125, 2.306640625, 2.59375, 2.880859375, 3.16796875, 3.455078125, 3.7421875, 4.029296875, 4.31640625, 4.603515625, 4.890625, 5.177734375, 5.46484375, 5.751953125, 6.0390625, 6.326171875, 6.61328125, 6.900390625, 7.1875, 7.474609375, 7.76171875, 8.048828125, 8.3359375, 8.623046875, 8.91015625, 9.197265625, 9.484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 9.0, 11.0, 15.0, 27.0, 31.0, 48.0, 60.0, 59.0, 69.0, 153.0, 149.0, 85.0, 62.0, 56.0, 38.0, 37.0, 23.0, 15.0, 16.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.328125, -6.15692138671875, -5.9857177734375, -5.81451416015625, -5.643310546875, -5.47210693359375, -5.3009033203125, -5.12969970703125, -4.95849609375, -4.78729248046875, -4.6160888671875, -4.44488525390625, -4.273681640625, -4.10247802734375, -3.9312744140625, -3.76007080078125, -3.5888671875, -3.41766357421875, -3.2464599609375, -3.07525634765625, -2.904052734375, -2.73284912109375, -2.5616455078125, -2.39044189453125, -2.21923828125, -2.04803466796875, -1.8768310546875, -1.70562744140625, -1.534423828125, -1.36322021484375, -1.1920166015625, -1.02081298828125, -0.849609375, -0.67840576171875, -0.5072021484375, -0.33599853515625, -0.164794921875, 0.00640869140625, 0.1776123046875, 0.34881591796875, 0.52001953125, 0.69122314453125, 0.8624267578125, 1.03363037109375, 1.204833984375, 1.37603759765625, 1.5472412109375, 1.71844482421875, 1.8896484375, 2.06085205078125, 2.2320556640625, 2.40325927734375, 2.574462890625, 2.74566650390625, 2.9168701171875, 3.08807373046875, 3.25927734375, 3.43048095703125, 3.6016845703125, 3.77288818359375, 3.944091796875, 4.11529541015625, 4.2864990234375, 4.45770263671875, 4.62890625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 5.0, 10.0, 14.0, 15.0, 20.0, 20.0, 23.0, 31.0, 30.0, 31.0, 52.0, 44.0, 43.0, 52.0, 49.0, 41.0, 60.0, 54.0, 55.0, 32.0, 36.0, 41.0, 32.0, 21.0, 37.0, 25.0, 17.0, 18.0, 15.0, 12.0, 10.0, 7.0, 6.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.68431854248047, -32.63035583496094, -31.57638931274414, -30.522424697875977, -29.468460083007812, -28.41449737548828, -27.360532760620117, -26.306568145751953, -25.25260353088379, -24.198638916015625, -23.14467430114746, -22.090709686279297, -21.036746978759766, -19.98278045654297, -18.928817749023438, -17.874853134155273, -16.82088851928711, -15.766923904418945, -14.712959289550781, -13.658995628356934, -12.60503101348877, -11.551066398620605, -10.497102737426758, -9.443138122558594, -8.38917350769043, -7.335208892822266, -6.28124475479126, -5.227280616760254, -4.17331600189209, -3.119351387023926, -2.06538724899292, -1.011423110961914, 0.042537689208984375, 1.0965020656585693, 2.1504664421081543, 3.2044308185577393, 4.258395195007324, 5.312359809875488, 6.366323947906494, 7.4202880859375, 8.474252700805664, 9.528217315673828, 10.582181930541992, 11.63614559173584, 12.690110206604004, 13.744074821472168, 14.798038482666016, 15.85200309753418, 16.905967712402344, 17.959932327270508, 19.013896942138672, 20.067861557006836, 21.121826171875, 22.17578887939453, 23.229753494262695, 24.28371810913086, 25.337682723999023, 26.391647338867188, 27.44561195373535, 28.499576568603516, 29.553539276123047, 30.607505798339844, 31.661468505859375, 32.715431213378906, 33.7693977355957]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 15.0, 9.0, 11.0, 23.0, 20.0, 32.0, 23.0, 33.0, 44.0, 43.0, 34.0, 48.0, 43.0, 45.0, 42.0, 59.0, 36.0, 45.0, 43.0, 43.0, 48.0, 32.0, 36.0, 40.0, 20.0, 24.0, 12.0, 16.0, 12.0, 13.0, 7.0, 7.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.84357452392578, -43.52841567993164, -42.213253021240234, -40.898094177246094, -39.58293533325195, -38.26777648925781, -36.952613830566406, -35.637454986572266, -34.322296142578125, -33.007137298583984, -31.69197654724121, -30.376815795898438, -29.061656951904297, -27.746496200561523, -26.43133544921875, -25.11617660522461, -23.801015853881836, -22.485855102539062, -21.170696258544922, -19.85553550720215, -18.540376663208008, -17.225215911865234, -15.910056114196777, -14.59489631652832, -13.279736518859863, -11.964576721191406, -10.64941692352295, -9.334257125854492, -8.019096374511719, -6.70393705368042, -5.388776779174805, -4.073616981506348, -2.7584571838378906, -1.443297266960144, -0.12813735008239746, 1.1870226860046387, 2.5021824836730957, 3.8173422813415527, 5.132502555847168, 6.447662353515625, 7.762822151184082, 9.077981948852539, 10.393141746520996, 11.708301544189453, 13.023462295532227, 14.338621139526367, 15.65378189086914, 16.96894073486328, 18.284101486206055, 19.599262237548828, 20.91442108154297, 22.229581832885742, 23.544740676879883, 24.859901428222656, 26.175060272216797, 27.49022102355957, 28.805381774902344, 30.120542526245117, 31.435701370239258, 32.75086212158203, 34.06602096557617, 35.38117980957031, 36.69634246826172, 38.01150131225586, 39.32666015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 19.0, 12.0, 44.0, 50.0, 98.0, 127.0, 186.0, 313.0, 565.0, 833.0, 1352.0, 2068.0, 3258.0, 4937.0, 7578.0, 11304.0, 16280.0, 23088.0, 32242.0, 42883.0, 54693.0, 67209.0, 79356.0, 88280.0, 92939.0, 92608.0, 87716.0, 78290.0, 66401.0, 53361.0, 41431.0, 30450.0, 22122.0, 15497.0, 10602.0, 7200.0, 4858.0, 3005.0, 1940.0, 1229.0, 848.0, 424.0, 315.0, 186.0, 141.0, 78.0, 57.0, 28.0, 20.0, 8.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.70751953125, -16.1494140625, -15.59130859375, -15.033203125, -14.47509765625, -13.9169921875, -13.35888671875, -12.80078125, -12.24267578125, -11.6845703125, -11.12646484375, -10.568359375, -10.01025390625, -9.4521484375, -8.89404296875, -8.3359375, -7.77783203125, -7.2197265625, -6.66162109375, -6.103515625, -5.54541015625, -4.9873046875, -4.42919921875, -3.87109375, -3.31298828125, -2.7548828125, -2.19677734375, -1.638671875, -1.08056640625, -0.5224609375, 0.03564453125, 0.59375, 1.15185546875, 1.7099609375, 2.26806640625, 2.826171875, 3.38427734375, 3.9423828125, 4.50048828125, 5.05859375, 5.61669921875, 6.1748046875, 6.73291015625, 7.291015625, 7.84912109375, 8.4072265625, 8.96533203125, 9.5234375, 10.08154296875, 10.6396484375, 11.19775390625, 11.755859375, 12.31396484375, 12.8720703125, 13.43017578125, 13.98828125, 14.54638671875, 15.1044921875, 15.66259765625, 16.220703125, 16.77880859375, 17.3369140625, 17.89501953125, 18.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 13.0, 11.0, 10.0, 20.0, 23.0, 31.0, 21.0, 34.0, 42.0, 41.0, 36.0, 46.0, 46.0, 41.0, 44.0, 55.0, 43.0, 43.0, 40.0, 43.0, 49.0, 30.0, 40.0, 38.0, 24.0, 23.0, 12.0, 17.0, 13.0, 13.0, 8.0, 7.0, 10.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.78125, -42.5029296875, -41.224609375, -39.9462890625, -38.66796875, -37.3896484375, -36.111328125, -34.8330078125, -33.5546875, -32.2763671875, -30.998046875, -29.7197265625, -28.44140625, -27.1630859375, -25.884765625, -24.6064453125, -23.328125, -22.0498046875, -20.771484375, -19.4931640625, -18.21484375, -16.9365234375, -15.658203125, -14.3798828125, -13.1015625, -11.8232421875, -10.544921875, -9.2666015625, -7.98828125, -6.7099609375, -5.431640625, -4.1533203125, -2.875, -1.5966796875, -0.318359375, 0.9599609375, 2.23828125, 3.5166015625, 4.794921875, 6.0732421875, 7.3515625, 8.6298828125, 9.908203125, 11.1865234375, 12.46484375, 13.7431640625, 15.021484375, 16.2998046875, 17.578125, 18.8564453125, 20.134765625, 21.4130859375, 22.69140625, 23.9697265625, 25.248046875, 26.5263671875, 27.8046875, 29.0830078125, 30.361328125, 31.6396484375, 32.91796875, 34.1962890625, 35.474609375, 36.7529296875, 38.03125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 21.0, 33.0, 48.0, 81.0, 113.0, 195.0, 329.0, 486.0, 809.0, 1296.0, 2089.0, 3325.0, 5277.0, 8230.0, 12618.0, 18849.0, 27369.0, 38832.0, 52106.0, 66585.0, 81004.0, 93599.0, 100744.0, 101020.0, 95705.0, 83973.0, 69686.0, 54832.0, 41197.0, 29508.0, 20332.0, 13526.0, 9023.0, 5828.0, 3720.0, 2296.0, 1446.0, 904.0, 593.0, 328.0, 237.0, 142.0, 69.0, 46.0, 38.0, 25.0, 9.0, 5.0, 5.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-18.703125, -18.081787109375, -17.46044921875, -16.839111328125, -16.2177734375, -15.596435546875, -14.97509765625, -14.353759765625, -13.732421875, -13.111083984375, -12.48974609375, -11.868408203125, -11.2470703125, -10.625732421875, -10.00439453125, -9.383056640625, -8.76171875, -8.140380859375, -7.51904296875, -6.897705078125, -6.2763671875, -5.655029296875, -5.03369140625, -4.412353515625, -3.791015625, -3.169677734375, -2.54833984375, -1.927001953125, -1.3056640625, -0.684326171875, -0.06298828125, 0.558349609375, 1.1796875, 1.801025390625, 2.42236328125, 3.043701171875, 3.6650390625, 4.286376953125, 4.90771484375, 5.529052734375, 6.150390625, 6.771728515625, 7.39306640625, 8.014404296875, 8.6357421875, 9.257080078125, 9.87841796875, 10.499755859375, 11.12109375, 11.742431640625, 12.36376953125, 12.985107421875, 13.6064453125, 14.227783203125, 14.84912109375, 15.470458984375, 16.091796875, 16.713134765625, 17.33447265625, 17.955810546875, 18.5771484375, 19.198486328125, 19.81982421875, 20.441162109375, 21.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 6.0, 4.0, 6.0, 11.0, 15.0, 12.0, 19.0, 17.0, 23.0, 25.0, 31.0, 31.0, 28.0, 39.0, 31.0, 36.0, 34.0, 44.0, 35.0, 43.0, 38.0, 48.0, 41.0, 43.0, 38.0, 34.0, 22.0, 21.0, 28.0, 25.0, 32.0, 20.0, 24.0, 15.0, 12.0, 20.0, 13.0, 7.0, 3.0, 12.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.6533203125, -20.947265625, -20.2412109375, -19.53515625, -18.8291015625, -18.123046875, -17.4169921875, -16.7109375, -16.0048828125, -15.298828125, -14.5927734375, -13.88671875, -13.1806640625, -12.474609375, -11.7685546875, -11.0625, -10.3564453125, -9.650390625, -8.9443359375, -8.23828125, -7.5322265625, -6.826171875, -6.1201171875, -5.4140625, -4.7080078125, -4.001953125, -3.2958984375, -2.58984375, -1.8837890625, -1.177734375, -0.4716796875, 0.234375, 0.9404296875, 1.646484375, 2.3525390625, 3.05859375, 3.7646484375, 4.470703125, 5.1767578125, 5.8828125, 6.5888671875, 7.294921875, 8.0009765625, 8.70703125, 9.4130859375, 10.119140625, 10.8251953125, 11.53125, 12.2373046875, 12.943359375, 13.6494140625, 14.35546875, 15.0615234375, 15.767578125, 16.4736328125, 17.1796875, 17.8857421875, 18.591796875, 19.2978515625, 20.00390625, 20.7099609375, 21.416015625, 22.1220703125, 22.828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 13.0, 19.0, 27.0, 25.0, 55.0, 96.0, 124.0, 215.0, 378.0, 640.0, 1219.0, 2273.0, 4134.0, 7654.0, 13905.0, 24412.0, 41278.0, 65792.0, 95277.0, 124407.0, 142207.0, 142630.0, 124006.0, 95602.0, 65813.0, 41619.0, 24481.0, 13662.0, 7539.0, 4051.0, 2211.0, 1221.0, 641.0, 369.0, 214.0, 138.0, 72.0, 46.0, 30.0, 20.0, 9.0, 4.0, 6.0, 10.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.1796875, -11.8316650390625, -11.483642578125, -11.1356201171875, -10.78759765625, -10.4395751953125, -10.091552734375, -9.7435302734375, -9.3955078125, -9.0474853515625, -8.699462890625, -8.3514404296875, -8.00341796875, -7.6553955078125, -7.307373046875, -6.9593505859375, -6.611328125, -6.2633056640625, -5.915283203125, -5.5672607421875, -5.21923828125, -4.8712158203125, -4.523193359375, -4.1751708984375, -3.8271484375, -3.4791259765625, -3.131103515625, -2.7830810546875, -2.43505859375, -2.0870361328125, -1.739013671875, -1.3909912109375, -1.04296875, -0.6949462890625, -0.346923828125, 0.0010986328125, 0.34912109375, 0.6971435546875, 1.045166015625, 1.3931884765625, 1.7412109375, 2.0892333984375, 2.437255859375, 2.7852783203125, 3.13330078125, 3.4813232421875, 3.829345703125, 4.1773681640625, 4.525390625, 4.8734130859375, 5.221435546875, 5.5694580078125, 5.91748046875, 6.2655029296875, 6.613525390625, 6.9615478515625, 7.3095703125, 7.6575927734375, 8.005615234375, 8.3536376953125, 8.70166015625, 9.0496826171875, 9.397705078125, 9.7457275390625, 10.09375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 6.0, 11.0, 11.0, 10.0, 19.0, 18.0, 19.0, 30.0, 24.0, 43.0, 44.0, 43.0, 44.0, 47.0, 69.0, 48.0, 69.0, 59.0, 66.0, 43.0, 37.0, 33.0, 35.0, 32.0, 26.0, 22.0, 21.0, 15.0, 17.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010508894920349121, -0.0010107755661010742, -0.0009706616401672363, -0.0009305477142333984, -0.0008904337882995605, -0.0008503198623657227, -0.0008102059364318848, -0.0007700920104980469, -0.000729978084564209, -0.0006898641586303711, -0.0006497502326965332, -0.0006096363067626953, -0.0005695223808288574, -0.0005294084548950195, -0.0004892945289611816, -0.00044918060302734375, -0.00040906667709350586, -0.00036895275115966797, -0.0003288388252258301, -0.0002887248992919922, -0.0002486109733581543, -0.0002084970474243164, -0.00016838312149047852, -0.00012826919555664062, -8.815526962280273e-05, -4.8041343688964844e-05, -7.927417755126953e-06, 3.218650817871094e-05, 7.230043411254883e-05, 0.00011241436004638672, 0.0001525282859802246, 0.0001926422119140625, 0.0002327561378479004, 0.0002728700637817383, 0.00031298398971557617, 0.00035309791564941406, 0.00039321184158325195, 0.00043332576751708984, 0.00047343969345092773, 0.0005135536193847656, 0.0005536675453186035, 0.0005937814712524414, 0.0006338953971862793, 0.0006740093231201172, 0.0007141232490539551, 0.000754237174987793, 0.0007943511009216309, 0.0008344650268554688, 0.0008745789527893066, 0.0009146928787231445, 0.0009548068046569824, 0.0009949207305908203, 0.0010350346565246582, 0.001075148582458496, 0.001115262508392334, 0.0011553764343261719, 0.0011954903602600098, 0.0012356042861938477, 0.0012757182121276855, 0.0013158321380615234, 0.0013559460639953613, 0.0013960599899291992, 0.0014361739158630371, 0.001476287841796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 18.0, 19.0, 37.0, 64.0, 97.0, 144.0, 214.0, 337.0, 542.0, 864.0, 1394.0, 2148.0, 3318.0, 5612.0, 8785.0, 14112.0, 21853.0, 33561.0, 49338.0, 69093.0, 91764.0, 110991.0, 121402.0, 120411.0, 107402.0, 87650.0, 66045.0, 46105.0, 31083.0, 20339.0, 12523.0, 7816.0, 5037.0, 3010.0, 1963.0, 1306.0, 788.0, 485.0, 325.0, 180.0, 118.0, 92.0, 67.0, 31.0, 20.0, 20.0, 9.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-11.265625, -10.933349609375, -10.60107421875, -10.268798828125, -9.9365234375, -9.604248046875, -9.27197265625, -8.939697265625, -8.607421875, -8.275146484375, -7.94287109375, -7.610595703125, -7.2783203125, -6.946044921875, -6.61376953125, -6.281494140625, -5.94921875, -5.616943359375, -5.28466796875, -4.952392578125, -4.6201171875, -4.287841796875, -3.95556640625, -3.623291015625, -3.291015625, -2.958740234375, -2.62646484375, -2.294189453125, -1.9619140625, -1.629638671875, -1.29736328125, -0.965087890625, -0.6328125, -0.300537109375, 0.03173828125, 0.364013671875, 0.6962890625, 1.028564453125, 1.36083984375, 1.693115234375, 2.025390625, 2.357666015625, 2.68994140625, 3.022216796875, 3.3544921875, 3.686767578125, 4.01904296875, 4.351318359375, 4.68359375, 5.015869140625, 5.34814453125, 5.680419921875, 6.0126953125, 6.344970703125, 6.67724609375, 7.009521484375, 7.341796875, 7.674072265625, 8.00634765625, 8.338623046875, 8.6708984375, 9.003173828125, 9.33544921875, 9.667724609375, 10.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 5.0, 14.0, 11.0, 19.0, 34.0, 29.0, 36.0, 45.0, 49.0, 43.0, 58.0, 76.0, 73.0, 63.0, 91.0, 56.0, 67.0, 46.0, 41.0, 29.0, 28.0, 24.0, 14.0, 6.0, 9.0, 6.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.742919921875, -8.49365234375, -8.244384765625, -7.9951171875, -7.745849609375, -7.49658203125, -7.247314453125, -6.998046875, -6.748779296875, -6.49951171875, -6.250244140625, -6.0009765625, -5.751708984375, -5.50244140625, -5.253173828125, -5.00390625, -4.754638671875, -4.50537109375, -4.256103515625, -4.0068359375, -3.757568359375, -3.50830078125, -3.259033203125, -3.009765625, -2.760498046875, -2.51123046875, -2.261962890625, -2.0126953125, -1.763427734375, -1.51416015625, -1.264892578125, -1.015625, -0.766357421875, -0.51708984375, -0.267822265625, -0.0185546875, 0.230712890625, 0.47998046875, 0.729248046875, 0.978515625, 1.227783203125, 1.47705078125, 1.726318359375, 1.9755859375, 2.224853515625, 2.47412109375, 2.723388671875, 2.97265625, 3.221923828125, 3.47119140625, 3.720458984375, 3.9697265625, 4.218994140625, 4.46826171875, 4.717529296875, 4.966796875, 5.216064453125, 5.46533203125, 5.714599609375, 5.9638671875, 6.213134765625, 6.46240234375, 6.711669921875, 6.9609375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 5.0, 10.0, 13.0, 8.0, 9.0, 6.0, 23.0, 23.0, 22.0, 25.0, 36.0, 31.0, 41.0, 44.0, 44.0, 38.0, 49.0, 44.0, 40.0, 39.0, 44.0, 44.0, 27.0, 41.0, 30.0, 28.0, 29.0, 24.0, 28.0, 18.0, 15.0, 18.0, 15.0, 14.0, 13.0, 7.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.403156280517578, -27.485095977783203, -26.56703758239746, -25.648977279663086, -24.73091697692871, -23.81285858154297, -22.894798278808594, -21.97673797607422, -21.058677673339844, -20.14061737060547, -19.222558975219727, -18.30449867248535, -17.386438369750977, -16.468379974365234, -15.55031967163086, -14.632259368896484, -13.714200973510742, -12.796141624450684, -11.878081321716309, -10.96002197265625, -10.041961669921875, -9.123902320861816, -8.205842971801758, -7.287783145904541, -6.369723320007324, -5.451663494110107, -4.533603668212891, -3.615544319152832, -2.6974844932556152, -1.7794246673583984, -0.8613653182983398, 0.05669450759887695, 0.9747543334960938, 1.892814040184021, 2.8108737468719482, 3.728933334350586, 4.646993160247803, 5.5650529861450195, 6.483112335205078, 7.401172161102295, 8.319231986999512, 9.23729133605957, 10.155351638793945, 11.073410987854004, 11.991470336914062, 12.909530639648438, 13.827589988708496, 14.745649337768555, 15.66370964050293, 16.581769943237305, 17.499828338623047, 18.417888641357422, 19.335948944091797, 20.254009246826172, 21.172067642211914, 22.09012794494629, 23.00818634033203, 23.926246643066406, 24.84430503845215, 25.762365341186523, 26.6804256439209, 27.59848403930664, 28.516544342041016, 29.43460464477539, 30.352664947509766]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 17.0, 15.0, 20.0, 23.0, 27.0, 33.0, 37.0, 35.0, 40.0, 44.0, 55.0, 48.0, 34.0, 32.0, 46.0, 49.0, 50.0, 38.0, 44.0, 28.0, 40.0, 29.0, 29.0, 19.0, 25.0, 22.0, 13.0, 12.0, 8.0, 11.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-42.07172775268555, -40.781211853027344, -39.490692138671875, -38.20017623901367, -36.9096565246582, -35.619140625, -34.32862091064453, -33.03810501098633, -31.74758529663086, -30.457067489624023, -29.166549682617188, -27.87603187561035, -26.585514068603516, -25.29499626159668, -24.004478454589844, -22.71396255493164, -21.423444747924805, -20.13292694091797, -18.842409133911133, -17.551891326904297, -16.26137351989746, -14.970855712890625, -13.680338859558105, -12.38982105255127, -11.099303245544434, -9.808785438537598, -8.518267631530762, -7.227750301361084, -5.937232494354248, -4.646714687347412, -3.3561973571777344, -2.0656795501708984, -0.7751617431640625, 0.5153559446334839, 1.8058736324310303, 3.096391201019287, 4.386909008026123, 5.677426815032959, 6.967944145202637, 8.258461952209473, 9.548979759216309, 10.839497566223145, 12.13001537322998, 13.4205322265625, 14.711050033569336, 16.001567840576172, 17.292085647583008, 18.582603454589844, 19.87312126159668, 21.163639068603516, 22.45415687561035, 23.744674682617188, 25.035192489624023, 26.32571029663086, 27.616226196289062, 28.90674591064453, 30.197261810302734, 31.48777961730957, 32.778297424316406, 34.06881332397461, 35.35933303833008, 36.64984893798828, 37.94036865234375, 39.23088455200195, 40.52140426635742]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 13.0, 13.0, 32.0, 50.0, 69.0, 133.0, 205.0, 292.0, 511.0, 839.0, 1286.0, 2013.0, 3226.0, 4913.0, 7773.0, 12079.0, 18168.0, 27549.0, 40901.0, 58639.0, 83686.0, 116639.0, 156798.0, 202917.0, 253096.0, 301598.0, 339240.0, 366454.0, 369805.0, 355875.0, 322935.0, 278637.0, 228143.0, 180990.0, 136861.0, 100285.0, 71694.0, 50035.0, 33865.0, 22780.0, 15298.0, 10012.0, 6429.0, 4264.0, 2592.0, 1714.0, 1078.0, 701.0, 434.0, 275.0, 173.0, 101.0, 79.0, 39.0, 26.0, 18.0, 6.0, 4.0, 2.0, 2.0, 3.0], "bins": [-19.0625, -18.452880859375, -17.84326171875, -17.233642578125, -16.6240234375, -16.014404296875, -15.40478515625, -14.795166015625, -14.185546875, -13.575927734375, -12.96630859375, -12.356689453125, -11.7470703125, -11.137451171875, -10.52783203125, -9.918212890625, -9.30859375, -8.698974609375, -8.08935546875, -7.479736328125, -6.8701171875, -6.260498046875, -5.65087890625, -5.041259765625, -4.431640625, -3.822021484375, -3.21240234375, -2.602783203125, -1.9931640625, -1.383544921875, -0.77392578125, -0.164306640625, 0.4453125, 1.054931640625, 1.66455078125, 2.274169921875, 2.8837890625, 3.493408203125, 4.10302734375, 4.712646484375, 5.322265625, 5.931884765625, 6.54150390625, 7.151123046875, 7.7607421875, 8.370361328125, 8.97998046875, 9.589599609375, 10.19921875, 10.808837890625, 11.41845703125, 12.028076171875, 12.6376953125, 13.247314453125, 13.85693359375, 14.466552734375, 15.076171875, 15.685791015625, 16.29541015625, 16.905029296875, 17.5146484375, 18.124267578125, 18.73388671875, 19.343505859375, 19.953125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 3.0, 7.0, 11.0, 11.0, 15.0, 15.0, 14.0, 29.0, 25.0, 30.0, 33.0, 33.0, 39.0, 44.0, 45.0, 63.0, 33.0, 37.0, 40.0, 46.0, 48.0, 43.0, 47.0, 32.0, 34.0, 34.0, 32.0, 17.0, 26.0, 21.0, 14.0, 11.0, 14.0, 10.0, 9.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-36.1875, -35.08203125, -33.9765625, -32.87109375, -31.765625, -30.66015625, -29.5546875, -28.44921875, -27.34375, -26.23828125, -25.1328125, -24.02734375, -22.921875, -21.81640625, -20.7109375, -19.60546875, -18.5, -17.39453125, -16.2890625, -15.18359375, -14.078125, -12.97265625, -11.8671875, -10.76171875, -9.65625, -8.55078125, -7.4453125, -6.33984375, -5.234375, -4.12890625, -3.0234375, -1.91796875, -0.8125, 0.29296875, 1.3984375, 2.50390625, 3.609375, 4.71484375, 5.8203125, 6.92578125, 8.03125, 9.13671875, 10.2421875, 11.34765625, 12.453125, 13.55859375, 14.6640625, 15.76953125, 16.875, 17.98046875, 19.0859375, 20.19140625, 21.296875, 22.40234375, 23.5078125, 24.61328125, 25.71875, 26.82421875, 27.9296875, 29.03515625, 30.140625, 31.24609375, 32.3515625, 33.45703125, 34.5625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 12.0, 32.0, 52.0, 84.0, 160.0, 287.0, 402.0, 742.0, 1218.0, 1960.0, 3408.0, 5388.0, 8652.0, 13812.0, 21024.0, 31629.0, 46764.0, 66718.0, 92468.0, 126909.0, 165007.0, 207605.0, 251455.0, 292381.0, 325079.0, 343351.0, 347051.0, 336543.0, 309448.0, 273915.0, 230992.0, 186526.0, 145621.0, 109536.0, 80242.0, 56607.0, 38386.0, 26118.0, 17512.0, 11146.0, 7106.0, 4392.0, 2672.0, 1556.0, 982.0, 534.0, 352.0, 216.0, 95.0, 63.0, 35.0, 13.0, 11.0, 8.0, 0.0, 2.0], "bins": [-21.546875, -20.91796875, -20.2890625, -19.66015625, -19.03125, -18.40234375, -17.7734375, -17.14453125, -16.515625, -15.88671875, -15.2578125, -14.62890625, -14.0, -13.37109375, -12.7421875, -12.11328125, -11.484375, -10.85546875, -10.2265625, -9.59765625, -8.96875, -8.33984375, -7.7109375, -7.08203125, -6.453125, -5.82421875, -5.1953125, -4.56640625, -3.9375, -3.30859375, -2.6796875, -2.05078125, -1.421875, -0.79296875, -0.1640625, 0.46484375, 1.09375, 1.72265625, 2.3515625, 2.98046875, 3.609375, 4.23828125, 4.8671875, 5.49609375, 6.125, 6.75390625, 7.3828125, 8.01171875, 8.640625, 9.26953125, 9.8984375, 10.52734375, 11.15625, 11.78515625, 12.4140625, 13.04296875, 13.671875, 14.30078125, 14.9296875, 15.55859375, 16.1875, 16.81640625, 17.4453125, 18.07421875, 18.703125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 16.0, 16.0, 27.0, 27.0, 32.0, 48.0, 54.0, 84.0, 103.0, 110.0, 137.0, 144.0, 153.0, 190.0, 162.0, 190.0, 188.0, 202.0, 203.0, 199.0, 196.0, 194.0, 194.0, 162.0, 171.0, 148.0, 114.0, 110.0, 104.0, 89.0, 70.0, 36.0, 36.0, 42.0, 31.0, 17.0, 19.0, 15.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.125, -15.6556396484375, -15.186279296875, -14.7169189453125, -14.24755859375, -13.7781982421875, -13.308837890625, -12.8394775390625, -12.3701171875, -11.9007568359375, -11.431396484375, -10.9620361328125, -10.49267578125, -10.0233154296875, -9.553955078125, -9.0845947265625, -8.615234375, -8.1458740234375, -7.676513671875, -7.2071533203125, -6.73779296875, -6.2684326171875, -5.799072265625, -5.3297119140625, -4.8603515625, -4.3909912109375, -3.921630859375, -3.4522705078125, -2.98291015625, -2.5135498046875, -2.044189453125, -1.5748291015625, -1.10546875, -0.6361083984375, -0.166748046875, 0.3026123046875, 0.77197265625, 1.2413330078125, 1.710693359375, 2.1800537109375, 2.6494140625, 3.1187744140625, 3.588134765625, 4.0574951171875, 4.52685546875, 4.9962158203125, 5.465576171875, 5.9349365234375, 6.404296875, 6.8736572265625, 7.343017578125, 7.8123779296875, 8.28173828125, 8.7510986328125, 9.220458984375, 9.6898193359375, 10.1591796875, 10.6285400390625, 11.097900390625, 11.5672607421875, 12.03662109375, 12.5059814453125, 12.975341796875, 13.4447021484375, 13.9140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 5.0, 3.0, 6.0, 11.0, 15.0, 14.0, 17.0, 23.0, 18.0, 26.0, 35.0, 30.0, 39.0, 39.0, 41.0, 50.0, 37.0, 53.0, 38.0, 46.0, 44.0, 46.0, 42.0, 41.0, 36.0, 32.0, 25.0, 33.0, 26.0, 24.0, 14.0, 27.0, 18.0, 10.0, 9.0, 4.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.505916595458984, -31.42090606689453, -30.335895538330078, -29.250885009765625, -28.165874481201172, -27.08086395263672, -25.995853424072266, -24.910842895507812, -23.82583236694336, -22.740821838378906, -21.655811309814453, -20.57080078125, -19.485790252685547, -18.400779724121094, -17.31576919555664, -16.230758666992188, -15.145748138427734, -14.060737609863281, -12.975727081298828, -11.890716552734375, -10.805706024169922, -9.720695495605469, -8.635684967041016, -7.5506744384765625, -6.465663909912109, -5.380653381347656, -4.295642852783203, -3.21063232421875, -2.125621795654297, -1.0406112670898438, 0.044399261474609375, 1.1294097900390625, 2.2144203186035156, 3.2994308471679688, 4.384441375732422, 5.469451904296875, 6.554462432861328, 7.639472961425781, 8.724483489990234, 9.809494018554688, 10.89450454711914, 11.979515075683594, 13.064525604248047, 14.1495361328125, 15.234546661376953, 16.319557189941406, 17.40456771850586, 18.489578247070312, 19.574588775634766, 20.65959930419922, 21.744609832763672, 22.829620361328125, 23.914630889892578, 24.99964141845703, 26.084651947021484, 27.169662475585938, 28.25467300415039, 29.339683532714844, 30.424694061279297, 31.50970458984375, 32.5947151184082, 33.679725646972656, 34.76473617553711, 35.84974670410156, 36.934757232666016]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 6.0, 11.0, 7.0, 9.0, 18.0, 13.0, 21.0, 22.0, 30.0, 36.0, 42.0, 28.0, 35.0, 34.0, 44.0, 45.0, 53.0, 39.0, 40.0, 48.0, 45.0, 37.0, 39.0, 26.0, 35.0, 35.0, 26.0, 29.0, 21.0, 19.0, 14.0, 17.0, 16.0, 14.0, 9.0, 7.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.774681091308594, -34.55237579345703, -33.33007049560547, -32.10776138305664, -30.885456085205078, -29.663150787353516, -28.440845489501953, -27.21854019165039, -25.996232986450195, -24.773927688598633, -23.551620483398438, -22.329315185546875, -21.107009887695312, -19.884702682495117, -18.662397384643555, -17.44009017944336, -16.217784881591797, -14.995478630065918, -13.773172378540039, -12.550867080688477, -11.328560829162598, -10.106254577636719, -8.883949279785156, -7.661643028259277, -6.439336776733398, -5.2170305252075195, -3.994724750518799, -2.772418737411499, -1.5501127243041992, -0.3278064727783203, 0.8944993019104004, 2.116805076599121, 3.339111328125, 4.561417579650879, 5.7837233543396, 7.00602912902832, 8.2283353805542, 9.450641632080078, 10.67294692993164, 11.89525318145752, 13.117559432983398, 14.339865684509277, 15.562171936035156, 16.78447723388672, 18.00678253173828, 19.229089736938477, 20.45139503479004, 21.673702239990234, 22.896007537841797, 24.11831283569336, 25.340620040893555, 26.562925338745117, 27.785232543945312, 29.007537841796875, 30.229843139648438, 31.4521484375, 32.67445373535156, 33.896759033203125, 35.11906433105469, 36.341373443603516, 37.56367874145508, 38.78598403930664, 40.0082893371582, 41.230594635009766, 42.452903747558594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 13.0, 13.0, 8.0, 13.0, 30.0, 33.0, 37.0, 61.0, 79.0, 133.0, 188.0, 283.0, 431.0, 676.0, 1040.0, 1711.0, 2672.0, 4333.0, 7597.0, 13029.0, 23644.0, 44662.0, 87832.0, 165323.0, 244312.0, 205304.0, 114685.0, 58790.0, 30922.0, 16558.0, 9418.0, 5579.0, 3400.0, 2066.0, 1239.0, 815.0, 506.0, 327.0, 239.0, 159.0, 111.0, 73.0, 53.0, 47.0, 29.0, 21.0, 15.0, 5.0, 15.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.66796875, -7.41827392578125, -7.1685791015625, -6.91888427734375, -6.669189453125, -6.41949462890625, -6.1697998046875, -5.92010498046875, -5.67041015625, -5.42071533203125, -5.1710205078125, -4.92132568359375, -4.671630859375, -4.42193603515625, -4.1722412109375, -3.92254638671875, -3.6728515625, -3.42315673828125, -3.1734619140625, -2.92376708984375, -2.674072265625, -2.42437744140625, -2.1746826171875, -1.92498779296875, -1.67529296875, -1.42559814453125, -1.1759033203125, -0.92620849609375, -0.676513671875, -0.42681884765625, -0.1771240234375, 0.07257080078125, 0.322265625, 0.57196044921875, 0.8216552734375, 1.07135009765625, 1.321044921875, 1.57073974609375, 1.8204345703125, 2.07012939453125, 2.31982421875, 2.56951904296875, 2.8192138671875, 3.06890869140625, 3.318603515625, 3.56829833984375, 3.8179931640625, 4.06768798828125, 4.3173828125, 4.56707763671875, 4.8167724609375, 5.06646728515625, 5.316162109375, 5.56585693359375, 5.8155517578125, 6.06524658203125, 6.31494140625, 6.56463623046875, 6.8143310546875, 7.06402587890625, 7.313720703125, 7.56341552734375, 7.8131103515625, 8.06280517578125, 8.3125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 6.0, 11.0, 7.0, 8.0, 19.0, 12.0, 23.0, 22.0, 29.0, 35.0, 41.0, 32.0, 33.0, 34.0, 43.0, 46.0, 53.0, 40.0, 39.0, 51.0, 44.0, 34.0, 38.0, 26.0, 37.0, 35.0, 27.0, 28.0, 21.0, 18.0, 14.0, 18.0, 15.0, 15.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -34.15380859375, -32.9326171875, -31.71142578125, -30.490234375, -29.26904296875, -28.0478515625, -26.82666015625, -25.60546875, -24.38427734375, -23.1630859375, -21.94189453125, -20.720703125, -19.49951171875, -18.2783203125, -17.05712890625, -15.8359375, -14.61474609375, -13.3935546875, -12.17236328125, -10.951171875, -9.72998046875, -8.5087890625, -7.28759765625, -6.06640625, -4.84521484375, -3.6240234375, -2.40283203125, -1.181640625, 0.03955078125, 1.2607421875, 2.48193359375, 3.703125, 4.92431640625, 6.1455078125, 7.36669921875, 8.587890625, 9.80908203125, 11.0302734375, 12.25146484375, 13.47265625, 14.69384765625, 15.9150390625, 17.13623046875, 18.357421875, 19.57861328125, 20.7998046875, 22.02099609375, 23.2421875, 24.46337890625, 25.6845703125, 26.90576171875, 28.126953125, 29.34814453125, 30.5693359375, 31.79052734375, 33.01171875, 34.23291015625, 35.4541015625, 36.67529296875, 37.896484375, 39.11767578125, 40.3388671875, 41.56005859375, 42.78125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 13.0, 17.0, 28.0, 37.0, 43.0, 44.0, 63.0, 96.0, 113.0, 191.0, 256.0, 371.0, 564.0, 866.0, 1319.0, 2125.0, 3665.0, 7087.0, 13411.0, 30087.0, 76375.0, 221729.0, 387583.0, 184646.0, 64363.0, 26092.0, 12067.0, 6179.0, 3396.0, 1957.0, 1252.0, 761.0, 500.0, 345.0, 228.0, 185.0, 124.0, 90.0, 69.0, 52.0, 40.0, 20.0, 24.0, 15.0, 12.0, 7.0, 12.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-9.4140625, -9.13232421875, -8.8505859375, -8.56884765625, -8.287109375, -8.00537109375, -7.7236328125, -7.44189453125, -7.16015625, -6.87841796875, -6.5966796875, -6.31494140625, -6.033203125, -5.75146484375, -5.4697265625, -5.18798828125, -4.90625, -4.62451171875, -4.3427734375, -4.06103515625, -3.779296875, -3.49755859375, -3.2158203125, -2.93408203125, -2.65234375, -2.37060546875, -2.0888671875, -1.80712890625, -1.525390625, -1.24365234375, -0.9619140625, -0.68017578125, -0.3984375, -0.11669921875, 0.1650390625, 0.44677734375, 0.728515625, 1.01025390625, 1.2919921875, 1.57373046875, 1.85546875, 2.13720703125, 2.4189453125, 2.70068359375, 2.982421875, 3.26416015625, 3.5458984375, 3.82763671875, 4.109375, 4.39111328125, 4.6728515625, 4.95458984375, 5.236328125, 5.51806640625, 5.7998046875, 6.08154296875, 6.36328125, 6.64501953125, 6.9267578125, 7.20849609375, 7.490234375, 7.77197265625, 8.0537109375, 8.33544921875, 8.6171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 8.0, 6.0, 8.0, 8.0, 8.0, 9.0, 3.0, 11.0, 15.0, 21.0, 13.0, 25.0, 32.0, 32.0, 28.0, 25.0, 42.0, 42.0, 38.0, 41.0, 27.0, 30.0, 40.0, 50.0, 36.0, 35.0, 34.0, 37.0, 33.0, 29.0, 25.0, 35.0, 34.0, 17.0, 10.0, 20.0, 14.0, 14.0, 10.0, 9.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.890625, -24.103515625, -23.31640625, -22.529296875, -21.7421875, -20.955078125, -20.16796875, -19.380859375, -18.59375, -17.806640625, -17.01953125, -16.232421875, -15.4453125, -14.658203125, -13.87109375, -13.083984375, -12.296875, -11.509765625, -10.72265625, -9.935546875, -9.1484375, -8.361328125, -7.57421875, -6.787109375, -6.0, -5.212890625, -4.42578125, -3.638671875, -2.8515625, -2.064453125, -1.27734375, -0.490234375, 0.296875, 1.083984375, 1.87109375, 2.658203125, 3.4453125, 4.232421875, 5.01953125, 5.806640625, 6.59375, 7.380859375, 8.16796875, 8.955078125, 9.7421875, 10.529296875, 11.31640625, 12.103515625, 12.890625, 13.677734375, 14.46484375, 15.251953125, 16.0390625, 16.826171875, 17.61328125, 18.400390625, 19.1875, 19.974609375, 20.76171875, 21.548828125, 22.3359375, 23.123046875, 23.91015625, 24.697265625, 25.484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 29.0, 30.0, 45.0, 58.0, 77.0, 133.0, 204.0, 317.0, 482.0, 879.0, 1342.0, 2316.0, 4201.0, 7676.0, 15686.0, 36758.0, 112861.0, 458673.0, 285796.0, 69220.0, 25972.0, 11670.0, 5937.0, 3276.0, 1856.0, 1088.0, 750.0, 392.0, 305.0, 177.0, 102.0, 64.0, 54.0, 29.0, 18.0, 18.0, 13.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.3154296875, -5.158203125, -5.0009765625, -4.84375, -4.6865234375, -4.529296875, -4.3720703125, -4.21484375, -4.0576171875, -3.900390625, -3.7431640625, -3.5859375, -3.4287109375, -3.271484375, -3.1142578125, -2.95703125, -2.7998046875, -2.642578125, -2.4853515625, -2.328125, -2.1708984375, -2.013671875, -1.8564453125, -1.69921875, -1.5419921875, -1.384765625, -1.2275390625, -1.0703125, -0.9130859375, -0.755859375, -0.5986328125, -0.44140625, -0.2841796875, -0.126953125, 0.0302734375, 0.1875, 0.3447265625, 0.501953125, 0.6591796875, 0.81640625, 0.9736328125, 1.130859375, 1.2880859375, 1.4453125, 1.6025390625, 1.759765625, 1.9169921875, 2.07421875, 2.2314453125, 2.388671875, 2.5458984375, 2.703125, 2.8603515625, 3.017578125, 3.1748046875, 3.33203125, 3.4892578125, 3.646484375, 3.8037109375, 3.9609375, 4.1181640625, 4.275390625, 4.4326171875, 4.58984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 8.0, 9.0, 12.0, 16.0, 17.0, 25.0, 31.0, 46.0, 68.0, 78.0, 105.0, 109.0, 81.0, 89.0, 72.0, 55.0, 48.0, 44.0, 30.0, 20.0, 9.0, 8.0, 7.0, 0.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003669261932373047, -0.0003542117774486542, -0.00034149736166000366, -0.00032878294587135315, -0.00031606853008270264, -0.0003033541142940521, -0.0002906396985054016, -0.0002779252827167511, -0.0002652108669281006, -0.0002524964511394501, -0.00023978203535079956, -0.00022706761956214905, -0.00021435320377349854, -0.00020163878798484802, -0.0001889243721961975, -0.000176209956407547, -0.00016349554061889648, -0.00015078112483024597, -0.00013806670904159546, -0.00012535229325294495, -0.00011263787746429443, -9.992346167564392e-05, -8.720904588699341e-05, -7.44946300983429e-05, -6.178021430969238e-05, -4.906579852104187e-05, -3.635138273239136e-05, -2.3636966943740845e-05, -1.0922551155090332e-05, 1.7918646335601807e-06, 1.4506280422210693e-05, 2.7220696210861206e-05, 3.993511199951172e-05, 5.264952778816223e-05, 6.536394357681274e-05, 7.807835936546326e-05, 9.079277515411377e-05, 0.00010350719094276428, 0.0001162216067314148, 0.0001289360225200653, 0.00014165043830871582, 0.00015436485409736633, 0.00016707926988601685, 0.00017979368567466736, 0.00019250810146331787, 0.00020522251725196838, 0.0002179369330406189, 0.0002306513488292694, 0.00024336576461791992, 0.00025608018040657043, 0.00026879459619522095, 0.00028150901198387146, 0.00029422342777252197, 0.0003069378435611725, 0.000319652259349823, 0.0003323666751384735, 0.000345081090927124, 0.00035779550671577454, 0.00037050992250442505, 0.00038322433829307556, 0.0003959387540817261, 0.0004086531698703766, 0.0004213675856590271, 0.0004340820014476776, 0.0004467964172363281]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 16.0, 19.0, 33.0, 40.0, 57.0, 86.0, 117.0, 205.0, 279.0, 392.0, 627.0, 895.0, 1413.0, 2214.0, 3612.0, 5797.0, 9671.0, 17162.0, 30538.0, 57162.0, 106394.0, 186672.0, 236809.0, 173223.0, 96055.0, 51455.0, 28235.0, 15717.0, 9057.0, 5376.0, 3330.0, 1990.0, 1246.0, 861.0, 556.0, 388.0, 245.0, 185.0, 138.0, 78.0, 64.0, 47.0, 28.0, 18.0, 18.0, 7.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.35546875, -4.21685791015625, -4.0782470703125, -3.93963623046875, -3.801025390625, -3.66241455078125, -3.5238037109375, -3.38519287109375, -3.24658203125, -3.10797119140625, -2.9693603515625, -2.83074951171875, -2.692138671875, -2.55352783203125, -2.4149169921875, -2.27630615234375, -2.1376953125, -1.99908447265625, -1.8604736328125, -1.72186279296875, -1.583251953125, -1.44464111328125, -1.3060302734375, -1.16741943359375, -1.02880859375, -0.89019775390625, -0.7515869140625, -0.61297607421875, -0.474365234375, -0.33575439453125, -0.1971435546875, -0.05853271484375, 0.080078125, 0.21868896484375, 0.3572998046875, 0.49591064453125, 0.634521484375, 0.77313232421875, 0.9117431640625, 1.05035400390625, 1.18896484375, 1.32757568359375, 1.4661865234375, 1.60479736328125, 1.743408203125, 1.88201904296875, 2.0206298828125, 2.15924072265625, 2.2978515625, 2.43646240234375, 2.5750732421875, 2.71368408203125, 2.852294921875, 2.99090576171875, 3.1295166015625, 3.26812744140625, 3.40673828125, 3.54534912109375, 3.6839599609375, 3.82257080078125, 3.961181640625, 4.09979248046875, 4.2384033203125, 4.37701416015625, 4.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 12.0, 6.0, 21.0, 32.0, 36.0, 67.0, 76.0, 104.0, 113.0, 111.0, 121.0, 83.0, 67.0, 40.0, 28.0, 14.0, 9.0, 9.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.46484375, -4.34332275390625, -4.2218017578125, -4.10028076171875, -3.978759765625, -3.85723876953125, -3.7357177734375, -3.61419677734375, -3.49267578125, -3.37115478515625, -3.2496337890625, -3.12811279296875, -3.006591796875, -2.88507080078125, -2.7635498046875, -2.64202880859375, -2.5205078125, -2.39898681640625, -2.2774658203125, -2.15594482421875, -2.034423828125, -1.91290283203125, -1.7913818359375, -1.66986083984375, -1.54833984375, -1.42681884765625, -1.3052978515625, -1.18377685546875, -1.062255859375, -0.94073486328125, -0.8192138671875, -0.69769287109375, -0.576171875, -0.45465087890625, -0.3331298828125, -0.21160888671875, -0.090087890625, 0.03143310546875, 0.1529541015625, 0.27447509765625, 0.39599609375, 0.51751708984375, 0.6390380859375, 0.76055908203125, 0.882080078125, 1.00360107421875, 1.1251220703125, 1.24664306640625, 1.3681640625, 1.48968505859375, 1.6112060546875, 1.73272705078125, 1.854248046875, 1.97576904296875, 2.0972900390625, 2.21881103515625, 2.34033203125, 2.46185302734375, 2.5833740234375, 2.70489501953125, 2.826416015625, 2.94793701171875, 3.0694580078125, 3.19097900390625, 3.3125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 8.0, 10.0, 17.0, 8.0, 17.0, 20.0, 22.0, 23.0, 33.0, 25.0, 43.0, 34.0, 39.0, 47.0, 45.0, 47.0, 44.0, 47.0, 42.0, 39.0, 50.0, 41.0, 42.0, 31.0, 27.0, 30.0, 30.0, 22.0, 16.0, 19.0, 19.0, 17.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.85098648071289, -31.76666831970215, -30.682350158691406, -29.598033905029297, -28.513715744018555, -27.429397583007812, -26.345081329345703, -25.26076316833496, -24.17644500732422, -23.092126846313477, -22.007808685302734, -20.923492431640625, -19.839174270629883, -18.75485610961914, -17.67053985595703, -16.58622169494629, -15.501903533935547, -14.417585372924805, -13.333268165588379, -12.248950958251953, -11.164632797241211, -10.080314636230469, -8.995997428894043, -7.911679744720459, -6.827362060546875, -5.743044376373291, -4.658726692199707, -3.574409008026123, -2.490091323852539, -1.405773639678955, -0.3214559555053711, 0.7628617286682129, 1.8471832275390625, 2.9315009117126465, 4.0158185958862305, 5.1001362800598145, 6.184453964233398, 7.268771648406982, 8.353089332580566, 9.437406539916992, 10.521724700927734, 11.606042861938477, 12.690360069274902, 13.774677276611328, 14.85899543762207, 15.943313598632812, 17.027629852294922, 18.111948013305664, 19.196266174316406, 20.28058433532715, 21.36490249633789, 22.44921875, 23.533536911010742, 24.617855072021484, 25.702171325683594, 26.786489486694336, 27.870807647705078, 28.95512580871582, 30.039443969726562, 31.123760223388672, 32.20807647705078, 33.292396545410156, 34.376712799072266, 35.46103286743164, 36.54534912109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 9.0, 14.0, 7.0, 21.0, 21.0, 16.0, 37.0, 29.0, 38.0, 36.0, 36.0, 32.0, 40.0, 50.0, 45.0, 46.0, 46.0, 55.0, 38.0, 30.0, 36.0, 30.0, 40.0, 31.0, 24.0, 26.0, 25.0, 16.0, 17.0, 15.0, 19.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.312740325927734, -34.09036636352539, -32.86799240112305, -31.645618438720703, -30.42324447631836, -29.200870513916016, -27.97849464416504, -26.756120681762695, -25.53374671936035, -24.311372756958008, -23.088998794555664, -21.86662483215332, -20.644248962402344, -19.421875, -18.199501037597656, -16.977127075195312, -15.754753112792969, -14.532379150390625, -13.310005187988281, -12.087630271911621, -10.865256309509277, -9.642882347106934, -8.420507431030273, -7.19813346862793, -5.975759506225586, -4.753385543823242, -3.5310111045837402, -2.3086369037628174, -1.0862627029418945, 0.13611125946044922, 1.3584856986999512, 2.580860137939453, 3.8032379150390625, 5.025611877441406, 6.247986316680908, 7.47036075592041, 8.692734718322754, 9.915108680725098, 11.137483596801758, 12.359857559204102, 13.582231521606445, 14.804605484008789, 16.026979446411133, 17.249353408813477, 18.471729278564453, 19.694103240966797, 20.91647720336914, 22.138851165771484, 23.361225128173828, 24.583599090576172, 25.805973052978516, 27.02834701538086, 28.250720977783203, 29.473094940185547, 30.695470809936523, 31.917844772338867, 33.140220642089844, 34.36259460449219, 35.58496856689453, 36.807342529296875, 38.02971649169922, 39.25209045410156, 40.474464416503906, 41.69683837890625, 42.919212341308594]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 16.0, 29.0, 58.0, 77.0, 130.0, 215.0, 395.0, 718.0, 1194.0, 1936.0, 3254.0, 5225.0, 8345.0, 12990.0, 19723.0, 29126.0, 41113.0, 55488.0, 71864.0, 87088.0, 98582.0, 105277.0, 103636.0, 95274.0, 81107.0, 66249.0, 50761.0, 36723.0, 25546.0, 16953.0, 11070.0, 7075.0, 4352.0, 2823.0, 1727.0, 1023.0, 550.0, 344.0, 205.0, 134.0, 59.0, 40.0, 27.0, 15.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.37158203125, -18.7431640625, -18.11474609375, -17.486328125, -16.85791015625, -16.2294921875, -15.60107421875, -14.97265625, -14.34423828125, -13.7158203125, -13.08740234375, -12.458984375, -11.83056640625, -11.2021484375, -10.57373046875, -9.9453125, -9.31689453125, -8.6884765625, -8.06005859375, -7.431640625, -6.80322265625, -6.1748046875, -5.54638671875, -4.91796875, -4.28955078125, -3.6611328125, -3.03271484375, -2.404296875, -1.77587890625, -1.1474609375, -0.51904296875, 0.109375, 0.73779296875, 1.3662109375, 1.99462890625, 2.623046875, 3.25146484375, 3.8798828125, 4.50830078125, 5.13671875, 5.76513671875, 6.3935546875, 7.02197265625, 7.650390625, 8.27880859375, 8.9072265625, 9.53564453125, 10.1640625, 10.79248046875, 11.4208984375, 12.04931640625, 12.677734375, 13.30615234375, 13.9345703125, 14.56298828125, 15.19140625, 15.81982421875, 16.4482421875, 17.07666015625, 17.705078125, 18.33349609375, 18.9619140625, 19.59033203125, 20.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 8.0, 13.0, 9.0, 19.0, 20.0, 17.0, 37.0, 26.0, 42.0, 31.0, 37.0, 36.0, 38.0, 43.0, 49.0, 50.0, 39.0, 53.0, 47.0, 28.0, 33.0, 33.0, 40.0, 31.0, 27.0, 27.0, 24.0, 16.0, 17.0, 14.0, 18.0, 13.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.49169921875, -32.2958984375, -31.10009765625, -29.904296875, -28.70849609375, -27.5126953125, -26.31689453125, -25.12109375, -23.92529296875, -22.7294921875, -21.53369140625, -20.337890625, -19.14208984375, -17.9462890625, -16.75048828125, -15.5546875, -14.35888671875, -13.1630859375, -11.96728515625, -10.771484375, -9.57568359375, -8.3798828125, -7.18408203125, -5.98828125, -4.79248046875, -3.5966796875, -2.40087890625, -1.205078125, -0.00927734375, 1.1865234375, 2.38232421875, 3.578125, 4.77392578125, 5.9697265625, 7.16552734375, 8.361328125, 9.55712890625, 10.7529296875, 11.94873046875, 13.14453125, 14.34033203125, 15.5361328125, 16.73193359375, 17.927734375, 19.12353515625, 20.3193359375, 21.51513671875, 22.7109375, 23.90673828125, 25.1025390625, 26.29833984375, 27.494140625, 28.68994140625, 29.8857421875, 31.08154296875, 32.27734375, 33.47314453125, 34.6689453125, 35.86474609375, 37.060546875, 38.25634765625, 39.4521484375, 40.64794921875, 41.84375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 4.0, 8.0, 15.0, 11.0, 27.0, 38.0, 56.0, 101.0, 140.0, 225.0, 415.0, 605.0, 1029.0, 1623.0, 2488.0, 3845.0, 5853.0, 8942.0, 13063.0, 18855.0, 27033.0, 37216.0, 48593.0, 61975.0, 74414.0, 86059.0, 93178.0, 95561.0, 91898.0, 83861.0, 72438.0, 59426.0, 45933.0, 34901.0, 25354.0, 17469.0, 12196.0, 8347.0, 5481.0, 3677.0, 2299.0, 1439.0, 952.0, 540.0, 359.0, 238.0, 161.0, 81.0, 51.0, 31.0, 25.0, 12.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.423095703125, -16.83056640625, -16.238037109375, -15.6455078125, -15.052978515625, -14.46044921875, -13.867919921875, -13.275390625, -12.682861328125, -12.09033203125, -11.497802734375, -10.9052734375, -10.312744140625, -9.72021484375, -9.127685546875, -8.53515625, -7.942626953125, -7.35009765625, -6.757568359375, -6.1650390625, -5.572509765625, -4.97998046875, -4.387451171875, -3.794921875, -3.202392578125, -2.60986328125, -2.017333984375, -1.4248046875, -0.832275390625, -0.23974609375, 0.352783203125, 0.9453125, 1.537841796875, 2.13037109375, 2.722900390625, 3.3154296875, 3.907958984375, 4.50048828125, 5.093017578125, 5.685546875, 6.278076171875, 6.87060546875, 7.463134765625, 8.0556640625, 8.648193359375, 9.24072265625, 9.833251953125, 10.42578125, 11.018310546875, 11.61083984375, 12.203369140625, 12.7958984375, 13.388427734375, 13.98095703125, 14.573486328125, 15.166015625, 15.758544921875, 16.35107421875, 16.943603515625, 17.5361328125, 18.128662109375, 18.72119140625, 19.313720703125, 19.90625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 8.0, 17.0, 8.0, 21.0, 22.0, 18.0, 19.0, 33.0, 41.0, 40.0, 42.0, 36.0, 52.0, 38.0, 31.0, 29.0, 40.0, 45.0, 33.0, 34.0, 32.0, 32.0, 38.0, 35.0, 32.0, 32.0, 14.0, 16.0, 20.0, 13.0, 9.0, 9.0, 14.0, 7.0, 5.0, 5.0, 13.0, 4.0, 7.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.34375, -22.607666015625, -21.87158203125, -21.135498046875, -20.3994140625, -19.663330078125, -18.92724609375, -18.191162109375, -17.455078125, -16.718994140625, -15.98291015625, -15.246826171875, -14.5107421875, -13.774658203125, -13.03857421875, -12.302490234375, -11.56640625, -10.830322265625, -10.09423828125, -9.358154296875, -8.6220703125, -7.885986328125, -7.14990234375, -6.413818359375, -5.677734375, -4.941650390625, -4.20556640625, -3.469482421875, -2.7333984375, -1.997314453125, -1.26123046875, -0.525146484375, 0.2109375, 0.947021484375, 1.68310546875, 2.419189453125, 3.1552734375, 3.891357421875, 4.62744140625, 5.363525390625, 6.099609375, 6.835693359375, 7.57177734375, 8.307861328125, 9.0439453125, 9.780029296875, 10.51611328125, 11.252197265625, 11.98828125, 12.724365234375, 13.46044921875, 14.196533203125, 14.9326171875, 15.668701171875, 16.40478515625, 17.140869140625, 17.876953125, 18.613037109375, 19.34912109375, 20.085205078125, 20.8212890625, 21.557373046875, 22.29345703125, 23.029541015625, 23.765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 17.0, 23.0, 26.0, 30.0, 48.0, 93.0, 145.0, 248.0, 416.0, 617.0, 997.0, 1752.0, 3072.0, 5255.0, 9261.0, 16449.0, 28090.0, 45833.0, 71199.0, 100095.0, 126463.0, 141678.0, 136715.0, 117626.0, 89198.0, 60648.0, 38358.0, 23120.0, 13199.0, 7612.0, 4275.0, 2374.0, 1404.0, 849.0, 515.0, 330.0, 191.0, 120.0, 71.0, 52.0, 37.0, 17.0, 11.0, 11.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0078125, -10.6385498046875, -10.269287109375, -9.9000244140625, -9.53076171875, -9.1614990234375, -8.792236328125, -8.4229736328125, -8.0537109375, -7.6844482421875, -7.315185546875, -6.9459228515625, -6.57666015625, -6.2073974609375, -5.838134765625, -5.4688720703125, -5.099609375, -4.7303466796875, -4.361083984375, -3.9918212890625, -3.62255859375, -3.2532958984375, -2.884033203125, -2.5147705078125, -2.1455078125, -1.7762451171875, -1.406982421875, -1.0377197265625, -0.66845703125, -0.2991943359375, 0.070068359375, 0.4393310546875, 0.80859375, 1.1778564453125, 1.547119140625, 1.9163818359375, 2.28564453125, 2.6549072265625, 3.024169921875, 3.3934326171875, 3.7626953125, 4.1319580078125, 4.501220703125, 4.8704833984375, 5.23974609375, 5.6090087890625, 5.978271484375, 6.3475341796875, 6.716796875, 7.0860595703125, 7.455322265625, 7.8245849609375, 8.19384765625, 8.5631103515625, 8.932373046875, 9.3016357421875, 9.6708984375, 10.0401611328125, 10.409423828125, 10.7786865234375, 11.14794921875, 11.5172119140625, 11.886474609375, 12.2557373046875, 12.625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 10.0, 16.0, 14.0, 19.0, 24.0, 19.0, 34.0, 40.0, 39.0, 43.0, 45.0, 59.0, 44.0, 54.0, 60.0, 52.0, 42.0, 45.0, 39.0, 50.0, 33.0, 36.0, 28.0, 33.0, 14.0, 14.0, 22.0, 6.0, 15.0, 7.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011301040649414062, -0.0010917186737060547, -0.0010533332824707031, -0.0010149478912353516, -0.0009765625, -0.0009381771087646484, -0.0008997917175292969, -0.0008614063262939453, -0.0008230209350585938, -0.0007846355438232422, -0.0007462501525878906, -0.0007078647613525391, -0.0006694793701171875, -0.0006310939788818359, -0.0005927085876464844, -0.0005543231964111328, -0.0005159378051757812, -0.0004775524139404297, -0.0004391670227050781, -0.00040078163146972656, -0.000362396240234375, -0.00032401084899902344, -0.0002856254577636719, -0.0002472400665283203, -0.00020885467529296875, -0.0001704692840576172, -0.00013208389282226562, -9.369850158691406e-05, -5.53131103515625e-05, -1.6927719116210938e-05, 2.1457672119140625e-05, 5.984306335449219e-05, 9.822845458984375e-05, 0.0001366138458251953, 0.00017499923706054688, 0.00021338462829589844, 0.00025177001953125, 0.00029015541076660156, 0.0003285408020019531, 0.0003669261932373047, 0.00040531158447265625, 0.0004436969757080078, 0.0004820823669433594, 0.0005204677581787109, 0.0005588531494140625, 0.0005972385406494141, 0.0006356239318847656, 0.0006740093231201172, 0.0007123947143554688, 0.0007507801055908203, 0.0007891654968261719, 0.0008275508880615234, 0.000865936279296875, 0.0009043216705322266, 0.0009427070617675781, 0.0009810924530029297, 0.0010194778442382812, 0.0010578632354736328, 0.0010962486267089844, 0.001134634017944336, 0.0011730194091796875, 0.001211404800415039, 0.0012497901916503906, 0.0012881755828857422, 0.0013265609741210938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 15.0, 17.0, 33.0, 39.0, 76.0, 135.0, 241.0, 425.0, 750.0, 1237.0, 2035.0, 3837.0, 6648.0, 11768.0, 20382.0, 34062.0, 55290.0, 82551.0, 112912.0, 137015.0, 144715.0, 132141.0, 105487.0, 75643.0, 49764.0, 29803.0, 17692.0, 10210.0, 5909.0, 3252.0, 1889.0, 1058.0, 612.0, 351.0, 230.0, 119.0, 77.0, 53.0, 30.0, 21.0, 13.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.690185546875, -11.26318359375, -10.836181640625, -10.4091796875, -9.982177734375, -9.55517578125, -9.128173828125, -8.701171875, -8.274169921875, -7.84716796875, -7.420166015625, -6.9931640625, -6.566162109375, -6.13916015625, -5.712158203125, -5.28515625, -4.858154296875, -4.43115234375, -4.004150390625, -3.5771484375, -3.150146484375, -2.72314453125, -2.296142578125, -1.869140625, -1.442138671875, -1.01513671875, -0.588134765625, -0.1611328125, 0.265869140625, 0.69287109375, 1.119873046875, 1.546875, 1.973876953125, 2.40087890625, 2.827880859375, 3.2548828125, 3.681884765625, 4.10888671875, 4.535888671875, 4.962890625, 5.389892578125, 5.81689453125, 6.243896484375, 6.6708984375, 7.097900390625, 7.52490234375, 7.951904296875, 8.37890625, 8.805908203125, 9.23291015625, 9.659912109375, 10.0869140625, 10.513916015625, 10.94091796875, 11.367919921875, 11.794921875, 12.221923828125, 12.64892578125, 13.075927734375, 13.5029296875, 13.929931640625, 14.35693359375, 14.783935546875, 15.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 11.0, 12.0, 22.0, 26.0, 19.0, 36.0, 41.0, 39.0, 39.0, 46.0, 45.0, 49.0, 53.0, 44.0, 58.0, 46.0, 47.0, 40.0, 35.0, 34.0, 27.0, 31.0, 28.0, 20.0, 18.0, 22.0, 11.0, 16.0, 10.0, 10.0, 10.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.68084716796875, -4.5218505859375, -4.36285400390625, -4.203857421875, -4.04486083984375, -3.8858642578125, -3.72686767578125, -3.56787109375, -3.40887451171875, -3.2498779296875, -3.09088134765625, -2.931884765625, -2.77288818359375, -2.6138916015625, -2.45489501953125, -2.2958984375, -2.13690185546875, -1.9779052734375, -1.81890869140625, -1.659912109375, -1.50091552734375, -1.3419189453125, -1.18292236328125, -1.02392578125, -0.86492919921875, -0.7059326171875, -0.54693603515625, -0.387939453125, -0.22894287109375, -0.0699462890625, 0.08905029296875, 0.248046875, 0.40704345703125, 0.5660400390625, 0.72503662109375, 0.884033203125, 1.04302978515625, 1.2020263671875, 1.36102294921875, 1.52001953125, 1.67901611328125, 1.8380126953125, 1.99700927734375, 2.156005859375, 2.31500244140625, 2.4739990234375, 2.63299560546875, 2.7919921875, 2.95098876953125, 3.1099853515625, 3.26898193359375, 3.427978515625, 3.58697509765625, 3.7459716796875, 3.90496826171875, 4.06396484375, 4.22296142578125, 4.3819580078125, 4.54095458984375, 4.699951171875, 4.85894775390625, 5.0179443359375, 5.17694091796875, 5.3359375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 7.0, 7.0, 12.0, 16.0, 21.0, 27.0, 22.0, 26.0, 25.0, 34.0, 38.0, 29.0, 41.0, 48.0, 30.0, 41.0, 32.0, 44.0, 53.0, 36.0, 36.0, 49.0, 30.0, 35.0, 39.0, 37.0, 22.0, 20.0, 23.0, 18.0, 16.0, 17.0, 12.0, 10.0, 6.0, 14.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.44992446899414, -30.42497444152832, -29.4000244140625, -28.375076293945312, -27.350126266479492, -26.325176239013672, -25.300228118896484, -24.275278091430664, -23.250328063964844, -22.225378036499023, -21.200428009033203, -20.175479888916016, -19.150529861450195, -18.125579833984375, -17.100631713867188, -16.075681686401367, -15.050731658935547, -14.025781631469727, -13.000832557678223, -11.975883483886719, -10.950933456420898, -9.925983428955078, -8.901034355163574, -7.876084804534912, -6.85113525390625, -5.826185703277588, -4.801236152648926, -3.7762866020202637, -2.7513370513916016, -1.7263875007629395, -0.7014379501342773, 0.32351160049438477, 1.3484573364257812, 2.3734068870544434, 3.3983564376831055, 4.423305988311768, 5.44825553894043, 6.473205089569092, 7.498154640197754, 8.523103713989258, 9.548053741455078, 10.573003768920898, 11.597952842712402, 12.622901916503906, 13.647851943969727, 14.672801971435547, 15.69775104522705, 16.722700119018555, 17.747650146484375, 18.772600173950195, 19.797550201416016, 20.822498321533203, 21.847448348999023, 22.872398376464844, 23.89734649658203, 24.92229652404785, 25.947246551513672, 26.972196578979492, 27.997146606445312, 29.0220947265625, 30.04704475402832, 31.07199478149414, 32.09694290161133, 33.12189483642578, 34.14684295654297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 3.0, 9.0, 7.0, 16.0, 11.0, 16.0, 23.0, 22.0, 18.0, 26.0, 37.0, 37.0, 31.0, 44.0, 36.0, 61.0, 46.0, 47.0, 38.0, 38.0, 58.0, 43.0, 39.0, 35.0, 25.0, 33.0, 20.0, 28.0, 27.0, 21.0, 12.0, 21.0, 10.0, 13.0, 11.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.10544204711914, -39.828407287597656, -38.55137252807617, -37.27433776855469, -35.99729919433594, -34.72026443481445, -33.44322967529297, -32.166194915771484, -30.88916015625, -29.612125396728516, -28.33509063720703, -27.058053970336914, -25.78101921081543, -24.503984451293945, -23.226947784423828, -21.949913024902344, -20.67287826538086, -19.395843505859375, -18.11880874633789, -16.841772079467773, -15.564737319946289, -14.287702560424805, -13.010666847229004, -11.733631134033203, -10.456596374511719, -9.179561614990234, -7.902525901794434, -6.625490665435791, -5.348455429077148, -4.071420192718506, -2.7943849563598633, -1.5173492431640625, -0.24031448364257812, 1.0367207527160645, 2.313755989074707, 3.5907912254333496, 4.867826461791992, 6.144861698150635, 7.421896934509277, 8.698932647705078, 9.975967407226562, 11.253002166748047, 12.530037879943848, 13.807073593139648, 15.084108352661133, 16.361143112182617, 17.638179779052734, 18.91521453857422, 20.192249298095703, 21.469284057617188, 22.746318817138672, 24.02335548400879, 25.300390243530273, 26.577425003051758, 27.854461669921875, 29.13149642944336, 30.408531188964844, 31.685565948486328, 32.96260070800781, 34.2396354675293, 35.51667022705078, 36.79370880126953, 38.070743560791016, 39.3477783203125, 40.624813079833984]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 17.0, 12.0, 36.0, 69.0, 118.0, 166.0, 276.0, 442.0, 778.0, 1303.0, 2118.0, 3505.0, 5898.0, 9485.0, 15094.0, 24214.0, 37566.0, 57042.0, 84602.0, 121108.0, 167796.0, 222199.0, 281202.0, 336058.0, 377050.0, 400262.0, 395700.0, 369383.0, 322616.0, 265260.0, 207831.0, 154935.0, 111310.0, 76718.0, 51433.0, 33826.0, 21632.0, 13523.0, 8424.0, 5238.0, 3144.0, 1879.0, 1204.0, 699.0, 452.0, 255.0, 168.0, 97.0, 57.0, 43.0, 19.0, 12.0, 5.0, 7.0, 0.0, 0.0, 4.0], "bins": [-22.609375, -21.921630859375, -21.23388671875, -20.546142578125, -19.8583984375, -19.170654296875, -18.48291015625, -17.795166015625, -17.107421875, -16.419677734375, -15.73193359375, -15.044189453125, -14.3564453125, -13.668701171875, -12.98095703125, -12.293212890625, -11.60546875, -10.917724609375, -10.22998046875, -9.542236328125, -8.8544921875, -8.166748046875, -7.47900390625, -6.791259765625, -6.103515625, -5.415771484375, -4.72802734375, -4.040283203125, -3.3525390625, -2.664794921875, -1.97705078125, -1.289306640625, -0.6015625, 0.086181640625, 0.77392578125, 1.461669921875, 2.1494140625, 2.837158203125, 3.52490234375, 4.212646484375, 4.900390625, 5.588134765625, 6.27587890625, 6.963623046875, 7.6513671875, 8.339111328125, 9.02685546875, 9.714599609375, 10.40234375, 11.090087890625, 11.77783203125, 12.465576171875, 13.1533203125, 13.841064453125, 14.52880859375, 15.216552734375, 15.904296875, 16.592041015625, 17.27978515625, 17.967529296875, 18.6552734375, 19.343017578125, 20.03076171875, 20.718505859375, 21.40625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 5.0, 9.0, 6.0, 10.0, 14.0, 13.0, 16.0, 27.0, 18.0, 18.0, 28.0, 41.0, 32.0, 35.0, 47.0, 36.0, 53.0, 48.0, 49.0, 39.0, 47.0, 46.0, 43.0, 40.0, 36.0, 28.0, 27.0, 21.0, 34.0, 25.0, 18.0, 10.0, 22.0, 10.0, 8.0, 10.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.375, -34.265625, -33.15625, -32.046875, -30.9375, -29.828125, -28.71875, -27.609375, -26.5, -25.390625, -24.28125, -23.171875, -22.0625, -20.953125, -19.84375, -18.734375, -17.625, -16.515625, -15.40625, -14.296875, -13.1875, -12.078125, -10.96875, -9.859375, -8.75, -7.640625, -6.53125, -5.421875, -4.3125, -3.203125, -2.09375, -0.984375, 0.125, 1.234375, 2.34375, 3.453125, 4.5625, 5.671875, 6.78125, 7.890625, 9.0, 10.109375, 11.21875, 12.328125, 13.4375, 14.546875, 15.65625, 16.765625, 17.875, 18.984375, 20.09375, 21.203125, 22.3125, 23.421875, 24.53125, 25.640625, 26.75, 27.859375, 28.96875, 30.078125, 31.1875, 32.296875, 33.40625, 34.515625, 35.625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 9.0, 11.0, 21.0, 34.0, 63.0, 135.0, 193.0, 415.0, 615.0, 1060.0, 1825.0, 3015.0, 4924.0, 7924.0, 12586.0, 19397.0, 29208.0, 43266.0, 62432.0, 86634.0, 118172.0, 154967.0, 195800.0, 236989.0, 278605.0, 310917.0, 334444.0, 341762.0, 336893.0, 316276.0, 283259.0, 242114.0, 201504.0, 159945.0, 122037.0, 90153.0, 65161.0, 45308.0, 30901.0, 20548.0, 13309.0, 8347.0, 5196.0, 3211.0, 1969.0, 1152.0, 682.0, 398.0, 239.0, 119.0, 56.0, 51.0, 21.0, 4.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-20.328125, -19.68408203125, -19.0400390625, -18.39599609375, -17.751953125, -17.10791015625, -16.4638671875, -15.81982421875, -15.17578125, -14.53173828125, -13.8876953125, -13.24365234375, -12.599609375, -11.95556640625, -11.3115234375, -10.66748046875, -10.0234375, -9.37939453125, -8.7353515625, -8.09130859375, -7.447265625, -6.80322265625, -6.1591796875, -5.51513671875, -4.87109375, -4.22705078125, -3.5830078125, -2.93896484375, -2.294921875, -1.65087890625, -1.0068359375, -0.36279296875, 0.28125, 0.92529296875, 1.5693359375, 2.21337890625, 2.857421875, 3.50146484375, 4.1455078125, 4.78955078125, 5.43359375, 6.07763671875, 6.7216796875, 7.36572265625, 8.009765625, 8.65380859375, 9.2978515625, 9.94189453125, 10.5859375, 11.22998046875, 11.8740234375, 12.51806640625, 13.162109375, 13.80615234375, 14.4501953125, 15.09423828125, 15.73828125, 16.38232421875, 17.0263671875, 17.67041015625, 18.314453125, 18.95849609375, 19.6025390625, 20.24658203125, 20.890625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 12.0, 10.0, 19.0, 21.0, 15.0, 36.0, 28.0, 40.0, 35.0, 64.0, 76.0, 72.0, 86.0, 107.0, 109.0, 136.0, 129.0, 138.0, 138.0, 172.0, 171.0, 180.0, 157.0, 162.0, 187.0, 179.0, 175.0, 165.0, 153.0, 158.0, 133.0, 111.0, 99.0, 90.0, 71.0, 82.0, 56.0, 47.0, 51.0, 34.0, 46.0, 19.0, 25.0, 17.0, 12.0, 6.0, 10.0, 15.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-12.546875, -12.15478515625, -11.7626953125, -11.37060546875, -10.978515625, -10.58642578125, -10.1943359375, -9.80224609375, -9.41015625, -9.01806640625, -8.6259765625, -8.23388671875, -7.841796875, -7.44970703125, -7.0576171875, -6.66552734375, -6.2734375, -5.88134765625, -5.4892578125, -5.09716796875, -4.705078125, -4.31298828125, -3.9208984375, -3.52880859375, -3.13671875, -2.74462890625, -2.3525390625, -1.96044921875, -1.568359375, -1.17626953125, -0.7841796875, -0.39208984375, 0.0, 0.39208984375, 0.7841796875, 1.17626953125, 1.568359375, 1.96044921875, 2.3525390625, 2.74462890625, 3.13671875, 3.52880859375, 3.9208984375, 4.31298828125, 4.705078125, 5.09716796875, 5.4892578125, 5.88134765625, 6.2734375, 6.66552734375, 7.0576171875, 7.44970703125, 7.841796875, 8.23388671875, 8.6259765625, 9.01806640625, 9.41015625, 9.80224609375, 10.1943359375, 10.58642578125, 10.978515625, 11.37060546875, 11.7626953125, 12.15478515625, 12.546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 8.0, 14.0, 12.0, 19.0, 20.0, 16.0, 26.0, 21.0, 25.0, 38.0, 34.0, 29.0, 39.0, 42.0, 49.0, 42.0, 41.0, 43.0, 43.0, 53.0, 35.0, 45.0, 30.0, 32.0, 26.0, 22.0, 25.0, 33.0, 22.0, 17.0, 14.0, 11.0, 16.0, 11.0, 3.0, 12.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25745391845703, -29.222204208374023, -28.186954498291016, -27.15170669555664, -26.116456985473633, -25.081207275390625, -24.045957565307617, -23.01070785522461, -21.975460052490234, -20.940210342407227, -19.90496063232422, -18.869712829589844, -17.834463119506836, -16.799213409423828, -15.76396369934082, -14.728713989257812, -13.693464279174805, -12.658214569091797, -11.622965812683105, -10.587716102600098, -9.552467346191406, -8.517217636108398, -7.481967926025391, -6.446718692779541, -5.411469459533691, -4.376220226287842, -3.340970754623413, -2.3057212829589844, -1.2704720497131348, -0.23522281646728516, 0.8000268936157227, 1.8352761268615723, 2.870525360107422, 3.9057745933532715, 4.941023826599121, 5.976273536682129, 7.0115227699279785, 8.046772003173828, 9.082021713256836, 10.117271423339844, 11.152520179748535, 12.187769889831543, 13.223018646240234, 14.258268356323242, 15.29351806640625, 16.328765869140625, 17.364017486572266, 18.39926528930664, 19.43451499938965, 20.469764709472656, 21.505014419555664, 22.540264129638672, 23.575511932373047, 24.610761642456055, 25.646011352539062, 26.68126106262207, 27.716510772705078, 28.751760482788086, 29.787010192871094, 30.82225799560547, 31.857507705688477, 32.892757415771484, 33.928009033203125, 34.9632568359375, 35.998504638671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 13.0, 7.0, 5.0, 6.0, 11.0, 13.0, 16.0, 17.0, 20.0, 35.0, 27.0, 31.0, 24.0, 34.0, 32.0, 38.0, 40.0, 57.0, 42.0, 36.0, 47.0, 44.0, 44.0, 50.0, 40.0, 33.0, 31.0, 26.0, 29.0, 17.0, 31.0, 22.0, 18.0, 14.0, 10.0, 10.0, 8.0, 1.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.57291030883789, -38.352291107177734, -37.13167190551758, -35.91105270385742, -34.690433502197266, -33.469810485839844, -32.24919128417969, -31.02857208251953, -29.807952880859375, -28.58733367919922, -27.366714477539062, -26.146095275878906, -24.925474166870117, -23.70485496520996, -22.484235763549805, -21.263614654541016, -20.042997360229492, -18.822378158569336, -17.60175895690918, -16.38113784790039, -15.160518646240234, -13.939899444580078, -12.719280242919922, -11.49866008758545, -10.278040885925293, -9.057421684265137, -7.836801528930664, -6.616182327270508, -5.395562648773193, -4.174942970275879, -2.9543237686157227, -1.73370361328125, -0.5130844116210938, 0.7075351476669312, 1.928154706954956, 3.1487741470336914, 4.369393825531006, 5.59001350402832, 6.810632705688477, 8.03125286102295, 9.251872062683105, 10.472491264343262, 11.693111419677734, 12.91373062133789, 14.134349822998047, 15.35496997833252, 16.57558822631836, 17.79620933532715, 19.016828536987305, 20.23744773864746, 21.458066940307617, 22.678688049316406, 23.899307250976562, 25.11992645263672, 26.340545654296875, 27.56116485595703, 28.781784057617188, 30.002403259277344, 31.2230224609375, 32.443641662597656, 33.66426086425781, 34.88488006591797, 36.105499267578125, 37.32612228393555, 38.5467414855957]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 13.0, 21.0, 26.0, 53.0, 72.0, 102.0, 137.0, 233.0, 327.0, 524.0, 792.0, 1161.0, 1765.0, 2832.0, 4303.0, 6671.0, 10496.0, 16467.0, 26794.0, 42150.0, 67276.0, 103924.0, 145338.0, 168493.0, 149633.0, 107922.0, 70503.0, 44285.0, 27893.0, 17476.0, 10886.0, 6995.0, 4529.0, 2897.0, 1921.0, 1190.0, 831.0, 562.0, 362.0, 258.0, 147.0, 104.0, 72.0, 48.0, 32.0, 18.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.421875, -5.26495361328125, -5.1080322265625, -4.95111083984375, -4.794189453125, -4.63726806640625, -4.4803466796875, -4.32342529296875, -4.16650390625, -4.00958251953125, -3.8526611328125, -3.69573974609375, -3.538818359375, -3.38189697265625, -3.2249755859375, -3.06805419921875, -2.9111328125, -2.75421142578125, -2.5972900390625, -2.44036865234375, -2.283447265625, -2.12652587890625, -1.9696044921875, -1.81268310546875, -1.65576171875, -1.49884033203125, -1.3419189453125, -1.18499755859375, -1.028076171875, -0.87115478515625, -0.7142333984375, -0.55731201171875, -0.400390625, -0.24346923828125, -0.0865478515625, 0.07037353515625, 0.227294921875, 0.38421630859375, 0.5411376953125, 0.69805908203125, 0.85498046875, 1.01190185546875, 1.1688232421875, 1.32574462890625, 1.482666015625, 1.63958740234375, 1.7965087890625, 1.95343017578125, 2.1103515625, 2.26727294921875, 2.4241943359375, 2.58111572265625, 2.738037109375, 2.89495849609375, 3.0518798828125, 3.20880126953125, 3.36572265625, 3.52264404296875, 3.6795654296875, 3.83648681640625, 3.993408203125, 4.15032958984375, 4.3072509765625, 4.46417236328125, 4.62109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 9.0, 3.0, 7.0, 10.0, 13.0, 17.0, 16.0, 20.0, 36.0, 26.0, 30.0, 25.0, 36.0, 30.0, 38.0, 41.0, 53.0, 44.0, 37.0, 47.0, 43.0, 42.0, 52.0, 39.0, 35.0, 28.0, 28.0, 29.0, 17.0, 30.0, 23.0, 18.0, 15.0, 10.0, 10.0, 8.0, 1.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.37548828125, -37.1572265625, -35.93896484375, -34.720703125, -33.50244140625, -32.2841796875, -31.06591796875, -29.84765625, -28.62939453125, -27.4111328125, -26.19287109375, -24.974609375, -23.75634765625, -22.5380859375, -21.31982421875, -20.1015625, -18.88330078125, -17.6650390625, -16.44677734375, -15.228515625, -14.01025390625, -12.7919921875, -11.57373046875, -10.35546875, -9.13720703125, -7.9189453125, -6.70068359375, -5.482421875, -4.26416015625, -3.0458984375, -1.82763671875, -0.609375, 0.60888671875, 1.8271484375, 3.04541015625, 4.263671875, 5.48193359375, 6.7001953125, 7.91845703125, 9.13671875, 10.35498046875, 11.5732421875, 12.79150390625, 14.009765625, 15.22802734375, 16.4462890625, 17.66455078125, 18.8828125, 20.10107421875, 21.3193359375, 22.53759765625, 23.755859375, 24.97412109375, 26.1923828125, 27.41064453125, 28.62890625, 29.84716796875, 31.0654296875, 32.28369140625, 33.501953125, 34.72021484375, 35.9384765625, 37.15673828125, 38.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 12.0, 12.0, 26.0, 34.0, 46.0, 67.0, 82.0, 125.0, 185.0, 279.0, 420.0, 618.0, 869.0, 1353.0, 2065.0, 3389.0, 5630.0, 10170.0, 19154.0, 39443.0, 89468.0, 206194.0, 310075.0, 194007.0, 84118.0, 37551.0, 18335.0, 9831.0, 5546.0, 3331.0, 2046.0, 1302.0, 900.0, 576.0, 389.0, 270.0, 183.0, 130.0, 95.0, 63.0, 46.0, 46.0, 12.0, 20.0, 6.0, 13.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-6.83984375, -6.629150390625, -6.41845703125, -6.207763671875, -5.9970703125, -5.786376953125, -5.57568359375, -5.364990234375, -5.154296875, -4.943603515625, -4.73291015625, -4.522216796875, -4.3115234375, -4.100830078125, -3.89013671875, -3.679443359375, -3.46875, -3.258056640625, -3.04736328125, -2.836669921875, -2.6259765625, -2.415283203125, -2.20458984375, -1.993896484375, -1.783203125, -1.572509765625, -1.36181640625, -1.151123046875, -0.9404296875, -0.729736328125, -0.51904296875, -0.308349609375, -0.09765625, 0.113037109375, 0.32373046875, 0.534423828125, 0.7451171875, 0.955810546875, 1.16650390625, 1.377197265625, 1.587890625, 1.798583984375, 2.00927734375, 2.219970703125, 2.4306640625, 2.641357421875, 2.85205078125, 3.062744140625, 3.2734375, 3.484130859375, 3.69482421875, 3.905517578125, 4.1162109375, 4.326904296875, 4.53759765625, 4.748291015625, 4.958984375, 5.169677734375, 5.38037109375, 5.591064453125, 5.8017578125, 6.012451171875, 6.22314453125, 6.433837890625, 6.64453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 11.0, 8.0, 12.0, 13.0, 13.0, 20.0, 35.0, 21.0, 23.0, 36.0, 29.0, 43.0, 39.0, 46.0, 43.0, 40.0, 47.0, 43.0, 42.0, 42.0, 43.0, 28.0, 32.0, 27.0, 38.0, 25.0, 39.0, 24.0, 24.0, 21.0, 16.0, 17.0, 8.0, 10.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.328125, -22.47314453125, -21.6181640625, -20.76318359375, -19.908203125, -19.05322265625, -18.1982421875, -17.34326171875, -16.48828125, -15.63330078125, -14.7783203125, -13.92333984375, -13.068359375, -12.21337890625, -11.3583984375, -10.50341796875, -9.6484375, -8.79345703125, -7.9384765625, -7.08349609375, -6.228515625, -5.37353515625, -4.5185546875, -3.66357421875, -2.80859375, -1.95361328125, -1.0986328125, -0.24365234375, 0.611328125, 1.46630859375, 2.3212890625, 3.17626953125, 4.03125, 4.88623046875, 5.7412109375, 6.59619140625, 7.451171875, 8.30615234375, 9.1611328125, 10.01611328125, 10.87109375, 11.72607421875, 12.5810546875, 13.43603515625, 14.291015625, 15.14599609375, 16.0009765625, 16.85595703125, 17.7109375, 18.56591796875, 19.4208984375, 20.27587890625, 21.130859375, 21.98583984375, 22.8408203125, 23.69580078125, 24.55078125, 25.40576171875, 26.2607421875, 27.11572265625, 27.970703125, 28.82568359375, 29.6806640625, 30.53564453125, 31.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 12.0, 10.0, 18.0, 20.0, 35.0, 44.0, 53.0, 96.0, 127.0, 200.0, 306.0, 494.0, 875.0, 1531.0, 3016.0, 5983.0, 13776.0, 39264.0, 166379.0, 605795.0, 149510.0, 36182.0, 12921.0, 5577.0, 2732.0, 1419.0, 803.0, 456.0, 306.0, 186.0, 138.0, 62.0, 69.0, 40.0, 28.0, 20.0, 20.0, 14.0, 13.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.52734375, -6.34332275390625, -6.1593017578125, -5.97528076171875, -5.791259765625, -5.60723876953125, -5.4232177734375, -5.23919677734375, -5.05517578125, -4.87115478515625, -4.6871337890625, -4.50311279296875, -4.319091796875, -4.13507080078125, -3.9510498046875, -3.76702880859375, -3.5830078125, -3.39898681640625, -3.2149658203125, -3.03094482421875, -2.846923828125, -2.66290283203125, -2.4788818359375, -2.29486083984375, -2.11083984375, -1.92681884765625, -1.7427978515625, -1.55877685546875, -1.374755859375, -1.19073486328125, -1.0067138671875, -0.82269287109375, -0.638671875, -0.45465087890625, -0.2706298828125, -0.08660888671875, 0.097412109375, 0.28143310546875, 0.4654541015625, 0.64947509765625, 0.83349609375, 1.01751708984375, 1.2015380859375, 1.38555908203125, 1.569580078125, 1.75360107421875, 1.9376220703125, 2.12164306640625, 2.3056640625, 2.48968505859375, 2.6737060546875, 2.85772705078125, 3.041748046875, 3.22576904296875, 3.4097900390625, 3.59381103515625, 3.77783203125, 3.96185302734375, 4.1458740234375, 4.32989501953125, 4.513916015625, 4.69793701171875, 4.8819580078125, 5.06597900390625, 5.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 6.0, 15.0, 21.0, 18.0, 37.0, 32.0, 43.0, 48.0, 56.0, 62.0, 54.0, 71.0, 68.0, 77.0, 59.0, 50.0, 55.0, 39.0, 29.0, 32.0, 29.0, 11.0, 16.0, 15.0, 8.0, 9.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003352165222167969, -0.0003263428807258606, -0.0003174692392349243, -0.00030859559774398804, -0.00029972195625305176, -0.0002908483147621155, -0.0002819746732711792, -0.0002731010317802429, -0.00026422739028930664, -0.00025535374879837036, -0.0002464801073074341, -0.0002376064658164978, -0.00022873282432556152, -0.00021985918283462524, -0.00021098554134368896, -0.00020211189985275269, -0.0001932382583618164, -0.00018436461687088013, -0.00017549097537994385, -0.00016661733388900757, -0.0001577436923980713, -0.000148870050907135, -0.00013999640941619873, -0.00013112276792526245, -0.00012224912643432617, -0.00011337548494338989, -0.00010450184345245361, -9.562820196151733e-05, -8.675456047058105e-05, -7.788091897964478e-05, -6.90072774887085e-05, -6.013363599777222e-05, -5.125999450683594e-05, -4.238635301589966e-05, -3.351271152496338e-05, -2.46390700340271e-05, -1.576542854309082e-05, -6.891787052154541e-06, 1.9818544387817383e-06, 1.0855495929718018e-05, 1.9729137420654297e-05, 2.8602778911590576e-05, 3.7476420402526855e-05, 4.6350061893463135e-05, 5.5223703384399414e-05, 6.40973448753357e-05, 7.297098636627197e-05, 8.184462785720825e-05, 9.071826934814453e-05, 9.959191083908081e-05, 0.00010846555233001709, 0.00011733919382095337, 0.00012621283531188965, 0.00013508647680282593, 0.0001439601182937622, 0.00015283375978469849, 0.00016170740127563477, 0.00017058104276657104, 0.00017945468425750732, 0.0001883283257484436, 0.00019720196723937988, 0.00020607560873031616, 0.00021494925022125244, 0.00022382289171218872, 0.000232696533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 12.0, 16.0, 31.0, 43.0, 71.0, 103.0, 135.0, 219.0, 275.0, 434.0, 617.0, 931.0, 1449.0, 2111.0, 3176.0, 4973.0, 7540.0, 11719.0, 18724.0, 29830.0, 49912.0, 83122.0, 134215.0, 188560.0, 183075.0, 126139.0, 76817.0, 46474.0, 28477.0, 17639.0, 10824.0, 7119.0, 4644.0, 3067.0, 1985.0, 1298.0, 918.0, 582.0, 412.0, 266.0, 184.0, 130.0, 97.0, 60.0, 33.0, 27.0, 27.0, 16.0, 4.0, 9.0, 4.0, 2.0, 3.0, 1.0], "bins": [-3.896484375, -3.781646728515625, -3.66680908203125, -3.551971435546875, -3.4371337890625, -3.322296142578125, -3.20745849609375, -3.092620849609375, -2.977783203125, -2.862945556640625, -2.74810791015625, -2.633270263671875, -2.5184326171875, -2.403594970703125, -2.28875732421875, -2.173919677734375, -2.05908203125, -1.944244384765625, -1.82940673828125, -1.714569091796875, -1.5997314453125, -1.484893798828125, -1.37005615234375, -1.255218505859375, -1.140380859375, -1.025543212890625, -0.91070556640625, -0.795867919921875, -0.6810302734375, -0.566192626953125, -0.45135498046875, -0.336517333984375, -0.2216796875, -0.106842041015625, 0.00799560546875, 0.122833251953125, 0.2376708984375, 0.352508544921875, 0.46734619140625, 0.582183837890625, 0.697021484375, 0.811859130859375, 0.92669677734375, 1.041534423828125, 1.1563720703125, 1.271209716796875, 1.38604736328125, 1.500885009765625, 1.61572265625, 1.730560302734375, 1.84539794921875, 1.960235595703125, 2.0750732421875, 2.189910888671875, 2.30474853515625, 2.419586181640625, 2.534423828125, 2.649261474609375, 2.76409912109375, 2.878936767578125, 2.9937744140625, 3.108612060546875, 3.22344970703125, 3.338287353515625, 3.453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 11.0, 19.0, 19.0, 23.0, 33.0, 36.0, 35.0, 51.0, 45.0, 61.0, 72.0, 68.0, 73.0, 64.0, 57.0, 51.0, 38.0, 42.0, 35.0, 15.0, 21.0, 13.0, 16.0, 13.0, 8.0, 6.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.217559814453125, -2.14801025390625, -2.078460693359375, -2.0089111328125, -1.939361572265625, -1.86981201171875, -1.800262451171875, -1.730712890625, -1.661163330078125, -1.59161376953125, -1.522064208984375, -1.4525146484375, -1.382965087890625, -1.31341552734375, -1.243865966796875, -1.17431640625, -1.104766845703125, -1.03521728515625, -0.965667724609375, -0.8961181640625, -0.826568603515625, -0.75701904296875, -0.687469482421875, -0.617919921875, -0.548370361328125, -0.47882080078125, -0.409271240234375, -0.3397216796875, -0.270172119140625, -0.20062255859375, -0.131072998046875, -0.0615234375, 0.008026123046875, 0.07757568359375, 0.147125244140625, 0.2166748046875, 0.286224365234375, 0.35577392578125, 0.425323486328125, 0.494873046875, 0.564422607421875, 0.63397216796875, 0.703521728515625, 0.7730712890625, 0.842620849609375, 0.91217041015625, 0.981719970703125, 1.05126953125, 1.120819091796875, 1.19036865234375, 1.259918212890625, 1.3294677734375, 1.399017333984375, 1.46856689453125, 1.538116455078125, 1.607666015625, 1.677215576171875, 1.74676513671875, 1.816314697265625, 1.8858642578125, 1.955413818359375, 2.02496337890625, 2.094512939453125, 2.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 3.0, 10.0, 16.0, 11.0, 22.0, 15.0, 20.0, 23.0, 19.0, 30.0, 34.0, 28.0, 32.0, 44.0, 39.0, 48.0, 40.0, 50.0, 41.0, 47.0, 36.0, 39.0, 48.0, 34.0, 25.0, 32.0, 16.0, 30.0, 31.0, 26.0, 17.0, 13.0, 14.0, 11.0, 14.0, 7.0, 5.0, 7.0, 5.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.098224639892578, -29.06899642944336, -28.039766311645508, -27.01053810119629, -25.981307983398438, -24.95207977294922, -23.9228515625, -22.89362335205078, -21.86439323425293, -20.83516502380371, -19.80593490600586, -18.77670669555664, -17.747478485107422, -16.71824836730957, -15.689020156860352, -14.659790992736816, -13.630561828613281, -12.601332664489746, -11.572103500366211, -10.542875289916992, -9.513646125793457, -8.484416961669922, -7.455188274383545, -6.425959587097168, -5.396730422973633, -4.367501258850098, -3.3382725715637207, -2.3090436458587646, -1.2798147201538086, -0.25058555603027344, 0.7786431312561035, 1.8078718185424805, 2.8371009826660156, 3.8663299083709717, 4.895558834075928, 5.924787521362305, 6.95401668548584, 7.983245849609375, 9.012474060058594, 10.041703224182129, 11.070932388305664, 12.1001615524292, 13.129390716552734, 14.158618927001953, 15.187848091125488, 16.217077255249023, 17.246305465698242, 18.275535583496094, 19.304763793945312, 20.33399200439453, 21.363222122192383, 22.3924503326416, 23.421680450439453, 24.450908660888672, 25.48013687133789, 26.50936508178711, 27.53859519958496, 28.56782341003418, 29.59705352783203, 30.62628173828125, 31.65550994873047, 32.68473815917969, 33.71397018432617, 34.74319839477539, 35.77242660522461]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 8.0, 7.0, 6.0, 11.0, 15.0, 14.0, 13.0, 25.0, 33.0, 25.0, 30.0, 27.0, 34.0, 39.0, 30.0, 46.0, 42.0, 49.0, 39.0, 43.0, 50.0, 42.0, 57.0, 32.0, 35.0, 32.0, 22.0, 27.0, 23.0, 28.0, 26.0, 14.0, 15.0, 13.0, 5.0, 10.0, 3.0, 1.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.76948928833008, -38.54486846923828, -37.32024383544922, -36.09562301635742, -34.87099838256836, -33.64637756347656, -32.4217529296875, -31.197132110595703, -29.97250747680664, -28.74788475036621, -27.52326202392578, -26.29863929748535, -25.074016571044922, -23.849393844604492, -22.624771118164062, -21.400150299072266, -20.175527572631836, -18.950904846191406, -17.726282119750977, -16.501659393310547, -15.277036666870117, -14.052413940429688, -12.827792167663574, -11.603169441223145, -10.378546714782715, -9.153923988342285, -7.9293012619018555, -6.704679012298584, -5.480056285858154, -4.255433559417725, -3.030811309814453, -1.8061885833740234, -0.5815658569335938, 0.6430567502975464, 1.8676793575286865, 3.092301845550537, 4.316924571990967, 5.5415472984313965, 6.766169548034668, 7.990792274475098, 9.215415000915527, 10.440037727355957, 11.664660453796387, 12.8892822265625, 14.11390495300293, 15.33852767944336, 16.56315040588379, 17.78777313232422, 19.01239585876465, 20.237018585205078, 21.461641311645508, 22.686264038085938, 23.910886764526367, 25.135509490966797, 26.360130310058594, 27.584754943847656, 28.809375762939453, 30.033998489379883, 31.258621215820312, 32.48324203491211, 33.70786666870117, 34.93248748779297, 36.15711212158203, 37.38173294067383, 38.60635757446289]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 10.0, 31.0, 33.0, 44.0, 87.0, 130.0, 235.0, 409.0, 545.0, 866.0, 1347.0, 2044.0, 3231.0, 4827.0, 6937.0, 10294.0, 14626.0, 21096.0, 28091.0, 37632.0, 47749.0, 59750.0, 70403.0, 79783.0, 86043.0, 88503.0, 86132.0, 80505.0, 71218.0, 60017.0, 48829.0, 38709.0, 29120.0, 21477.0, 15392.0, 10786.0, 7216.0, 5098.0, 3283.0, 2153.0, 1393.0, 875.0, 611.0, 383.0, 219.0, 133.0, 101.0, 56.0, 31.0, 21.0, 23.0, 13.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-16.265625, -15.75, -15.234375, -14.71875, -14.203125, -13.6875, -13.171875, -12.65625, -12.140625, -11.625, -11.109375, -10.59375, -10.078125, -9.5625, -9.046875, -8.53125, -8.015625, -7.5, -6.984375, -6.46875, -5.953125, -5.4375, -4.921875, -4.40625, -3.890625, -3.375, -2.859375, -2.34375, -1.828125, -1.3125, -0.796875, -0.28125, 0.234375, 0.75, 1.265625, 1.78125, 2.296875, 2.8125, 3.328125, 3.84375, 4.359375, 4.875, 5.390625, 5.90625, 6.421875, 6.9375, 7.453125, 7.96875, 8.484375, 9.0, 9.515625, 10.03125, 10.546875, 11.0625, 11.578125, 12.09375, 12.609375, 13.125, 13.640625, 14.15625, 14.671875, 15.1875, 15.703125, 16.21875, 16.734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 4.0, 6.0, 10.0, 14.0, 17.0, 14.0, 21.0, 38.0, 26.0, 27.0, 28.0, 36.0, 34.0, 33.0, 44.0, 42.0, 47.0, 41.0, 41.0, 51.0, 41.0, 57.0, 32.0, 36.0, 27.0, 25.0, 30.0, 21.0, 25.0, 29.0, 13.0, 17.0, 12.0, 6.0, 10.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.75, -37.55810546875, -36.3662109375, -35.17431640625, -33.982421875, -32.79052734375, -31.5986328125, -30.40673828125, -29.21484375, -28.02294921875, -26.8310546875, -25.63916015625, -24.447265625, -23.25537109375, -22.0634765625, -20.87158203125, -19.6796875, -18.48779296875, -17.2958984375, -16.10400390625, -14.912109375, -13.72021484375, -12.5283203125, -11.33642578125, -10.14453125, -8.95263671875, -7.7607421875, -6.56884765625, -5.376953125, -4.18505859375, -2.9931640625, -1.80126953125, -0.609375, 0.58251953125, 1.7744140625, 2.96630859375, 4.158203125, 5.35009765625, 6.5419921875, 7.73388671875, 8.92578125, 10.11767578125, 11.3095703125, 12.50146484375, 13.693359375, 14.88525390625, 16.0771484375, 17.26904296875, 18.4609375, 19.65283203125, 20.8447265625, 22.03662109375, 23.228515625, 24.42041015625, 25.6123046875, 26.80419921875, 27.99609375, 29.18798828125, 30.3798828125, 31.57177734375, 32.763671875, 33.95556640625, 35.1474609375, 36.33935546875, 37.53125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 15.0, 34.0, 53.0, 78.0, 124.0, 224.0, 311.0, 641.0, 870.0, 1411.0, 2076.0, 3164.0, 4857.0, 7163.0, 10425.0, 14941.0, 21042.0, 28782.0, 38204.0, 48965.0, 59787.0, 71117.0, 81015.0, 86629.0, 88805.0, 86452.0, 80180.0, 70874.0, 59567.0, 48120.0, 37639.0, 28420.0, 20714.0, 14666.0, 10366.0, 7136.0, 4789.0, 3180.0, 2086.0, 1294.0, 826.0, 570.0, 319.0, 237.0, 151.0, 83.0, 53.0, 33.0, 23.0, 14.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-16.5, -15.975830078125, -15.45166015625, -14.927490234375, -14.4033203125, -13.879150390625, -13.35498046875, -12.830810546875, -12.306640625, -11.782470703125, -11.25830078125, -10.734130859375, -10.2099609375, -9.685791015625, -9.16162109375, -8.637451171875, -8.11328125, -7.589111328125, -7.06494140625, -6.540771484375, -6.0166015625, -5.492431640625, -4.96826171875, -4.444091796875, -3.919921875, -3.395751953125, -2.87158203125, -2.347412109375, -1.8232421875, -1.299072265625, -0.77490234375, -0.250732421875, 0.2734375, 0.797607421875, 1.32177734375, 1.845947265625, 2.3701171875, 2.894287109375, 3.41845703125, 3.942626953125, 4.466796875, 4.990966796875, 5.51513671875, 6.039306640625, 6.5634765625, 7.087646484375, 7.61181640625, 8.135986328125, 8.66015625, 9.184326171875, 9.70849609375, 10.232666015625, 10.7568359375, 11.281005859375, 11.80517578125, 12.329345703125, 12.853515625, 13.377685546875, 13.90185546875, 14.426025390625, 14.9501953125, 15.474365234375, 15.99853515625, 16.522705078125, 17.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 14.0, 10.0, 9.0, 14.0, 13.0, 10.0, 27.0, 16.0, 18.0, 25.0, 21.0, 31.0, 29.0, 46.0, 33.0, 39.0, 28.0, 27.0, 34.0, 41.0, 39.0, 38.0, 49.0, 42.0, 36.0, 27.0, 38.0, 27.0, 27.0, 21.0, 15.0, 26.0, 21.0, 20.0, 10.0, 9.0, 14.0, 11.0, 8.0, 5.0, 7.0, 1.0, 7.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.4345703125, -20.728515625, -20.0224609375, -19.31640625, -18.6103515625, -17.904296875, -17.1982421875, -16.4921875, -15.7861328125, -15.080078125, -14.3740234375, -13.66796875, -12.9619140625, -12.255859375, -11.5498046875, -10.84375, -10.1376953125, -9.431640625, -8.7255859375, -8.01953125, -7.3134765625, -6.607421875, -5.9013671875, -5.1953125, -4.4892578125, -3.783203125, -3.0771484375, -2.37109375, -1.6650390625, -0.958984375, -0.2529296875, 0.453125, 1.1591796875, 1.865234375, 2.5712890625, 3.27734375, 3.9833984375, 4.689453125, 5.3955078125, 6.1015625, 6.8076171875, 7.513671875, 8.2197265625, 8.92578125, 9.6318359375, 10.337890625, 11.0439453125, 11.75, 12.4560546875, 13.162109375, 13.8681640625, 14.57421875, 15.2802734375, 15.986328125, 16.6923828125, 17.3984375, 18.1044921875, 18.810546875, 19.5166015625, 20.22265625, 20.9287109375, 21.634765625, 22.3408203125, 23.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 13.0, 16.0, 36.0, 52.0, 83.0, 121.0, 176.0, 300.0, 419.0, 678.0, 1158.0, 1738.0, 2732.0, 4284.0, 6489.0, 9930.0, 14869.0, 21193.0, 30163.0, 41211.0, 53412.0, 67100.0, 79719.0, 89975.0, 94945.0, 95641.0, 90527.0, 80396.0, 68480.0, 54235.0, 41678.0, 30780.0, 21677.0, 15071.0, 10176.0, 6762.0, 4452.0, 2822.0, 1801.0, 1187.0, 789.0, 475.0, 273.0, 179.0, 117.0, 74.0, 52.0, 33.0, 26.0, 10.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0], "bins": [-7.8671875, -7.6290283203125, -7.390869140625, -7.1527099609375, -6.91455078125, -6.6763916015625, -6.438232421875, -6.2000732421875, -5.9619140625, -5.7237548828125, -5.485595703125, -5.2474365234375, -5.00927734375, -4.7711181640625, -4.532958984375, -4.2947998046875, -4.056640625, -3.8184814453125, -3.580322265625, -3.3421630859375, -3.10400390625, -2.8658447265625, -2.627685546875, -2.3895263671875, -2.1513671875, -1.9132080078125, -1.675048828125, -1.4368896484375, -1.19873046875, -0.9605712890625, -0.722412109375, -0.4842529296875, -0.24609375, -0.0079345703125, 0.230224609375, 0.4683837890625, 0.70654296875, 0.9447021484375, 1.182861328125, 1.4210205078125, 1.6591796875, 1.8973388671875, 2.135498046875, 2.3736572265625, 2.61181640625, 2.8499755859375, 3.088134765625, 3.3262939453125, 3.564453125, 3.8026123046875, 4.040771484375, 4.2789306640625, 4.51708984375, 4.7552490234375, 4.993408203125, 5.2315673828125, 5.4697265625, 5.7078857421875, 5.946044921875, 6.1842041015625, 6.42236328125, 6.6605224609375, 6.898681640625, 7.1368408203125, 7.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 19.0, 12.0, 13.0, 20.0, 22.0, 25.0, 24.0, 22.0, 32.0, 33.0, 40.0, 45.0, 44.0, 31.0, 27.0, 33.0, 54.0, 42.0, 40.0, 47.0, 51.0, 29.0, 32.0, 35.0, 25.0, 26.0, 24.0, 23.0, 23.0, 14.0, 13.0, 13.0, 8.0, 7.0, 9.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010309219360351562, -0.0009992718696594238, -0.0009676218032836914, -0.000935971736907959, -0.0009043216705322266, -0.0008726716041564941, -0.0008410215377807617, -0.0008093714714050293, -0.0007777214050292969, -0.0007460713386535645, -0.000714421272277832, -0.0006827712059020996, -0.0006511211395263672, -0.0006194710731506348, -0.0005878210067749023, -0.0005561709403991699, -0.0005245208740234375, -0.0004928708076477051, -0.00046122074127197266, -0.00042957067489624023, -0.0003979206085205078, -0.0003662705421447754, -0.00033462047576904297, -0.00030297040939331055, -0.0002713203430175781, -0.0002396702766418457, -0.00020802021026611328, -0.00017637014389038086, -0.00014472007751464844, -0.00011307001113891602, -8.14199447631836e-05, -4.976987838745117e-05, -1.811981201171875e-05, 1.3530254364013672e-05, 4.5180320739746094e-05, 7.683038711547852e-05, 0.00010848045349121094, 0.00014013051986694336, 0.00017178058624267578, 0.0002034306526184082, 0.00023508071899414062, 0.00026673078536987305, 0.00029838085174560547, 0.0003300309181213379, 0.0003616809844970703, 0.00039333105087280273, 0.00042498111724853516, 0.0004566311836242676, 0.00048828125, 0.0005199313163757324, 0.0005515813827514648, 0.0005832314491271973, 0.0006148815155029297, 0.0006465315818786621, 0.0006781816482543945, 0.000709831714630127, 0.0007414817810058594, 0.0007731318473815918, 0.0008047819137573242, 0.0008364319801330566, 0.0008680820465087891, 0.0008997321128845215, 0.0009313821792602539, 0.0009630322456359863, 0.0009946823120117188]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 18.0, 16.0, 37.0, 50.0, 70.0, 140.0, 231.0, 308.0, 512.0, 778.0, 1203.0, 1913.0, 2943.0, 4739.0, 7386.0, 11228.0, 17307.0, 26324.0, 37684.0, 53014.0, 70226.0, 88401.0, 102814.0, 110810.0, 108970.0, 99849.0, 84162.0, 65702.0, 48871.0, 34847.0, 23832.0, 15581.0, 10282.0, 6540.0, 4215.0, 2725.0, 1731.0, 1103.0, 709.0, 447.0, 283.0, 177.0, 128.0, 97.0, 57.0, 42.0, 27.0, 11.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.6912841796875, -9.366943359375, -9.0426025390625, -8.71826171875, -8.3939208984375, -8.069580078125, -7.7452392578125, -7.4208984375, -7.0965576171875, -6.772216796875, -6.4478759765625, -6.12353515625, -5.7991943359375, -5.474853515625, -5.1505126953125, -4.826171875, -4.5018310546875, -4.177490234375, -3.8531494140625, -3.52880859375, -3.2044677734375, -2.880126953125, -2.5557861328125, -2.2314453125, -1.9071044921875, -1.582763671875, -1.2584228515625, -0.93408203125, -0.6097412109375, -0.285400390625, 0.0389404296875, 0.36328125, 0.6876220703125, 1.011962890625, 1.3363037109375, 1.66064453125, 1.9849853515625, 2.309326171875, 2.6336669921875, 2.9580078125, 3.2823486328125, 3.606689453125, 3.9310302734375, 4.25537109375, 4.5797119140625, 4.904052734375, 5.2283935546875, 5.552734375, 5.8770751953125, 6.201416015625, 6.5257568359375, 6.85009765625, 7.1744384765625, 7.498779296875, 7.8231201171875, 8.1474609375, 8.4718017578125, 8.796142578125, 9.1204833984375, 9.44482421875, 9.7691650390625, 10.093505859375, 10.4178466796875, 10.7421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 9.0, 17.0, 18.0, 21.0, 14.0, 35.0, 30.0, 39.0, 44.0, 49.0, 48.0, 59.0, 58.0, 56.0, 69.0, 59.0, 54.0, 42.0, 47.0, 45.0, 35.0, 38.0, 16.0, 17.0, 16.0, 8.0, 11.0, 4.0, 4.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.90814208984375, -5.7069091796875, -5.50567626953125, -5.304443359375, -5.10321044921875, -4.9019775390625, -4.70074462890625, -4.49951171875, -4.29827880859375, -4.0970458984375, -3.89581298828125, -3.694580078125, -3.49334716796875, -3.2921142578125, -3.09088134765625, -2.8896484375, -2.68841552734375, -2.4871826171875, -2.28594970703125, -2.084716796875, -1.88348388671875, -1.6822509765625, -1.48101806640625, -1.27978515625, -1.07855224609375, -0.8773193359375, -0.67608642578125, -0.474853515625, -0.27362060546875, -0.0723876953125, 0.12884521484375, 0.330078125, 0.53131103515625, 0.7325439453125, 0.93377685546875, 1.135009765625, 1.33624267578125, 1.5374755859375, 1.73870849609375, 1.93994140625, 2.14117431640625, 2.3424072265625, 2.54364013671875, 2.744873046875, 2.94610595703125, 3.1473388671875, 3.34857177734375, 3.5498046875, 3.75103759765625, 3.9522705078125, 4.15350341796875, 4.354736328125, 4.55596923828125, 4.7572021484375, 4.95843505859375, 5.15966796875, 5.36090087890625, 5.5621337890625, 5.76336669921875, 5.964599609375, 6.16583251953125, 6.3670654296875, 6.56829833984375, 6.76953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 12.0, 7.0, 17.0, 14.0, 15.0, 16.0, 17.0, 31.0, 20.0, 38.0, 32.0, 43.0, 40.0, 31.0, 57.0, 40.0, 45.0, 49.0, 52.0, 43.0, 38.0, 43.0, 24.0, 22.0, 31.0, 24.0, 29.0, 26.0, 23.0, 17.0, 23.0, 13.0, 13.0, 11.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.32360076904297, -30.26119613647461, -29.19879150390625, -28.136384963989258, -27.0739803314209, -26.01157569885254, -24.949169158935547, -23.886764526367188, -22.824359893798828, -21.76195526123047, -20.69955062866211, -19.637144088745117, -18.574739456176758, -17.5123348236084, -16.449928283691406, -15.387523651123047, -14.325119018554688, -13.262714385986328, -12.200308799743652, -11.137903213500977, -10.075498580932617, -9.013093948364258, -7.950688362121582, -6.8882832527160645, -5.825878143310547, -4.763473033905029, -3.7010679244995117, -2.638662815093994, -1.5762577056884766, -0.513852596282959, 0.5485525131225586, 1.6109576225280762, 2.6733627319335938, 3.7357678413391113, 4.798172950744629, 5.8605780601501465, 6.922983169555664, 7.985388278961182, 9.0477933883667, 10.110198974609375, 11.172603607177734, 12.235008239746094, 13.29741382598877, 14.359819412231445, 15.422224044799805, 16.484628677368164, 17.547035217285156, 18.609439849853516, 19.671844482421875, 20.734249114990234, 21.796653747558594, 22.859060287475586, 23.921464920043945, 24.983869552612305, 26.046276092529297, 27.108680725097656, 28.171085357666016, 29.233489990234375, 30.295894622802734, 31.358301162719727, 32.42070770263672, 33.48311233520508, 34.54551696777344, 35.6079216003418, 36.670326232910156]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 8.0, 17.0, 10.0, 14.0, 17.0, 17.0, 13.0, 24.0, 40.0, 21.0, 41.0, 39.0, 26.0, 47.0, 45.0, 47.0, 40.0, 30.0, 49.0, 35.0, 42.0, 44.0, 39.0, 41.0, 34.0, 31.0, 18.0, 24.0, 17.0, 21.0, 18.0, 16.0, 11.0, 12.0, 7.0, 9.0, 8.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-43.800445556640625, -42.559967041015625, -41.319488525390625, -40.079010009765625, -38.838531494140625, -37.598052978515625, -36.357574462890625, -35.117095947265625, -33.876617431640625, -32.636138916015625, -31.395660400390625, -30.155181884765625, -28.914703369140625, -27.674224853515625, -26.433748245239258, -25.193269729614258, -23.95279312133789, -22.71231460571289, -21.47183609008789, -20.23135757446289, -18.99087905883789, -17.75040054321289, -16.509923934936523, -15.269445419311523, -14.028966903686523, -12.788488388061523, -11.548009872436523, -10.30753231048584, -9.06705379486084, -7.82657527923584, -6.586097240447998, -5.345619201660156, -4.105140686035156, -2.8646624088287354, -1.6241841316223145, -0.38370585441589355, 0.8567724227905273, 2.0972509384155273, 3.337728977203369, 4.578207015991211, 5.818685531616211, 7.059164047241211, 8.299642562866211, 9.540120124816895, 10.780598640441895, 12.021077156066895, 13.261554718017578, 14.502033233642578, 15.742511749267578, 16.982990264892578, 18.223468780517578, 19.463947296142578, 20.704425811767578, 21.944904327392578, 23.185380935668945, 24.425859451293945, 25.666337966918945, 26.906816482543945, 28.147294998168945, 29.387773513793945, 30.628250122070312, 31.868728637695312, 33.10920715332031, 34.34968566894531, 35.59016418457031]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 13.0, 12.0, 25.0, 32.0, 51.0, 111.0, 151.0, 289.0, 434.0, 778.0, 1265.0, 1974.0, 3366.0, 5265.0, 8420.0, 13238.0, 20618.0, 31371.0, 47979.0, 69343.0, 97788.0, 135348.0, 178086.0, 229624.0, 278767.0, 323072.0, 357010.0, 373244.0, 369504.0, 345760.0, 305699.0, 258341.0, 207236.0, 158982.0, 118180.0, 84629.0, 58540.0, 39492.0, 25818.0, 16791.0, 10769.0, 6663.0, 4045.0, 2487.0, 1512.0, 935.0, 536.0, 300.0, 188.0, 84.0, 50.0, 32.0, 13.0, 14.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-21.078125, -20.414794921875, -19.75146484375, -19.088134765625, -18.4248046875, -17.761474609375, -17.09814453125, -16.434814453125, -15.771484375, -15.108154296875, -14.44482421875, -13.781494140625, -13.1181640625, -12.454833984375, -11.79150390625, -11.128173828125, -10.46484375, -9.801513671875, -9.13818359375, -8.474853515625, -7.8115234375, -7.148193359375, -6.48486328125, -5.821533203125, -5.158203125, -4.494873046875, -3.83154296875, -3.168212890625, -2.5048828125, -1.841552734375, -1.17822265625, -0.514892578125, 0.1484375, 0.811767578125, 1.47509765625, 2.138427734375, 2.8017578125, 3.465087890625, 4.12841796875, 4.791748046875, 5.455078125, 6.118408203125, 6.78173828125, 7.445068359375, 8.1083984375, 8.771728515625, 9.43505859375, 10.098388671875, 10.76171875, 11.425048828125, 12.08837890625, 12.751708984375, 13.4150390625, 14.078369140625, 14.74169921875, 15.405029296875, 16.068359375, 16.731689453125, 17.39501953125, 18.058349609375, 18.7216796875, 19.385009765625, 20.04833984375, 20.711669921875, 21.375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 12.0, 12.0, 16.0, 14.0, 18.0, 16.0, 17.0, 33.0, 31.0, 38.0, 37.0, 30.0, 45.0, 39.0, 45.0, 45.0, 31.0, 43.0, 36.0, 48.0, 40.0, 43.0, 35.0, 34.0, 35.0, 26.0, 19.0, 18.0, 20.0, 19.0, 19.0, 10.0, 12.0, 10.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.28125, -37.205322265625, -36.12939453125, -35.053466796875, -33.9775390625, -32.901611328125, -31.82568359375, -30.749755859375, -29.673828125, -28.597900390625, -27.52197265625, -26.446044921875, -25.3701171875, -24.294189453125, -23.21826171875, -22.142333984375, -21.06640625, -19.990478515625, -18.91455078125, -17.838623046875, -16.7626953125, -15.686767578125, -14.61083984375, -13.534912109375, -12.458984375, -11.383056640625, -10.30712890625, -9.231201171875, -8.1552734375, -7.079345703125, -6.00341796875, -4.927490234375, -3.8515625, -2.775634765625, -1.69970703125, -0.623779296875, 0.4521484375, 1.528076171875, 2.60400390625, 3.679931640625, 4.755859375, 5.831787109375, 6.90771484375, 7.983642578125, 9.0595703125, 10.135498046875, 11.21142578125, 12.287353515625, 13.36328125, 14.439208984375, 15.51513671875, 16.591064453125, 17.6669921875, 18.742919921875, 19.81884765625, 20.894775390625, 21.970703125, 23.046630859375, 24.12255859375, 25.198486328125, 26.2744140625, 27.350341796875, 28.42626953125, 29.502197265625, 30.578125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 24.0, 34.0, 44.0, 77.0, 167.0, 286.0, 509.0, 851.0, 1447.0, 2416.0, 3860.0, 6199.0, 9867.0, 15076.0, 23595.0, 34799.0, 49971.0, 70414.0, 96981.0, 127712.0, 164477.0, 202910.0, 243498.0, 279920.0, 308627.0, 326733.0, 331818.0, 324422.0, 303976.0, 271296.0, 233913.0, 193321.0, 155416.0, 120227.0, 89512.0, 65183.0, 45498.0, 31727.0, 21149.0, 13566.0, 8658.0, 5518.0, 3410.0, 2143.0, 1264.0, 779.0, 469.0, 232.0, 139.0, 57.0, 46.0, 28.0, 13.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.75, -19.099853515625, -18.44970703125, -17.799560546875, -17.1494140625, -16.499267578125, -15.84912109375, -15.198974609375, -14.548828125, -13.898681640625, -13.24853515625, -12.598388671875, -11.9482421875, -11.298095703125, -10.64794921875, -9.997802734375, -9.34765625, -8.697509765625, -8.04736328125, -7.397216796875, -6.7470703125, -6.096923828125, -5.44677734375, -4.796630859375, -4.146484375, -3.496337890625, -2.84619140625, -2.196044921875, -1.5458984375, -0.895751953125, -0.24560546875, 0.404541015625, 1.0546875, 1.704833984375, 2.35498046875, 3.005126953125, 3.6552734375, 4.305419921875, 4.95556640625, 5.605712890625, 6.255859375, 6.906005859375, 7.55615234375, 8.206298828125, 8.8564453125, 9.506591796875, 10.15673828125, 10.806884765625, 11.45703125, 12.107177734375, 12.75732421875, 13.407470703125, 14.0576171875, 14.707763671875, 15.35791015625, 16.008056640625, 16.658203125, 17.308349609375, 17.95849609375, 18.608642578125, 19.2587890625, 19.908935546875, 20.55908203125, 21.209228515625, 21.859375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 12.0, 6.0, 13.0, 20.0, 22.0, 21.0, 35.0, 42.0, 44.0, 55.0, 83.0, 91.0, 107.0, 114.0, 137.0, 147.0, 151.0, 186.0, 204.0, 193.0, 214.0, 213.0, 184.0, 200.0, 177.0, 176.0, 173.0, 150.0, 145.0, 122.0, 107.0, 116.0, 75.0, 76.0, 55.0, 38.0, 49.0, 34.0, 18.0, 17.0, 16.0, 17.0, 6.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.5797119140625, -13.120361328125, -12.6610107421875, -12.20166015625, -11.7423095703125, -11.282958984375, -10.8236083984375, -10.3642578125, -9.9049072265625, -9.445556640625, -8.9862060546875, -8.52685546875, -8.0675048828125, -7.608154296875, -7.1488037109375, -6.689453125, -6.2301025390625, -5.770751953125, -5.3114013671875, -4.85205078125, -4.3927001953125, -3.933349609375, -3.4739990234375, -3.0146484375, -2.5552978515625, -2.095947265625, -1.6365966796875, -1.17724609375, -0.7178955078125, -0.258544921875, 0.2008056640625, 0.66015625, 1.1195068359375, 1.578857421875, 2.0382080078125, 2.49755859375, 2.9569091796875, 3.416259765625, 3.8756103515625, 4.3349609375, 4.7943115234375, 5.253662109375, 5.7130126953125, 6.17236328125, 6.6317138671875, 7.091064453125, 7.5504150390625, 8.009765625, 8.4691162109375, 8.928466796875, 9.3878173828125, 9.84716796875, 10.3065185546875, 10.765869140625, 11.2252197265625, 11.6845703125, 12.1439208984375, 12.603271484375, 13.0626220703125, 13.52197265625, 13.9813232421875, 14.440673828125, 14.9000244140625, 15.359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 6.0, 7.0, 8.0, 13.0, 10.0, 10.0, 18.0, 16.0, 17.0, 25.0, 34.0, 28.0, 24.0, 28.0, 41.0, 34.0, 43.0, 40.0, 44.0, 39.0, 41.0, 40.0, 40.0, 35.0, 41.0, 40.0, 26.0, 29.0, 21.0, 29.0, 24.0, 20.0, 17.0, 19.0, 13.0, 8.0, 11.0, 13.0, 8.0, 7.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.375167846679688, -29.360464096069336, -28.345760345458984, -27.3310546875, -26.31635093688965, -25.301647186279297, -24.286941528320312, -23.27223777770996, -22.25753402709961, -21.242830276489258, -20.228126525878906, -19.213420867919922, -18.19871711730957, -17.18401336669922, -16.169307708740234, -15.154603958129883, -14.139900207519531, -13.12519645690918, -12.110491752624512, -11.095787048339844, -10.081083297729492, -9.06637954711914, -8.051674842834473, -7.036970615386963, -6.022266387939453, -5.007562160491943, -3.9928579330444336, -2.978153705596924, -1.963449478149414, -0.9487452507019043, 0.06595897674560547, 1.0806632041931152, 2.0953636169433594, 3.110067844390869, 4.124772071838379, 5.139476299285889, 6.154180526733398, 7.168884754180908, 8.183588981628418, 9.198293685913086, 10.212997436523438, 11.227701187133789, 12.242405891418457, 13.257110595703125, 14.271814346313477, 15.286518096923828, 16.301223754882812, 17.315927505493164, 18.330631256103516, 19.345335006713867, 20.36003875732422, 21.374744415283203, 22.389448165893555, 23.404151916503906, 24.41885757446289, 25.433561325073242, 26.448265075683594, 27.462968826293945, 28.477672576904297, 29.49237823486328, 30.507081985473633, 31.521785736083984, 32.53649139404297, 33.55119323730469, 34.56589889526367]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 14.0, 9.0, 7.0, 12.0, 13.0, 17.0, 10.0, 20.0, 19.0, 23.0, 36.0, 38.0, 29.0, 37.0, 50.0, 34.0, 43.0, 30.0, 39.0, 41.0, 46.0, 27.0, 44.0, 32.0, 35.0, 34.0, 39.0, 21.0, 20.0, 22.0, 23.0, 19.0, 19.0, 19.0, 18.0, 8.0, 11.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.163963317871094, -38.01884460449219, -36.87372970581055, -35.72861099243164, -34.583492279052734, -33.438377380371094, -32.29325866699219, -31.14813995361328, -30.003023147583008, -28.857906341552734, -27.712787628173828, -26.567670822143555, -25.42255401611328, -24.277435302734375, -23.1323184967041, -21.987201690673828, -20.842082977294922, -19.69696617126465, -18.551847457885742, -17.40673065185547, -16.261611938476562, -15.116495132446289, -13.971378326416016, -12.826260566711426, -11.681142807006836, -10.536025047302246, -9.390907287597656, -8.245790481567383, -7.100672721862793, -5.955554962158203, -4.8104376792907715, -3.66532039642334, -2.52020263671875, -1.3750851154327393, -0.22996759414672852, 0.9151499271392822, 2.060267448425293, 3.205385208129883, 4.3505024909973145, 5.495619773864746, 6.640737533569336, 7.785855293273926, 8.930973052978516, 10.076089859008789, 11.221207618713379, 12.366325378417969, 13.511442184448242, 14.656559944152832, 15.801677703857422, 16.946794509887695, 18.0919132232666, 19.237030029296875, 20.38214874267578, 21.527265548706055, 22.672382354736328, 23.817501068115234, 24.962617874145508, 26.10773468017578, 27.252853393554688, 28.39797019958496, 29.543087005615234, 30.68820571899414, 31.833322525024414, 32.97843933105469, 34.123558044433594]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 13.0, 10.0, 15.0, 15.0, 35.0, 37.0, 46.0, 77.0, 128.0, 220.0, 340.0, 538.0, 908.0, 1640.0, 3014.0, 5709.0, 12022.0, 27121.0, 68181.0, 173603.0, 326991.0, 248740.0, 104445.0, 40413.0, 17217.0, 7959.0, 4028.0, 2089.0, 1195.0, 694.0, 396.0, 246.0, 156.0, 114.0, 70.0, 34.0, 31.0, 24.0, 10.0, 14.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.4296875, -11.1097412109375, -10.789794921875, -10.4698486328125, -10.14990234375, -9.8299560546875, -9.510009765625, -9.1900634765625, -8.8701171875, -8.5501708984375, -8.230224609375, -7.9102783203125, -7.59033203125, -7.2703857421875, -6.950439453125, -6.6304931640625, -6.310546875, -5.9906005859375, -5.670654296875, -5.3507080078125, -5.03076171875, -4.7108154296875, -4.390869140625, -4.0709228515625, -3.7509765625, -3.4310302734375, -3.111083984375, -2.7911376953125, -2.47119140625, -2.1512451171875, -1.831298828125, -1.5113525390625, -1.19140625, -0.8714599609375, -0.551513671875, -0.2315673828125, 0.08837890625, 0.4083251953125, 0.728271484375, 1.0482177734375, 1.3681640625, 1.6881103515625, 2.008056640625, 2.3280029296875, 2.64794921875, 2.9678955078125, 3.287841796875, 3.6077880859375, 3.927734375, 4.2476806640625, 4.567626953125, 4.8875732421875, 5.20751953125, 5.5274658203125, 5.847412109375, 6.1673583984375, 6.4873046875, 6.8072509765625, 7.127197265625, 7.4471435546875, 7.76708984375, 8.0870361328125, 8.406982421875, 8.7269287109375, 9.046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 12.0, 8.0, 9.0, 12.0, 12.0, 17.0, 11.0, 18.0, 19.0, 24.0, 35.0, 37.0, 27.0, 38.0, 53.0, 34.0, 40.0, 34.0, 37.0, 42.0, 46.0, 29.0, 40.0, 35.0, 34.0, 35.0, 39.0, 20.0, 21.0, 21.0, 22.0, 21.0, 19.0, 19.0, 17.0, 9.0, 9.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.34375, -38.1982421875, -37.052734375, -35.9072265625, -34.76171875, -33.6162109375, -32.470703125, -31.3251953125, -30.1796875, -29.0341796875, -27.888671875, -26.7431640625, -25.59765625, -24.4521484375, -23.306640625, -22.1611328125, -21.015625, -19.8701171875, -18.724609375, -17.5791015625, -16.43359375, -15.2880859375, -14.142578125, -12.9970703125, -11.8515625, -10.7060546875, -9.560546875, -8.4150390625, -7.26953125, -6.1240234375, -4.978515625, -3.8330078125, -2.6875, -1.5419921875, -0.396484375, 0.7490234375, 1.89453125, 3.0400390625, 4.185546875, 5.3310546875, 6.4765625, 7.6220703125, 8.767578125, 9.9130859375, 11.05859375, 12.2041015625, 13.349609375, 14.4951171875, 15.640625, 16.7861328125, 17.931640625, 19.0771484375, 20.22265625, 21.3681640625, 22.513671875, 23.6591796875, 24.8046875, 25.9501953125, 27.095703125, 28.2412109375, 29.38671875, 30.5322265625, 31.677734375, 32.8232421875, 33.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 12.0, 11.0, 15.0, 20.0, 24.0, 32.0, 49.0, 71.0, 82.0, 108.0, 196.0, 279.0, 429.0, 622.0, 988.0, 1616.0, 2921.0, 5544.0, 11241.0, 25753.0, 69733.0, 216626.0, 409574.0, 193738.0, 62563.0, 23625.0, 10542.0, 5137.0, 2678.0, 1520.0, 925.0, 591.0, 359.0, 270.0, 195.0, 120.0, 79.0, 70.0, 42.0, 41.0, 25.0, 20.0, 20.0, 11.0, 6.0, 10.0, 2.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.2340087890625, -7.944580078125, -7.6551513671875, -7.36572265625, -7.0762939453125, -6.786865234375, -6.4974365234375, -6.2080078125, -5.9185791015625, -5.629150390625, -5.3397216796875, -5.05029296875, -4.7608642578125, -4.471435546875, -4.1820068359375, -3.892578125, -3.6031494140625, -3.313720703125, -3.0242919921875, -2.73486328125, -2.4454345703125, -2.156005859375, -1.8665771484375, -1.5771484375, -1.2877197265625, -0.998291015625, -0.7088623046875, -0.41943359375, -0.1300048828125, 0.159423828125, 0.4488525390625, 0.73828125, 1.0277099609375, 1.317138671875, 1.6065673828125, 1.89599609375, 2.1854248046875, 2.474853515625, 2.7642822265625, 3.0537109375, 3.3431396484375, 3.632568359375, 3.9219970703125, 4.21142578125, 4.5008544921875, 4.790283203125, 5.0797119140625, 5.369140625, 5.6585693359375, 5.947998046875, 6.2374267578125, 6.52685546875, 6.8162841796875, 7.105712890625, 7.3951416015625, 7.6845703125, 7.9739990234375, 8.263427734375, 8.5528564453125, 8.84228515625, 9.1317138671875, 9.421142578125, 9.7105712890625, 10.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 11.0, 8.0, 14.0, 23.0, 20.0, 24.0, 33.0, 24.0, 30.0, 34.0, 43.0, 32.0, 38.0, 48.0, 32.0, 38.0, 43.0, 43.0, 34.0, 38.0, 31.0, 34.0, 29.0, 41.0, 27.0, 24.0, 18.0, 25.0, 20.0, 19.0, 16.0, 16.0, 14.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.671875, -23.877197265625, -23.08251953125, -22.287841796875, -21.4931640625, -20.698486328125, -19.90380859375, -19.109130859375, -18.314453125, -17.519775390625, -16.72509765625, -15.930419921875, -15.1357421875, -14.341064453125, -13.54638671875, -12.751708984375, -11.95703125, -11.162353515625, -10.36767578125, -9.572998046875, -8.7783203125, -7.983642578125, -7.18896484375, -6.394287109375, -5.599609375, -4.804931640625, -4.01025390625, -3.215576171875, -2.4208984375, -1.626220703125, -0.83154296875, -0.036865234375, 0.7578125, 1.552490234375, 2.34716796875, 3.141845703125, 3.9365234375, 4.731201171875, 5.52587890625, 6.320556640625, 7.115234375, 7.909912109375, 8.70458984375, 9.499267578125, 10.2939453125, 11.088623046875, 11.88330078125, 12.677978515625, 13.47265625, 14.267333984375, 15.06201171875, 15.856689453125, 16.6513671875, 17.446044921875, 18.24072265625, 19.035400390625, 19.830078125, 20.624755859375, 21.41943359375, 22.214111328125, 23.0087890625, 23.803466796875, 24.59814453125, 25.392822265625, 26.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 0.0, 9.0, 11.0, 15.0, 18.0, 26.0, 34.0, 40.0, 57.0, 89.0, 140.0, 230.0, 394.0, 712.0, 1368.0, 2887.0, 7044.0, 22541.0, 127347.0, 748534.0, 105366.0, 19759.0, 6390.0, 2637.0, 1254.0, 667.0, 347.0, 216.0, 130.0, 86.0, 65.0, 34.0, 31.0, 15.0, 20.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-10.15625, -9.89886474609375, -9.6414794921875, -9.38409423828125, -9.126708984375, -8.86932373046875, -8.6119384765625, -8.35455322265625, -8.09716796875, -7.83978271484375, -7.5823974609375, -7.32501220703125, -7.067626953125, -6.81024169921875, -6.5528564453125, -6.29547119140625, -6.0380859375, -5.78070068359375, -5.5233154296875, -5.26593017578125, -5.008544921875, -4.75115966796875, -4.4937744140625, -4.23638916015625, -3.97900390625, -3.72161865234375, -3.4642333984375, -3.20684814453125, -2.949462890625, -2.69207763671875, -2.4346923828125, -2.17730712890625, -1.919921875, -1.66253662109375, -1.4051513671875, -1.14776611328125, -0.890380859375, -0.63299560546875, -0.3756103515625, -0.11822509765625, 0.13916015625, 0.39654541015625, 0.6539306640625, 0.91131591796875, 1.168701171875, 1.42608642578125, 1.6834716796875, 1.94085693359375, 2.1982421875, 2.45562744140625, 2.7130126953125, 2.97039794921875, 3.227783203125, 3.48516845703125, 3.7425537109375, 3.99993896484375, 4.25732421875, 4.51470947265625, 4.7720947265625, 5.02947998046875, 5.286865234375, 5.54425048828125, 5.8016357421875, 6.05902099609375, 6.31640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 12.0, 15.0, 21.0, 23.0, 53.0, 70.0, 94.0, 131.0, 145.0, 110.0, 119.0, 72.0, 41.0, 28.0, 32.0, 15.0, 10.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003485679626464844, -0.00033321231603622437, -0.00031785666942596436, -0.00030250102281570435, -0.00028714537620544434, -0.0002717897295951843, -0.0002564340829849243, -0.0002410784363746643, -0.0002257227897644043, -0.0002103671431541443, -0.00019501149654388428, -0.00017965584993362427, -0.00016430020332336426, -0.00014894455671310425, -0.00013358891010284424, -0.00011823326349258423, -0.00010287761688232422, -8.752197027206421e-05, -7.21663236618042e-05, -5.681067705154419e-05, -4.145503044128418e-05, -2.609938383102417e-05, -1.074373722076416e-05, 4.61190938949585e-06, 1.996755599975586e-05, 3.532320261001587e-05, 5.067884922027588e-05, 6.603449583053589e-05, 8.13901424407959e-05, 9.674578905105591e-05, 0.00011210143566131592, 0.00012745708227157593, 0.00014281272888183594, 0.00015816837549209595, 0.00017352402210235596, 0.00018887966871261597, 0.00020423531532287598, 0.00021959096193313599, 0.000234946608543396, 0.000250302255153656, 0.000265657901763916, 0.000281013548374176, 0.00029636919498443604, 0.00031172484159469604, 0.00032708048820495605, 0.00034243613481521606, 0.0003577917814254761, 0.0003731474280357361, 0.0003885030746459961, 0.0004038587212562561, 0.0004192143678665161, 0.0004345700144767761, 0.00044992566108703613, 0.00046528130769729614, 0.00048063695430755615, 0.0004959926009178162, 0.0005113482475280762, 0.0005267038941383362, 0.0005420595407485962, 0.0005574151873588562, 0.0005727708339691162, 0.0005881264805793762, 0.0006034821271896362, 0.0006188377737998962, 0.0006341934204101562]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 15.0, 17.0, 20.0, 31.0, 39.0, 72.0, 99.0, 152.0, 212.0, 322.0, 474.0, 709.0, 1253.0, 2122.0, 4458.0, 11105.0, 35460.0, 139543.0, 494775.0, 265007.0, 61564.0, 17656.0, 6342.0, 2887.0, 1583.0, 893.0, 579.0, 393.0, 236.0, 180.0, 101.0, 87.0, 48.0, 26.0, 25.0, 17.0, 15.0, 10.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0], "bins": [-12.4140625, -12.0933837890625, -11.772705078125, -11.4520263671875, -11.13134765625, -10.8106689453125, -10.489990234375, -10.1693115234375, -9.8486328125, -9.5279541015625, -9.207275390625, -8.8865966796875, -8.56591796875, -8.2452392578125, -7.924560546875, -7.6038818359375, -7.283203125, -6.9625244140625, -6.641845703125, -6.3211669921875, -6.00048828125, -5.6798095703125, -5.359130859375, -5.0384521484375, -4.7177734375, -4.3970947265625, -4.076416015625, -3.7557373046875, -3.43505859375, -3.1143798828125, -2.793701171875, -2.4730224609375, -2.15234375, -1.8316650390625, -1.510986328125, -1.1903076171875, -0.86962890625, -0.5489501953125, -0.228271484375, 0.0924072265625, 0.4130859375, 0.7337646484375, 1.054443359375, 1.3751220703125, 1.69580078125, 2.0164794921875, 2.337158203125, 2.6578369140625, 2.978515625, 3.2991943359375, 3.619873046875, 3.9405517578125, 4.26123046875, 4.5819091796875, 4.902587890625, 5.2232666015625, 5.5439453125, 5.8646240234375, 6.185302734375, 6.5059814453125, 6.82666015625, 7.1473388671875, 7.468017578125, 7.7886962890625, 8.109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 10.0, 9.0, 9.0, 9.0, 18.0, 13.0, 22.0, 18.0, 29.0, 43.0, 51.0, 68.0, 56.0, 69.0, 69.0, 81.0, 65.0, 51.0, 46.0, 42.0, 22.0, 35.0, 22.0, 13.0, 13.0, 14.0, 11.0, 13.0, 7.0, 7.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9691619873046875, -1.909027099609375, -1.8488922119140625, -1.78875732421875, -1.7286224365234375, -1.668487548828125, -1.6083526611328125, -1.5482177734375, -1.4880828857421875, -1.427947998046875, -1.3678131103515625, -1.30767822265625, -1.2475433349609375, -1.187408447265625, -1.1272735595703125, -1.067138671875, -1.0070037841796875, -0.946868896484375, -0.8867340087890625, -0.82659912109375, -0.7664642333984375, -0.706329345703125, -0.6461944580078125, -0.5860595703125, -0.5259246826171875, -0.465789794921875, -0.4056549072265625, -0.34552001953125, -0.2853851318359375, -0.225250244140625, -0.1651153564453125, -0.10498046875, -0.0448455810546875, 0.015289306640625, 0.0754241943359375, 0.13555908203125, 0.1956939697265625, 0.255828857421875, 0.3159637451171875, 0.3760986328125, 0.4362335205078125, 0.496368408203125, 0.5565032958984375, 0.61663818359375, 0.6767730712890625, 0.736907958984375, 0.7970428466796875, 0.857177734375, 0.9173126220703125, 0.977447509765625, 1.0375823974609375, 1.09771728515625, 1.1578521728515625, 1.217987060546875, 1.2781219482421875, 1.3382568359375, 1.3983917236328125, 1.458526611328125, 1.5186614990234375, 1.57879638671875, 1.6389312744140625, 1.699066162109375, 1.7592010498046875, 1.8193359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 6.0, 3.0, 7.0, 5.0, 7.0, 5.0, 6.0, 12.0, 13.0, 11.0, 14.0, 15.0, 17.0, 25.0, 27.0, 31.0, 27.0, 26.0, 35.0, 35.0, 43.0, 46.0, 38.0, 44.0, 38.0, 45.0, 37.0, 37.0, 38.0, 45.0, 29.0, 23.0, 30.0, 25.0, 25.0, 19.0, 19.0, 13.0, 20.0, 13.0, 6.0, 13.0, 7.0, 9.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.806119918823242, -29.78373908996582, -28.76136016845703, -27.73897933959961, -26.71660041809082, -25.6942195892334, -24.67184066772461, -23.649459838867188, -22.627079010009766, -21.604698181152344, -20.582319259643555, -19.559938430786133, -18.537559509277344, -17.515178680419922, -16.4927978515625, -15.470418930053711, -14.448040008544922, -13.425660133361816, -12.403280258178711, -11.380899429321289, -10.3585205078125, -9.336139678955078, -8.313759803771973, -7.291379928588867, -6.269000053405762, -5.246620178222656, -4.224240303039551, -3.201859951019287, -2.1794800758361816, -1.1571002006530762, -0.1347198486328125, 0.887660026550293, 1.9100379943847656, 2.932417869567871, 3.9547979831695557, 4.97717809677124, 5.999557971954346, 7.021937847137451, 8.044318199157715, 9.06669807434082, 10.089077949523926, 11.111457824707031, 12.133837699890137, 13.156217575073242, 14.178598403930664, 15.200977325439453, 16.223358154296875, 17.245738983154297, 18.268117904663086, 19.290498733520508, 20.312877655029297, 21.33525848388672, 22.357637405395508, 23.38001823425293, 24.40239715576172, 25.42477798461914, 26.447158813476562, 27.469539642333984, 28.491918563842773, 29.514299392700195, 30.536678314208984, 31.559059143066406, 32.58143997192383, 33.60382080078125, 34.626197814941406]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 6.0, 9.0, 14.0, 12.0, 14.0, 16.0, 16.0, 22.0, 26.0, 37.0, 36.0, 27.0, 39.0, 45.0, 36.0, 42.0, 32.0, 39.0, 34.0, 46.0, 36.0, 37.0, 37.0, 29.0, 40.0, 32.0, 22.0, 24.0, 19.0, 24.0, 20.0, 21.0, 17.0, 17.0, 11.0, 7.0, 8.0, 7.0, 5.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-39.06671905517578, -37.92647171020508, -36.786224365234375, -35.64597702026367, -34.50572967529297, -33.365482330322266, -32.22523498535156, -31.08498764038086, -29.944740295410156, -28.804492950439453, -27.66424560546875, -26.523998260498047, -25.383750915527344, -24.24350357055664, -23.103256225585938, -21.963008880615234, -20.82276153564453, -19.682514190673828, -18.542266845703125, -17.402019500732422, -16.26177215576172, -15.121524810791016, -13.981277465820312, -12.84103012084961, -11.700782775878906, -10.560535430908203, -9.4202880859375, -8.280040740966797, -7.139793395996094, -5.999546051025391, -4.8592987060546875, -3.7190513610839844, -2.5788002014160156, -1.4385528564453125, -0.2983055114746094, 0.8419418334960938, 1.9821891784667969, 3.1224365234375, 4.262683868408203, 5.402931213378906, 6.543178558349609, 7.6834259033203125, 8.823673248291016, 9.963920593261719, 11.104167938232422, 12.244415283203125, 13.384662628173828, 14.524909973144531, 15.665157318115234, 16.805404663085938, 17.94565200805664, 19.085899353027344, 20.226146697998047, 21.36639404296875, 22.506641387939453, 23.646888732910156, 24.78713607788086, 25.927383422851562, 27.067630767822266, 28.20787811279297, 29.348125457763672, 30.488372802734375, 31.628620147705078, 32.76886749267578, 33.909114837646484]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 6.0, 16.0, 20.0, 34.0, 44.0, 79.0, 154.0, 257.0, 404.0, 744.0, 1202.0, 1957.0, 3132.0, 5036.0, 7757.0, 11770.0, 17597.0, 25373.0, 35253.0, 47551.0, 61684.0, 74922.0, 87285.0, 95393.0, 97914.0, 94915.0, 86706.0, 75014.0, 60598.0, 46979.0, 34839.0, 24812.0, 17365.0, 11525.0, 7431.0, 4808.0, 3121.0, 1864.0, 1198.0, 725.0, 441.0, 251.0, 163.0, 85.0, 46.0, 27.0, 25.0, 11.0, 12.0, 6.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-18.796875, -18.2353515625, -17.673828125, -17.1123046875, -16.55078125, -15.9892578125, -15.427734375, -14.8662109375, -14.3046875, -13.7431640625, -13.181640625, -12.6201171875, -12.05859375, -11.4970703125, -10.935546875, -10.3740234375, -9.8125, -9.2509765625, -8.689453125, -8.1279296875, -7.56640625, -7.0048828125, -6.443359375, -5.8818359375, -5.3203125, -4.7587890625, -4.197265625, -3.6357421875, -3.07421875, -2.5126953125, -1.951171875, -1.3896484375, -0.828125, -0.2666015625, 0.294921875, 0.8564453125, 1.41796875, 1.9794921875, 2.541015625, 3.1025390625, 3.6640625, 4.2255859375, 4.787109375, 5.3486328125, 5.91015625, 6.4716796875, 7.033203125, 7.5947265625, 8.15625, 8.7177734375, 9.279296875, 9.8408203125, 10.40234375, 10.9638671875, 11.525390625, 12.0869140625, 12.6484375, 13.2099609375, 13.771484375, 14.3330078125, 14.89453125, 15.4560546875, 16.017578125, 16.5791015625, 17.140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 11.0, 10.0, 9.0, 11.0, 12.0, 12.0, 16.0, 16.0, 12.0, 26.0, 27.0, 35.0, 37.0, 32.0, 38.0, 41.0, 38.0, 43.0, 28.0, 39.0, 50.0, 36.0, 35.0, 40.0, 28.0, 38.0, 34.0, 31.0, 22.0, 24.0, 15.0, 27.0, 19.0, 21.0, 14.0, 22.0, 7.0, 8.0, 10.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-38.03125, -36.9140625, -35.796875, -34.6796875, -33.5625, -32.4453125, -31.328125, -30.2109375, -29.09375, -27.9765625, -26.859375, -25.7421875, -24.625, -23.5078125, -22.390625, -21.2734375, -20.15625, -19.0390625, -17.921875, -16.8046875, -15.6875, -14.5703125, -13.453125, -12.3359375, -11.21875, -10.1015625, -8.984375, -7.8671875, -6.75, -5.6328125, -4.515625, -3.3984375, -2.28125, -1.1640625, -0.046875, 1.0703125, 2.1875, 3.3046875, 4.421875, 5.5390625, 6.65625, 7.7734375, 8.890625, 10.0078125, 11.125, 12.2421875, 13.359375, 14.4765625, 15.59375, 16.7109375, 17.828125, 18.9453125, 20.0625, 21.1796875, 22.296875, 23.4140625, 24.53125, 25.6484375, 26.765625, 27.8828125, 29.0, 30.1171875, 31.234375, 32.3515625, 33.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 15.0, 30.0, 34.0, 57.0, 85.0, 154.0, 257.0, 397.0, 592.0, 992.0, 1631.0, 2637.0, 4123.0, 6017.0, 9433.0, 13706.0, 19879.0, 28063.0, 37554.0, 48970.0, 61702.0, 73396.0, 83863.0, 90933.0, 92796.0, 89820.0, 82680.0, 71764.0, 60039.0, 47219.0, 36032.0, 26569.0, 19080.0, 13085.0, 8661.0, 5883.0, 3923.0, 2396.0, 1558.0, 941.0, 606.0, 371.0, 222.0, 151.0, 87.0, 50.0, 33.0, 37.0, 14.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.14208984375, -16.5966796875, -16.05126953125, -15.505859375, -14.96044921875, -14.4150390625, -13.86962890625, -13.32421875, -12.77880859375, -12.2333984375, -11.68798828125, -11.142578125, -10.59716796875, -10.0517578125, -9.50634765625, -8.9609375, -8.41552734375, -7.8701171875, -7.32470703125, -6.779296875, -6.23388671875, -5.6884765625, -5.14306640625, -4.59765625, -4.05224609375, -3.5068359375, -2.96142578125, -2.416015625, -1.87060546875, -1.3251953125, -0.77978515625, -0.234375, 0.31103515625, 0.8564453125, 1.40185546875, 1.947265625, 2.49267578125, 3.0380859375, 3.58349609375, 4.12890625, 4.67431640625, 5.2197265625, 5.76513671875, 6.310546875, 6.85595703125, 7.4013671875, 7.94677734375, 8.4921875, 9.03759765625, 9.5830078125, 10.12841796875, 10.673828125, 11.21923828125, 11.7646484375, 12.31005859375, 12.85546875, 13.40087890625, 13.9462890625, 14.49169921875, 15.037109375, 15.58251953125, 16.1279296875, 16.67333984375, 17.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [7.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 6.0, 8.0, 16.0, 10.0, 13.0, 15.0, 22.0, 28.0, 23.0, 29.0, 34.0, 41.0, 34.0, 53.0, 38.0, 35.0, 43.0, 55.0, 37.0, 44.0, 50.0, 28.0, 42.0, 33.0, 48.0, 23.0, 32.0, 20.0, 21.0, 20.0, 12.0, 9.0, 8.0, 8.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.484375, -18.7197265625, -17.955078125, -17.1904296875, -16.42578125, -15.6611328125, -14.896484375, -14.1318359375, -13.3671875, -12.6025390625, -11.837890625, -11.0732421875, -10.30859375, -9.5439453125, -8.779296875, -8.0146484375, -7.25, -6.4853515625, -5.720703125, -4.9560546875, -4.19140625, -3.4267578125, -2.662109375, -1.8974609375, -1.1328125, -0.3681640625, 0.396484375, 1.1611328125, 1.92578125, 2.6904296875, 3.455078125, 4.2197265625, 4.984375, 5.7490234375, 6.513671875, 7.2783203125, 8.04296875, 8.8076171875, 9.572265625, 10.3369140625, 11.1015625, 11.8662109375, 12.630859375, 13.3955078125, 14.16015625, 14.9248046875, 15.689453125, 16.4541015625, 17.21875, 17.9833984375, 18.748046875, 19.5126953125, 20.27734375, 21.0419921875, 21.806640625, 22.5712890625, 23.3359375, 24.1005859375, 24.865234375, 25.6298828125, 26.39453125, 27.1591796875, 27.923828125, 28.6884765625, 29.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 20.0, 21.0, 35.0, 49.0, 65.0, 114.0, 147.0, 237.0, 395.0, 643.0, 1071.0, 1692.0, 2943.0, 4881.0, 8142.0, 13456.0, 22074.0, 34610.0, 51341.0, 72257.0, 93826.0, 112102.0, 122074.0, 119465.0, 107637.0, 87928.0, 65857.0, 46067.0, 30541.0, 19025.0, 11950.0, 7089.0, 4260.0, 2457.0, 1529.0, 952.0, 576.0, 357.0, 227.0, 145.0, 92.0, 59.0, 46.0, 31.0, 18.0, 10.0, 7.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.7109375, -9.396240234375, -9.08154296875, -8.766845703125, -8.4521484375, -8.137451171875, -7.82275390625, -7.508056640625, -7.193359375, -6.878662109375, -6.56396484375, -6.249267578125, -5.9345703125, -5.619873046875, -5.30517578125, -4.990478515625, -4.67578125, -4.361083984375, -4.04638671875, -3.731689453125, -3.4169921875, -3.102294921875, -2.78759765625, -2.472900390625, -2.158203125, -1.843505859375, -1.52880859375, -1.214111328125, -0.8994140625, -0.584716796875, -0.27001953125, 0.044677734375, 0.359375, 0.674072265625, 0.98876953125, 1.303466796875, 1.6181640625, 1.932861328125, 2.24755859375, 2.562255859375, 2.876953125, 3.191650390625, 3.50634765625, 3.821044921875, 4.1357421875, 4.450439453125, 4.76513671875, 5.079833984375, 5.39453125, 5.709228515625, 6.02392578125, 6.338623046875, 6.6533203125, 6.968017578125, 7.28271484375, 7.597412109375, 7.912109375, 8.226806640625, 8.54150390625, 8.856201171875, 9.1708984375, 9.485595703125, 9.80029296875, 10.114990234375, 10.4296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 10.0, 9.0, 16.0, 22.0, 19.0, 22.0, 34.0, 29.0, 42.0, 39.0, 45.0, 53.0, 51.0, 51.0, 53.0, 51.0, 49.0, 64.0, 43.0, 50.0, 44.0, 39.0, 31.0, 22.0, 23.0, 9.0, 12.0, 8.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011548995971679688, -0.0011162906885147095, -0.0010776817798614502, -0.001039072871208191, -0.0010004639625549316, -0.0009618550539016724, -0.0009232461452484131, -0.0008846372365951538, -0.0008460283279418945, -0.0008074194192886353, -0.000768810510635376, -0.0007302016019821167, -0.0006915926933288574, -0.0006529837846755981, -0.0006143748760223389, -0.0005757659673690796, -0.0005371570587158203, -0.000498548150062561, -0.00045993924140930176, -0.0004213303327560425, -0.0003827214241027832, -0.0003441125154495239, -0.00030550360679626465, -0.00026689469814300537, -0.0002282857894897461, -0.00018967688083648682, -0.00015106797218322754, -0.00011245906352996826, -7.385015487670898e-05, -3.524124622344971e-05, 3.3676624298095703e-06, 4.197657108306885e-05, 8.058547973632812e-05, 0.0001191943883895874, 0.00015780329704284668, 0.00019641220569610596, 0.00023502111434936523, 0.0002736300230026245, 0.0003122389316558838, 0.00035084784030914307, 0.00038945674896240234, 0.0004280656576156616, 0.0004666745662689209, 0.0005052834749221802, 0.0005438923835754395, 0.0005825012922286987, 0.000621110200881958, 0.0006597191095352173, 0.0006983280181884766, 0.0007369369268417358, 0.0007755458354949951, 0.0008141547441482544, 0.0008527636528015137, 0.000891372561454773, 0.0009299814701080322, 0.0009685903787612915, 0.0010071992874145508, 0.00104580819606781, 0.0010844171047210693, 0.0011230260133743286, 0.0011616349220275879, 0.0012002438306808472, 0.0012388527393341064, 0.0012774616479873657, 0.001316070556640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 20.0, 22.0, 44.0, 76.0, 118.0, 171.0, 274.0, 398.0, 694.0, 1038.0, 1777.0, 2911.0, 4866.0, 8262.0, 13889.0, 22717.0, 36385.0, 56057.0, 81092.0, 106928.0, 127563.0, 134117.0, 125130.0, 104265.0, 77941.0, 53871.0, 34500.0, 21050.0, 12722.0, 7737.0, 4636.0, 2795.0, 1667.0, 1056.0, 624.0, 407.0, 231.0, 185.0, 108.0, 71.0, 46.0, 29.0, 15.0, 13.0, 11.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.787109375, -11.38671875, -10.986328125, -10.5859375, -10.185546875, -9.78515625, -9.384765625, -8.984375, -8.583984375, -8.18359375, -7.783203125, -7.3828125, -6.982421875, -6.58203125, -6.181640625, -5.78125, -5.380859375, -4.98046875, -4.580078125, -4.1796875, -3.779296875, -3.37890625, -2.978515625, -2.578125, -2.177734375, -1.77734375, -1.376953125, -0.9765625, -0.576171875, -0.17578125, 0.224609375, 0.625, 1.025390625, 1.42578125, 1.826171875, 2.2265625, 2.626953125, 3.02734375, 3.427734375, 3.828125, 4.228515625, 4.62890625, 5.029296875, 5.4296875, 5.830078125, 6.23046875, 6.630859375, 7.03125, 7.431640625, 7.83203125, 8.232421875, 8.6328125, 9.033203125, 9.43359375, 9.833984375, 10.234375, 10.634765625, 11.03515625, 11.435546875, 11.8359375, 12.236328125, 12.63671875, 13.037109375, 13.4375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 8.0, 4.0, 9.0, 9.0, 19.0, 15.0, 23.0, 29.0, 26.0, 32.0, 46.0, 44.0, 46.0, 35.0, 38.0, 53.0, 47.0, 49.0, 52.0, 46.0, 54.0, 40.0, 43.0, 24.0, 30.0, 27.0, 24.0, 17.0, 29.0, 19.0, 14.0, 9.0, 2.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.43853759765625, -5.2716064453125, -5.10467529296875, -4.937744140625, -4.77081298828125, -4.6038818359375, -4.43695068359375, -4.27001953125, -4.10308837890625, -3.9361572265625, -3.76922607421875, -3.602294921875, -3.43536376953125, -3.2684326171875, -3.10150146484375, -2.9345703125, -2.76763916015625, -2.6007080078125, -2.43377685546875, -2.266845703125, -2.09991455078125, -1.9329833984375, -1.76605224609375, -1.59912109375, -1.43218994140625, -1.2652587890625, -1.09832763671875, -0.931396484375, -0.76446533203125, -0.5975341796875, -0.43060302734375, -0.263671875, -0.09674072265625, 0.0701904296875, 0.23712158203125, 0.404052734375, 0.57098388671875, 0.7379150390625, 0.90484619140625, 1.07177734375, 1.23870849609375, 1.4056396484375, 1.57257080078125, 1.739501953125, 1.90643310546875, 2.0733642578125, 2.24029541015625, 2.4072265625, 2.57415771484375, 2.7410888671875, 2.90802001953125, 3.074951171875, 3.24188232421875, 3.4088134765625, 3.57574462890625, 3.74267578125, 3.90960693359375, 4.0765380859375, 4.24346923828125, 4.410400390625, 4.57733154296875, 4.7442626953125, 4.91119384765625, 5.078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 5.0, 3.0, 6.0, 10.0, 6.0, 9.0, 16.0, 7.0, 19.0, 19.0, 15.0, 17.0, 19.0, 23.0, 30.0, 33.0, 29.0, 40.0, 21.0, 39.0, 36.0, 36.0, 39.0, 39.0, 34.0, 29.0, 44.0, 38.0, 34.0, 27.0, 26.0, 29.0, 18.0, 25.0, 20.0, 22.0, 22.0, 19.0, 12.0, 19.0, 10.0, 11.0, 5.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-30.002649307250977, -29.071632385253906, -28.140615463256836, -27.209598541259766, -26.278581619262695, -25.347564697265625, -24.416547775268555, -23.485530853271484, -22.554513931274414, -21.623497009277344, -20.692480087280273, -19.761463165283203, -18.830446243286133, -17.899429321289062, -16.968412399291992, -16.037395477294922, -15.106378555297852, -14.175361633300781, -13.244344711303711, -12.31332778930664, -11.38231086730957, -10.4512939453125, -9.52027702331543, -8.58926010131836, -7.658243179321289, -6.727226257324219, -5.796209335327148, -4.865192413330078, -3.934175491333008, -3.0031585693359375, -2.072141647338867, -1.1411247253417969, -0.21010971069335938, 0.7209072113037109, 1.6519241333007812, 2.5829410552978516, 3.513957977294922, 4.444974899291992, 5.3759918212890625, 6.307008743286133, 7.238025665283203, 8.169042587280273, 9.100059509277344, 10.031076431274414, 10.962093353271484, 11.893110275268555, 12.824127197265625, 13.755144119262695, 14.686161041259766, 15.617177963256836, 16.548194885253906, 17.479211807250977, 18.410228729248047, 19.341245651245117, 20.272262573242188, 21.203279495239258, 22.134296417236328, 23.0653133392334, 23.99633026123047, 24.92734718322754, 25.85836410522461, 26.78938102722168, 27.72039794921875, 28.65141487121582, 29.58243179321289]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 6.0, 7.0, 3.0, 4.0, 10.0, 15.0, 16.0, 14.0, 14.0, 15.0, 23.0, 23.0, 23.0, 23.0, 24.0, 44.0, 40.0, 34.0, 40.0, 38.0, 52.0, 40.0, 37.0, 34.0, 41.0, 42.0, 32.0, 28.0, 36.0, 39.0, 34.0, 16.0, 22.0, 20.0, 19.0, 15.0, 15.0, 14.0, 17.0, 6.0, 11.0, 5.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.03581619262695, -40.80253219604492, -39.56924819946289, -38.335960388183594, -37.10267639160156, -35.86939239501953, -34.6361083984375, -33.40282440185547, -32.16953659057617, -30.93625259399414, -29.702966690063477, -28.469682693481445, -27.23639678955078, -26.00311279296875, -24.76982879638672, -23.536542892456055, -22.303258895874023, -21.069974899291992, -19.836688995361328, -18.603404998779297, -17.370119094848633, -16.1368350982666, -14.903550148010254, -13.670265197753906, -12.436980247497559, -11.203695297241211, -9.970410346984863, -8.737125396728516, -7.503840923309326, -6.2705559730529785, -5.037271499633789, -3.8039865493774414, -2.5707015991210938, -1.3374167680740356, -0.10413193702697754, 1.129152774810791, 2.3624377250671387, 3.5957226753234863, 4.829007148742676, 6.062292098999023, 7.295577049255371, 8.528861999511719, 9.762146949768066, 10.995431900024414, 12.228715896606445, 13.46200180053711, 14.69528579711914, 15.928570747375488, 17.161855697631836, 18.395139694213867, 19.62842559814453, 20.861709594726562, 22.094995498657227, 23.328279495239258, 24.561565399169922, 25.794849395751953, 27.028133392333984, 28.261417388916016, 29.49470329284668, 30.72798728942871, 31.961273193359375, 33.194557189941406, 34.42784118652344, 35.66112518310547, 36.894412994384766]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [6.0, 4.0, 4.0, 4.0, 15.0, 22.0, 33.0, 65.0, 97.0, 179.0, 241.0, 466.0, 752.0, 1217.0, 1941.0, 3032.0, 4983.0, 7825.0, 12156.0, 18248.0, 27344.0, 40568.0, 57842.0, 81278.0, 111066.0, 145603.0, 186855.0, 229801.0, 271037.0, 306926.0, 332514.0, 344036.0, 340826.0, 321101.0, 290023.0, 249902.0, 207623.0, 164729.0, 127175.0, 94002.0, 68800.0, 48109.0, 32972.0, 22324.0, 14809.0, 9570.0, 6143.0, 3855.0, 2497.0, 1483.0, 890.0, 565.0, 305.0, 185.0, 113.0, 61.0, 41.0, 16.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0], "bins": [-20.84375, -20.18701171875, -19.5302734375, -18.87353515625, -18.216796875, -17.56005859375, -16.9033203125, -16.24658203125, -15.58984375, -14.93310546875, -14.2763671875, -13.61962890625, -12.962890625, -12.30615234375, -11.6494140625, -10.99267578125, -10.3359375, -9.67919921875, -9.0224609375, -8.36572265625, -7.708984375, -7.05224609375, -6.3955078125, -5.73876953125, -5.08203125, -4.42529296875, -3.7685546875, -3.11181640625, -2.455078125, -1.79833984375, -1.1416015625, -0.48486328125, 0.171875, 0.82861328125, 1.4853515625, 2.14208984375, 2.798828125, 3.45556640625, 4.1123046875, 4.76904296875, 5.42578125, 6.08251953125, 6.7392578125, 7.39599609375, 8.052734375, 8.70947265625, 9.3662109375, 10.02294921875, 10.6796875, 11.33642578125, 11.9931640625, 12.64990234375, 13.306640625, 13.96337890625, 14.6201171875, 15.27685546875, 15.93359375, 16.59033203125, 17.2470703125, 17.90380859375, 18.560546875, 19.21728515625, 19.8740234375, 20.53076171875, 21.1875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 9.0, 4.0, 5.0, 4.0, 9.0, 18.0, 17.0, 9.0, 18.0, 13.0, 24.0, 23.0, 23.0, 27.0, 23.0, 46.0, 38.0, 37.0, 37.0, 34.0, 54.0, 40.0, 38.0, 39.0, 32.0, 43.0, 34.0, 30.0, 39.0, 29.0, 32.0, 18.0, 23.0, 18.0, 20.0, 14.0, 18.0, 13.0, 15.0, 8.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-36.875, -35.78955078125, -34.7041015625, -33.61865234375, -32.533203125, -31.44775390625, -30.3623046875, -29.27685546875, -28.19140625, -27.10595703125, -26.0205078125, -24.93505859375, -23.849609375, -22.76416015625, -21.6787109375, -20.59326171875, -19.5078125, -18.42236328125, -17.3369140625, -16.25146484375, -15.166015625, -14.08056640625, -12.9951171875, -11.90966796875, -10.82421875, -9.73876953125, -8.6533203125, -7.56787109375, -6.482421875, -5.39697265625, -4.3115234375, -3.22607421875, -2.140625, -1.05517578125, 0.0302734375, 1.11572265625, 2.201171875, 3.28662109375, 4.3720703125, 5.45751953125, 6.54296875, 7.62841796875, 8.7138671875, 9.79931640625, 10.884765625, 11.97021484375, 13.0556640625, 14.14111328125, 15.2265625, 16.31201171875, 17.3974609375, 18.48291015625, 19.568359375, 20.65380859375, 21.7392578125, 22.82470703125, 23.91015625, 24.99560546875, 26.0810546875, 27.16650390625, 28.251953125, 29.33740234375, 30.4228515625, 31.50830078125, 32.59375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 14.0, 30.0, 51.0, 87.0, 142.0, 255.0, 461.0, 764.0, 1277.0, 2235.0, 3653.0, 5787.0, 9236.0, 14455.0, 22287.0, 32599.0, 47249.0, 67396.0, 91537.0, 122513.0, 156792.0, 195797.0, 234726.0, 271118.0, 300959.0, 321236.0, 329569.0, 323518.0, 304824.0, 276699.0, 242022.0, 202673.0, 163989.0, 128320.0, 97121.0, 71293.0, 50888.0, 35016.0, 23686.0, 15687.0, 9788.0, 6417.0, 4077.0, 2485.0, 1435.0, 908.0, 549.0, 304.0, 165.0, 75.0, 58.0, 37.0, 11.0, 12.0, 5.0, 3.0, 1.0], "bins": [-22.75, -22.07275390625, -21.3955078125, -20.71826171875, -20.041015625, -19.36376953125, -18.6865234375, -18.00927734375, -17.33203125, -16.65478515625, -15.9775390625, -15.30029296875, -14.623046875, -13.94580078125, -13.2685546875, -12.59130859375, -11.9140625, -11.23681640625, -10.5595703125, -9.88232421875, -9.205078125, -8.52783203125, -7.8505859375, -7.17333984375, -6.49609375, -5.81884765625, -5.1416015625, -4.46435546875, -3.787109375, -3.10986328125, -2.4326171875, -1.75537109375, -1.078125, -0.40087890625, 0.2763671875, 0.95361328125, 1.630859375, 2.30810546875, 2.9853515625, 3.66259765625, 4.33984375, 5.01708984375, 5.6943359375, 6.37158203125, 7.048828125, 7.72607421875, 8.4033203125, 9.08056640625, 9.7578125, 10.43505859375, 11.1123046875, 11.78955078125, 12.466796875, 13.14404296875, 13.8212890625, 14.49853515625, 15.17578125, 15.85302734375, 16.5302734375, 17.20751953125, 17.884765625, 18.56201171875, 19.2392578125, 19.91650390625, 20.59375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 7.0, 8.0, 8.0, 11.0, 15.0, 29.0, 31.0, 43.0, 47.0, 67.0, 86.0, 69.0, 117.0, 132.0, 138.0, 161.0, 161.0, 200.0, 195.0, 215.0, 201.0, 202.0, 196.0, 214.0, 207.0, 188.0, 179.0, 144.0, 129.0, 113.0, 131.0, 93.0, 78.0, 69.0, 55.0, 36.0, 26.0, 23.0, 13.0, 13.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3125, -14.78857421875, -14.2646484375, -13.74072265625, -13.216796875, -12.69287109375, -12.1689453125, -11.64501953125, -11.12109375, -10.59716796875, -10.0732421875, -9.54931640625, -9.025390625, -8.50146484375, -7.9775390625, -7.45361328125, -6.9296875, -6.40576171875, -5.8818359375, -5.35791015625, -4.833984375, -4.31005859375, -3.7861328125, -3.26220703125, -2.73828125, -2.21435546875, -1.6904296875, -1.16650390625, -0.642578125, -0.11865234375, 0.4052734375, 0.92919921875, 1.453125, 1.97705078125, 2.5009765625, 3.02490234375, 3.548828125, 4.07275390625, 4.5966796875, 5.12060546875, 5.64453125, 6.16845703125, 6.6923828125, 7.21630859375, 7.740234375, 8.26416015625, 8.7880859375, 9.31201171875, 9.8359375, 10.35986328125, 10.8837890625, 11.40771484375, 11.931640625, 12.45556640625, 12.9794921875, 13.50341796875, 14.02734375, 14.55126953125, 15.0751953125, 15.59912109375, 16.123046875, 16.64697265625, 17.1708984375, 17.69482421875, 18.21875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 9.0, 7.0, 3.0, 11.0, 13.0, 10.0, 18.0, 20.0, 23.0, 17.0, 34.0, 28.0, 22.0, 23.0, 31.0, 38.0, 37.0, 33.0, 34.0, 43.0, 48.0, 34.0, 38.0, 50.0, 35.0, 37.0, 34.0, 34.0, 28.0, 31.0, 28.0, 21.0, 22.0, 16.0, 21.0, 10.0, 10.0, 7.0, 10.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-37.81067657470703, -36.777008056640625, -35.74333953857422, -34.70967102050781, -33.676002502441406, -32.642333984375, -31.608667373657227, -30.57499885559082, -29.541330337524414, -28.507661819458008, -27.4739933013916, -26.440324783325195, -25.406658172607422, -24.372989654541016, -23.33932113647461, -22.305652618408203, -21.271984100341797, -20.23831558227539, -19.204647064208984, -18.170978546142578, -17.137310028076172, -16.103641510009766, -15.069974899291992, -14.036306381225586, -13.00263786315918, -11.968969345092773, -10.935300827026367, -9.901633262634277, -8.867964744567871, -7.834296226501465, -6.800628185272217, -5.766960144042969, -4.73328971862793, -3.6996214389801025, -2.6659531593322754, -1.6322848796844482, -0.5986166000366211, 0.43505191802978516, 1.4687199592590332, 2.5023880004882812, 3.5360565185546875, 4.569725036621094, 5.603393077850342, 6.63706111907959, 7.670729637145996, 8.704398155212402, 9.738065719604492, 10.771734237670898, 11.805402755737305, 12.839071273803711, 13.872739791870117, 14.906407356262207, 15.940075874328613, 16.973743438720703, 18.00741195678711, 19.041080474853516, 20.074748992919922, 21.108417510986328, 22.142086029052734, 23.17575454711914, 24.209423065185547, 25.243091583251953, 26.276758193969727, 27.310426712036133, 28.34409523010254]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 12.0, 16.0, 11.0, 25.0, 16.0, 21.0, 22.0, 34.0, 24.0, 31.0, 31.0, 40.0, 44.0, 39.0, 50.0, 49.0, 34.0, 33.0, 43.0, 48.0, 35.0, 32.0, 25.0, 39.0, 30.0, 26.0, 20.0, 23.0, 27.0, 14.0, 18.0, 12.0, 14.0, 7.0, 6.0, 10.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.48579788208008, -42.18503189086914, -40.8842658996582, -39.583499908447266, -38.28273391723633, -36.98196792602539, -35.68120193481445, -34.38043975830078, -33.079673767089844, -31.778907775878906, -30.47814178466797, -29.17737579345703, -27.876609802246094, -26.575843811035156, -25.27507972717285, -23.974313735961914, -22.673545837402344, -21.372779846191406, -20.07201385498047, -18.77124786376953, -17.470481872558594, -16.169715881347656, -14.868951797485352, -13.568185806274414, -12.267419815063477, -10.966653823852539, -9.665887832641602, -8.36512279510498, -7.064356803894043, -5.7635908126831055, -4.462825298309326, -3.162059783935547, -1.861297607421875, -0.5605318546295166, 0.7402338981628418, 2.0409996509552, 3.3417654037475586, 4.642531394958496, 5.943296909332275, 7.244062423706055, 8.544828414916992, 9.84559440612793, 11.146360397338867, 12.447125434875488, 13.747891426086426, 15.048657417297363, 16.349422454833984, 17.650188446044922, 18.95095443725586, 20.251720428466797, 21.552486419677734, 22.853252410888672, 24.15401840209961, 25.454784393310547, 26.75554847717285, 28.05631446838379, 29.357080459594727, 30.657846450805664, 31.9586124420166, 33.259376525878906, 34.560142517089844, 35.86090850830078, 37.16167449951172, 38.462440490722656, 39.763206481933594]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 11.0, 28.0, 43.0, 49.0, 79.0, 104.0, 194.0, 287.0, 408.0, 682.0, 1074.0, 1724.0, 2888.0, 4816.0, 8357.0, 14417.0, 25695.0, 46702.0, 83420.0, 142023.0, 202804.0, 197634.0, 135307.0, 78491.0, 43646.0, 24407.0, 13547.0, 7770.0, 4598.0, 2896.0, 1676.0, 1026.0, 621.0, 368.0, 242.0, 166.0, 110.0, 56.0, 55.0, 40.0, 21.0, 18.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0], "bins": [-6.20703125, -6.03436279296875, -5.8616943359375, -5.68902587890625, -5.516357421875, -5.34368896484375, -5.1710205078125, -4.99835205078125, -4.82568359375, -4.65301513671875, -4.4803466796875, -4.30767822265625, -4.135009765625, -3.96234130859375, -3.7896728515625, -3.61700439453125, -3.4443359375, -3.27166748046875, -3.0989990234375, -2.92633056640625, -2.753662109375, -2.58099365234375, -2.4083251953125, -2.23565673828125, -2.06298828125, -1.89031982421875, -1.7176513671875, -1.54498291015625, -1.372314453125, -1.19964599609375, -1.0269775390625, -0.85430908203125, -0.681640625, -0.50897216796875, -0.3363037109375, -0.16363525390625, 0.009033203125, 0.18170166015625, 0.3543701171875, 0.52703857421875, 0.69970703125, 0.87237548828125, 1.0450439453125, 1.21771240234375, 1.390380859375, 1.56304931640625, 1.7357177734375, 1.90838623046875, 2.0810546875, 2.25372314453125, 2.4263916015625, 2.59906005859375, 2.771728515625, 2.94439697265625, 3.1170654296875, 3.28973388671875, 3.46240234375, 3.63507080078125, 3.8077392578125, 3.98040771484375, 4.153076171875, 4.32574462890625, 4.4984130859375, 4.67108154296875, 4.84375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 12.0, 16.0, 10.0, 26.0, 16.0, 22.0, 22.0, 33.0, 23.0, 32.0, 31.0, 39.0, 45.0, 38.0, 50.0, 48.0, 36.0, 34.0, 41.0, 46.0, 39.0, 31.0, 25.0, 37.0, 31.0, 26.0, 22.0, 22.0, 28.0, 13.0, 17.0, 13.0, 14.0, 6.0, 7.0, 10.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.1669921875, -40.865234375, -39.5634765625, -38.26171875, -36.9599609375, -35.658203125, -34.3564453125, -33.0546875, -31.7529296875, -30.451171875, -29.1494140625, -27.84765625, -26.5458984375, -25.244140625, -23.9423828125, -22.640625, -21.3388671875, -20.037109375, -18.7353515625, -17.43359375, -16.1318359375, -14.830078125, -13.5283203125, -12.2265625, -10.9248046875, -9.623046875, -8.3212890625, -7.01953125, -5.7177734375, -4.416015625, -3.1142578125, -1.8125, -0.5107421875, 0.791015625, 2.0927734375, 3.39453125, 4.6962890625, 5.998046875, 7.2998046875, 8.6015625, 9.9033203125, 11.205078125, 12.5068359375, 13.80859375, 15.1103515625, 16.412109375, 17.7138671875, 19.015625, 20.3173828125, 21.619140625, 22.9208984375, 24.22265625, 25.5244140625, 26.826171875, 28.1279296875, 29.4296875, 30.7314453125, 32.033203125, 33.3349609375, 34.63671875, 35.9384765625, 37.240234375, 38.5419921875, 39.84375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 11.0, 5.0, 14.0, 28.0, 36.0, 57.0, 72.0, 81.0, 156.0, 195.0, 301.0, 424.0, 678.0, 973.0, 1576.0, 2420.0, 4175.0, 7203.0, 13074.0, 25238.0, 51475.0, 113474.0, 239548.0, 286308.0, 158441.0, 70524.0, 32797.0, 16616.0, 8929.0, 5189.0, 2991.0, 1849.0, 1207.0, 803.0, 547.0, 340.0, 214.0, 166.0, 126.0, 89.0, 60.0, 35.0, 36.0, 25.0, 11.0, 11.0, 13.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.7115478515625, -5.509033203125, -5.3065185546875, -5.10400390625, -4.9014892578125, -4.698974609375, -4.4964599609375, -4.2939453125, -4.0914306640625, -3.888916015625, -3.6864013671875, -3.48388671875, -3.2813720703125, -3.078857421875, -2.8763427734375, -2.673828125, -2.4713134765625, -2.268798828125, -2.0662841796875, -1.86376953125, -1.6612548828125, -1.458740234375, -1.2562255859375, -1.0537109375, -0.8511962890625, -0.648681640625, -0.4461669921875, -0.24365234375, -0.0411376953125, 0.161376953125, 0.3638916015625, 0.56640625, 0.7689208984375, 0.971435546875, 1.1739501953125, 1.37646484375, 1.5789794921875, 1.781494140625, 1.9840087890625, 2.1865234375, 2.3890380859375, 2.591552734375, 2.7940673828125, 2.99658203125, 3.1990966796875, 3.401611328125, 3.6041259765625, 3.806640625, 4.0091552734375, 4.211669921875, 4.4141845703125, 4.61669921875, 4.8192138671875, 5.021728515625, 5.2242431640625, 5.4267578125, 5.6292724609375, 5.831787109375, 6.0343017578125, 6.23681640625, 6.4393310546875, 6.641845703125, 6.8443603515625, 7.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 8.0, 14.0, 16.0, 15.0, 22.0, 29.0, 28.0, 34.0, 34.0, 45.0, 40.0, 49.0, 45.0, 50.0, 52.0, 49.0, 42.0, 53.0, 36.0, 39.0, 30.0, 41.0, 31.0, 26.0, 29.0, 17.0, 9.0, 14.0, 14.0, 16.0, 7.0, 6.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.229736328125, -28.25634765625, -27.282958984375, -26.3095703125, -25.336181640625, -24.36279296875, -23.389404296875, -22.416015625, -21.442626953125, -20.46923828125, -19.495849609375, -18.5224609375, -17.549072265625, -16.57568359375, -15.602294921875, -14.62890625, -13.655517578125, -12.68212890625, -11.708740234375, -10.7353515625, -9.761962890625, -8.78857421875, -7.815185546875, -6.841796875, -5.868408203125, -4.89501953125, -3.921630859375, -2.9482421875, -1.974853515625, -1.00146484375, -0.028076171875, 0.9453125, 1.918701171875, 2.89208984375, 3.865478515625, 4.8388671875, 5.812255859375, 6.78564453125, 7.759033203125, 8.732421875, 9.705810546875, 10.67919921875, 11.652587890625, 12.6259765625, 13.599365234375, 14.57275390625, 15.546142578125, 16.51953125, 17.492919921875, 18.46630859375, 19.439697265625, 20.4130859375, 21.386474609375, 22.35986328125, 23.333251953125, 24.306640625, 25.280029296875, 26.25341796875, 27.226806640625, 28.2001953125, 29.173583984375, 30.14697265625, 31.120361328125, 32.09375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 13.0, 14.0, 15.0, 23.0, 35.0, 47.0, 57.0, 78.0, 95.0, 146.0, 211.0, 290.0, 435.0, 643.0, 954.0, 1470.0, 2460.0, 3978.0, 7013.0, 13525.0, 29265.0, 77235.0, 302064.0, 421448.0, 111044.0, 37916.0, 17129.0, 8429.0, 4739.0, 2849.0, 1700.0, 1063.0, 700.0, 424.0, 343.0, 211.0, 137.0, 99.0, 71.0, 50.0, 39.0, 27.0, 20.0, 15.0, 8.0, 11.0, 4.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.055511474609375, -2.94696044921875, -2.838409423828125, -2.7298583984375, -2.621307373046875, -2.51275634765625, -2.404205322265625, -2.295654296875, -2.187103271484375, -2.07855224609375, -1.970001220703125, -1.8614501953125, -1.752899169921875, -1.64434814453125, -1.535797119140625, -1.42724609375, -1.318695068359375, -1.21014404296875, -1.101593017578125, -0.9930419921875, -0.884490966796875, -0.77593994140625, -0.667388916015625, -0.558837890625, -0.450286865234375, -0.34173583984375, -0.233184814453125, -0.1246337890625, -0.016082763671875, 0.09246826171875, 0.201019287109375, 0.3095703125, 0.418121337890625, 0.52667236328125, 0.635223388671875, 0.7437744140625, 0.852325439453125, 0.96087646484375, 1.069427490234375, 1.177978515625, 1.286529541015625, 1.39508056640625, 1.503631591796875, 1.6121826171875, 1.720733642578125, 1.82928466796875, 1.937835693359375, 2.04638671875, 2.154937744140625, 2.26348876953125, 2.372039794921875, 2.4805908203125, 2.589141845703125, 2.69769287109375, 2.806243896484375, 2.914794921875, 3.023345947265625, 3.13189697265625, 3.240447998046875, 3.3489990234375, 3.457550048828125, 3.56610107421875, 3.674652099609375, 3.783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 6.0, 8.0, 14.0, 7.0, 13.0, 9.0, 14.0, 19.0, 33.0, 29.0, 27.0, 40.0, 49.0, 45.0, 44.0, 47.0, 49.0, 48.0, 34.0, 62.0, 43.0, 34.0, 42.0, 37.0, 34.0, 26.0, 37.0, 27.0, 23.0, 20.0, 11.0, 18.0, 10.0, 3.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00015974044799804688, -0.00015488825738430023, -0.0001500360667705536, -0.00014518387615680695, -0.0001403316855430603, -0.00013547949492931366, -0.00013062730431556702, -0.00012577511370182037, -0.00012092292308807373, -0.00011607073247432709, -0.00011121854186058044, -0.0001063663512468338, -0.00010151416063308716, -9.666197001934052e-05, -9.180977940559387e-05, -8.695758879184723e-05, -8.210539817810059e-05, -7.725320756435394e-05, -7.24010169506073e-05, -6.754882633686066e-05, -6.269663572311401e-05, -5.784444510936737e-05, -5.299225449562073e-05, -4.8140063881874084e-05, -4.328787326812744e-05, -3.84356826543808e-05, -3.3583492040634155e-05, -2.8731301426887512e-05, -2.387911081314087e-05, -1.9026920199394226e-05, -1.4174729585647583e-05, -9.32253897190094e-06, -4.470348358154297e-06, 3.818422555923462e-07, 5.234032869338989e-06, 1.0086223483085632e-05, 1.4938414096832275e-05, 1.979060471057892e-05, 2.464279532432556e-05, 2.9494985938072205e-05, 3.434717655181885e-05, 3.919936716556549e-05, 4.4051557779312134e-05, 4.890374839305878e-05, 5.375593900680542e-05, 5.860812962055206e-05, 6.34603202342987e-05, 6.831251084804535e-05, 7.316470146179199e-05, 7.801689207553864e-05, 8.286908268928528e-05, 8.772127330303192e-05, 9.257346391677856e-05, 9.742565453052521e-05, 0.00010227784514427185, 0.0001071300357580185, 0.00011198222637176514, 0.00011683441698551178, 0.00012168660759925842, 0.00012653879821300507, 0.0001313909888267517, 0.00013624317944049835, 0.000141095370054245, 0.00014594756066799164, 0.00015079975128173828]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 12.0, 17.0, 30.0, 46.0, 68.0, 102.0, 138.0, 192.0, 301.0, 414.0, 660.0, 899.0, 1419.0, 2238.0, 3376.0, 5411.0, 8840.0, 14700.0, 25701.0, 46478.0, 86993.0, 161360.0, 237351.0, 198933.0, 112350.0, 59726.0, 32921.0, 18634.0, 10835.0, 6513.0, 4084.0, 2662.0, 1694.0, 1099.0, 778.0, 461.0, 363.0, 244.0, 152.0, 118.0, 77.0, 53.0, 35.0, 20.0, 14.0, 8.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.58251953125, -3.4619140625, -3.34130859375, -3.220703125, -3.10009765625, -2.9794921875, -2.85888671875, -2.73828125, -2.61767578125, -2.4970703125, -2.37646484375, -2.255859375, -2.13525390625, -2.0146484375, -1.89404296875, -1.7734375, -1.65283203125, -1.5322265625, -1.41162109375, -1.291015625, -1.17041015625, -1.0498046875, -0.92919921875, -0.80859375, -0.68798828125, -0.5673828125, -0.44677734375, -0.326171875, -0.20556640625, -0.0849609375, 0.03564453125, 0.15625, 0.27685546875, 0.3974609375, 0.51806640625, 0.638671875, 0.75927734375, 0.8798828125, 1.00048828125, 1.12109375, 1.24169921875, 1.3623046875, 1.48291015625, 1.603515625, 1.72412109375, 1.8447265625, 1.96533203125, 2.0859375, 2.20654296875, 2.3271484375, 2.44775390625, 2.568359375, 2.68896484375, 2.8095703125, 2.93017578125, 3.05078125, 3.17138671875, 3.2919921875, 3.41259765625, 3.533203125, 3.65380859375, 3.7744140625, 3.89501953125, 4.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 17.0, 18.0, 17.0, 24.0, 43.0, 45.0, 35.0, 52.0, 60.0, 83.0, 67.0, 66.0, 85.0, 59.0, 42.0, 59.0, 44.0, 36.0, 25.0, 21.0, 16.0, 11.0, 10.0, 11.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.979034423828125, -1.92095947265625, -1.862884521484375, -1.8048095703125, -1.746734619140625, -1.68865966796875, -1.630584716796875, -1.572509765625, -1.514434814453125, -1.45635986328125, -1.398284912109375, -1.3402099609375, -1.282135009765625, -1.22406005859375, -1.165985107421875, -1.10791015625, -1.049835205078125, -0.99176025390625, -0.933685302734375, -0.8756103515625, -0.817535400390625, -0.75946044921875, -0.701385498046875, -0.643310546875, -0.585235595703125, -0.52716064453125, -0.469085693359375, -0.4110107421875, -0.352935791015625, -0.29486083984375, -0.236785888671875, -0.1787109375, -0.120635986328125, -0.06256103515625, -0.004486083984375, 0.0535888671875, 0.111663818359375, 0.16973876953125, 0.227813720703125, 0.285888671875, 0.343963623046875, 0.40203857421875, 0.460113525390625, 0.5181884765625, 0.576263427734375, 0.63433837890625, 0.692413330078125, 0.75048828125, 0.808563232421875, 0.86663818359375, 0.924713134765625, 0.9827880859375, 1.040863037109375, 1.09893798828125, 1.157012939453125, 1.215087890625, 1.273162841796875, 1.33123779296875, 1.389312744140625, 1.4473876953125, 1.505462646484375, 1.56353759765625, 1.621612548828125, 1.6796875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 11.0, 12.0, 6.0, 23.0, 20.0, 24.0, 20.0, 29.0, 26.0, 27.0, 22.0, 33.0, 42.0, 30.0, 33.0, 39.0, 36.0, 48.0, 39.0, 42.0, 36.0, 37.0, 41.0, 35.0, 33.0, 31.0, 33.0, 25.0, 23.0, 18.0, 17.0, 20.0, 11.0, 8.0, 7.0, 11.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-37.677852630615234, -36.64337158203125, -35.608890533447266, -34.57440948486328, -33.53993225097656, -32.50545120239258, -31.470970153808594, -30.43648910522461, -29.402008056640625, -28.36752700805664, -27.33304786682129, -26.298566818237305, -25.26408576965332, -24.22960662841797, -23.195125579833984, -22.16064453125, -21.12616539001465, -20.091684341430664, -19.057205200195312, -18.022724151611328, -16.988243103027344, -15.953763008117676, -14.919282913208008, -13.884801864624023, -12.850321769714355, -11.815841674804688, -10.781360626220703, -9.746880531311035, -8.712400436401367, -7.677919387817383, -6.643439292907715, -5.608958721160889, -4.574480056762695, -3.539999485015869, -2.505519151687622, -1.471038818359375, -0.43655824661254883, 0.5979223251342773, 1.6324024200439453, 2.6668829917907715, 3.7013635635375977, 4.735844135284424, 5.77032470703125, 6.804804801940918, 7.839285373687744, 8.87376594543457, 9.908246040344238, 10.942726135253906, 11.97720718383789, 13.011687278747559, 14.046168327331543, 15.080648422241211, 16.115129470825195, 17.149608612060547, 18.18408966064453, 19.218570709228516, 20.2530517578125, 21.287532806396484, 22.322011947631836, 23.35649299621582, 24.390974044799805, 25.425453186035156, 26.45993423461914, 27.494415283203125, 28.528894424438477]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 7.0, 14.0, 14.0, 12.0, 25.0, 16.0, 17.0, 22.0, 32.0, 25.0, 31.0, 36.0, 35.0, 44.0, 40.0, 42.0, 54.0, 38.0, 30.0, 44.0, 42.0, 41.0, 34.0, 24.0, 36.0, 31.0, 23.0, 25.0, 24.0, 25.0, 16.0, 20.0, 10.0, 16.0, 6.0, 6.0, 10.0, 2.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.422523498535156, -42.125492095947266, -40.828460693359375, -39.531429290771484, -38.234397888183594, -36.9373664855957, -35.64033508300781, -34.343299865722656, -33.04627227783203, -31.74924087524414, -30.45220947265625, -29.15517807006836, -27.85814666748047, -26.561115264892578, -25.264081954956055, -23.967050552368164, -22.67001724243164, -21.37298583984375, -20.07595443725586, -18.77892303466797, -17.481891632080078, -16.184860229492188, -14.887826919555664, -13.590795516967773, -12.293764114379883, -10.996732711791992, -9.699701309204102, -8.402668952941895, -7.105637550354004, -5.808606147766113, -4.5115742683410645, -3.2145423889160156, -1.917510986328125, -0.6204793453216553, 0.6765522956848145, 1.9735839366912842, 3.270615577697754, 4.5676469802856445, 5.864678859710693, 7.161710739135742, 8.458742141723633, 9.755773544311523, 11.052804946899414, 12.349837303161621, 13.646868705749512, 14.943900108337402, 16.24093246459961, 17.5379638671875, 18.83499526977539, 20.13202667236328, 21.429058074951172, 22.726089477539062, 24.023120880126953, 25.320152282714844, 26.617185592651367, 27.914216995239258, 29.21124839782715, 30.50827980041504, 31.80531120300293, 33.10234451293945, 34.399375915527344, 35.696407318115234, 36.993438720703125, 38.290470123291016, 39.587501525878906]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 20.0, 23.0, 39.0, 84.0, 138.0, 231.0, 428.0, 666.0, 1172.0, 1942.0, 3214.0, 5016.0, 8059.0, 12325.0, 18579.0, 26757.0, 36966.0, 49436.0, 63003.0, 77017.0, 87527.0, 95372.0, 97365.0, 94319.0, 85626.0, 73027.0, 59780.0, 46068.0, 33873.0, 24596.0, 16520.0, 10967.0, 7011.0, 4565.0, 2788.0, 1636.0, 992.0, 580.0, 343.0, 208.0, 108.0, 71.0, 38.0, 23.0, 13.0, 7.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.625, -18.049560546875, -17.47412109375, -16.898681640625, -16.3232421875, -15.747802734375, -15.17236328125, -14.596923828125, -14.021484375, -13.446044921875, -12.87060546875, -12.295166015625, -11.7197265625, -11.144287109375, -10.56884765625, -9.993408203125, -9.41796875, -8.842529296875, -8.26708984375, -7.691650390625, -7.1162109375, -6.540771484375, -5.96533203125, -5.389892578125, -4.814453125, -4.239013671875, -3.66357421875, -3.088134765625, -2.5126953125, -1.937255859375, -1.36181640625, -0.786376953125, -0.2109375, 0.364501953125, 0.93994140625, 1.515380859375, 2.0908203125, 2.666259765625, 3.24169921875, 3.817138671875, 4.392578125, 4.968017578125, 5.54345703125, 6.118896484375, 6.6943359375, 7.269775390625, 7.84521484375, 8.420654296875, 8.99609375, 9.571533203125, 10.14697265625, 10.722412109375, 11.2978515625, 11.873291015625, 12.44873046875, 13.024169921875, 13.599609375, 14.175048828125, 14.75048828125, 15.325927734375, 15.9013671875, 16.476806640625, 17.05224609375, 17.627685546875, 18.203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 6.0, 14.0, 14.0, 12.0, 25.0, 16.0, 16.0, 22.0, 35.0, 23.0, 29.0, 33.0, 39.0, 41.0, 43.0, 39.0, 55.0, 39.0, 31.0, 42.0, 43.0, 39.0, 34.0, 25.0, 36.0, 34.0, 22.0, 23.0, 26.0, 25.0, 18.0, 13.0, 14.0, 18.0, 6.0, 3.0, 13.0, 2.0, 3.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.44482421875, -40.1708984375, -38.89697265625, -37.623046875, -36.34912109375, -35.0751953125, -33.80126953125, -32.52734375, -31.25341796875, -29.9794921875, -28.70556640625, -27.431640625, -26.15771484375, -24.8837890625, -23.60986328125, -22.3359375, -21.06201171875, -19.7880859375, -18.51416015625, -17.240234375, -15.96630859375, -14.6923828125, -13.41845703125, -12.14453125, -10.87060546875, -9.5966796875, -8.32275390625, -7.048828125, -5.77490234375, -4.5009765625, -3.22705078125, -1.953125, -0.67919921875, 0.5947265625, 1.86865234375, 3.142578125, 4.41650390625, 5.6904296875, 6.96435546875, 8.23828125, 9.51220703125, 10.7861328125, 12.06005859375, 13.333984375, 14.60791015625, 15.8818359375, 17.15576171875, 18.4296875, 19.70361328125, 20.9775390625, 22.25146484375, 23.525390625, 24.79931640625, 26.0732421875, 27.34716796875, 28.62109375, 29.89501953125, 31.1689453125, 32.44287109375, 33.716796875, 34.99072265625, 36.2646484375, 37.53857421875, 38.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 15.0, 12.0, 26.0, 33.0, 49.0, 94.0, 136.0, 215.0, 355.0, 527.0, 781.0, 1218.0, 1841.0, 2717.0, 3976.0, 5887.0, 8457.0, 11774.0, 16261.0, 21985.0, 29062.0, 37424.0, 46729.0, 55583.0, 64745.0, 71957.0, 78053.0, 80351.0, 79521.0, 76094.0, 69438.0, 61512.0, 51926.0, 42633.0, 33862.0, 26331.0, 19451.0, 14490.0, 10443.0, 7353.0, 4981.0, 3479.0, 2324.0, 1555.0, 1061.0, 674.0, 412.0, 263.0, 191.0, 87.0, 81.0, 46.0, 37.0, 22.0, 16.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-15.265625, -14.77001953125, -14.2744140625, -13.77880859375, -13.283203125, -12.78759765625, -12.2919921875, -11.79638671875, -11.30078125, -10.80517578125, -10.3095703125, -9.81396484375, -9.318359375, -8.82275390625, -8.3271484375, -7.83154296875, -7.3359375, -6.84033203125, -6.3447265625, -5.84912109375, -5.353515625, -4.85791015625, -4.3623046875, -3.86669921875, -3.37109375, -2.87548828125, -2.3798828125, -1.88427734375, -1.388671875, -0.89306640625, -0.3974609375, 0.09814453125, 0.59375, 1.08935546875, 1.5849609375, 2.08056640625, 2.576171875, 3.07177734375, 3.5673828125, 4.06298828125, 4.55859375, 5.05419921875, 5.5498046875, 6.04541015625, 6.541015625, 7.03662109375, 7.5322265625, 8.02783203125, 8.5234375, 9.01904296875, 9.5146484375, 10.01025390625, 10.505859375, 11.00146484375, 11.4970703125, 11.99267578125, 12.48828125, 12.98388671875, 13.4794921875, 13.97509765625, 14.470703125, 14.96630859375, 15.4619140625, 15.95751953125, 16.453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 3.0, 6.0, 6.0, 14.0, 8.0, 18.0, 20.0, 21.0, 19.0, 19.0, 28.0, 29.0, 33.0, 33.0, 46.0, 42.0, 37.0, 37.0, 48.0, 45.0, 51.0, 40.0, 37.0, 30.0, 31.0, 42.0, 31.0, 43.0, 28.0, 26.0, 26.0, 13.0, 14.0, 16.0, 11.0, 13.0, 2.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.53125, -32.6240234375, -31.716796875, -30.8095703125, -29.90234375, -28.9951171875, -28.087890625, -27.1806640625, -26.2734375, -25.3662109375, -24.458984375, -23.5517578125, -22.64453125, -21.7373046875, -20.830078125, -19.9228515625, -19.015625, -18.1083984375, -17.201171875, -16.2939453125, -15.38671875, -14.4794921875, -13.572265625, -12.6650390625, -11.7578125, -10.8505859375, -9.943359375, -9.0361328125, -8.12890625, -7.2216796875, -6.314453125, -5.4072265625, -4.5, -3.5927734375, -2.685546875, -1.7783203125, -0.87109375, 0.0361328125, 0.943359375, 1.8505859375, 2.7578125, 3.6650390625, 4.572265625, 5.4794921875, 6.38671875, 7.2939453125, 8.201171875, 9.1083984375, 10.015625, 10.9228515625, 11.830078125, 12.7373046875, 13.64453125, 14.5517578125, 15.458984375, 16.3662109375, 17.2734375, 18.1806640625, 19.087890625, 19.9951171875, 20.90234375, 21.8095703125, 22.716796875, 23.6240234375, 24.53125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 22.0, 35.0, 69.0, 89.0, 157.0, 242.0, 421.0, 708.0, 1111.0, 1896.0, 3225.0, 5330.0, 8627.0, 13766.0, 21151.0, 31952.0, 46349.0, 63317.0, 81058.0, 97731.0, 107883.0, 111969.0, 106165.0, 92884.0, 75823.0, 57353.0, 41404.0, 28456.0, 18636.0, 11966.0, 7355.0, 4484.0, 2733.0, 1640.0, 1037.0, 593.0, 371.0, 203.0, 159.0, 72.0, 42.0, 25.0, 15.0, 7.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.8302001953125, -9.535400390625, -9.2406005859375, -8.94580078125, -8.6510009765625, -8.356201171875, -8.0614013671875, -7.7666015625, -7.4718017578125, -7.177001953125, -6.8822021484375, -6.58740234375, -6.2926025390625, -5.997802734375, -5.7030029296875, -5.408203125, -5.1134033203125, -4.818603515625, -4.5238037109375, -4.22900390625, -3.9342041015625, -3.639404296875, -3.3446044921875, -3.0498046875, -2.7550048828125, -2.460205078125, -2.1654052734375, -1.87060546875, -1.5758056640625, -1.281005859375, -0.9862060546875, -0.69140625, -0.3966064453125, -0.101806640625, 0.1929931640625, 0.48779296875, 0.7825927734375, 1.077392578125, 1.3721923828125, 1.6669921875, 1.9617919921875, 2.256591796875, 2.5513916015625, 2.84619140625, 3.1409912109375, 3.435791015625, 3.7305908203125, 4.025390625, 4.3201904296875, 4.614990234375, 4.9097900390625, 5.20458984375, 5.4993896484375, 5.794189453125, 6.0889892578125, 6.3837890625, 6.6785888671875, 6.973388671875, 7.2681884765625, 7.56298828125, 7.8577880859375, 8.152587890625, 8.4473876953125, 8.7421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 6.0, 5.0, 11.0, 10.0, 20.0, 14.0, 22.0, 23.0, 30.0, 21.0, 25.0, 28.0, 27.0, 28.0, 39.0, 39.0, 35.0, 44.0, 43.0, 35.0, 51.0, 36.0, 30.0, 37.0, 36.0, 31.0, 31.0, 24.0, 17.0, 28.0, 28.0, 14.0, 23.0, 14.0, 11.0, 11.0, 14.0, 5.0, 5.0, 2.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.000881195068359375, -0.000851556658744812, -0.000821918249130249, -0.000792279839515686, -0.000762641429901123, -0.0007330030202865601, -0.0007033646106719971, -0.0006737262010574341, -0.0006440877914428711, -0.0006144493818283081, -0.0005848109722137451, -0.0005551725625991821, -0.0005255341529846191, -0.0004958957433700562, -0.00046625733375549316, -0.0004366189241409302, -0.0004069805145263672, -0.0003773421049118042, -0.0003477036952972412, -0.0003180652856826782, -0.00028842687606811523, -0.00025878846645355225, -0.00022915005683898926, -0.00019951164722442627, -0.00016987323760986328, -0.0001402348279953003, -0.0001105964183807373, -8.095800876617432e-05, -5.131959915161133e-05, -2.168118953704834e-05, 7.957220077514648e-06, 3.759562969207764e-05, 6.723403930664062e-05, 9.687244892120361e-05, 0.0001265108585357666, 0.0001561492681503296, 0.00018578767776489258, 0.00021542608737945557, 0.00024506449699401855, 0.00027470290660858154, 0.00030434131622314453, 0.0003339797258377075, 0.0003636181354522705, 0.0003932565450668335, 0.0004228949546813965, 0.00045253336429595947, 0.00048217177391052246, 0.0005118101835250854, 0.0005414485931396484, 0.0005710870027542114, 0.0006007254123687744, 0.0006303638219833374, 0.0006600022315979004, 0.0006896406412124634, 0.0007192790508270264, 0.0007489174604415894, 0.0007785558700561523, 0.0008081942796707153, 0.0008378326892852783, 0.0008674710988998413, 0.0008971095085144043, 0.0009267479181289673, 0.0009563863277435303, 0.0009860247373580933, 0.0010156631469726562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 15.0, 25.0, 21.0, 42.0, 59.0, 95.0, 141.0, 234.0, 386.0, 566.0, 890.0, 1447.0, 2389.0, 3761.0, 6056.0, 9590.0, 15228.0, 23066.0, 34456.0, 49380.0, 66440.0, 84595.0, 100421.0, 110288.0, 111358.0, 103594.0, 89361.0, 71599.0, 53730.0, 37934.0, 25814.0, 16666.0, 10917.0, 6771.0, 4126.0, 2573.0, 1669.0, 1004.0, 691.0, 415.0, 274.0, 139.0, 115.0, 61.0, 52.0, 30.0, 21.0, 13.0, 12.0, 9.0, 7.0, 2.0, 1.0, 2.0], "bins": [-11.53125, -11.193359375, -10.85546875, -10.517578125, -10.1796875, -9.841796875, -9.50390625, -9.166015625, -8.828125, -8.490234375, -8.15234375, -7.814453125, -7.4765625, -7.138671875, -6.80078125, -6.462890625, -6.125, -5.787109375, -5.44921875, -5.111328125, -4.7734375, -4.435546875, -4.09765625, -3.759765625, -3.421875, -3.083984375, -2.74609375, -2.408203125, -2.0703125, -1.732421875, -1.39453125, -1.056640625, -0.71875, -0.380859375, -0.04296875, 0.294921875, 0.6328125, 0.970703125, 1.30859375, 1.646484375, 1.984375, 2.322265625, 2.66015625, 2.998046875, 3.3359375, 3.673828125, 4.01171875, 4.349609375, 4.6875, 5.025390625, 5.36328125, 5.701171875, 6.0390625, 6.376953125, 6.71484375, 7.052734375, 7.390625, 7.728515625, 8.06640625, 8.404296875, 8.7421875, 9.080078125, 9.41796875, 9.755859375, 10.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 10.0, 8.0, 13.0, 11.0, 17.0, 16.0, 22.0, 29.0, 33.0, 37.0, 38.0, 46.0, 49.0, 64.0, 52.0, 46.0, 57.0, 56.0, 46.0, 46.0, 30.0, 41.0, 33.0, 22.0, 30.0, 23.0, 22.0, 16.0, 15.0, 7.0, 4.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.234375, -5.0631103515625, -4.891845703125, -4.7205810546875, -4.54931640625, -4.3780517578125, -4.206787109375, -4.0355224609375, -3.8642578125, -3.6929931640625, -3.521728515625, -3.3504638671875, -3.17919921875, -3.0079345703125, -2.836669921875, -2.6654052734375, -2.494140625, -2.3228759765625, -2.151611328125, -1.9803466796875, -1.80908203125, -1.6378173828125, -1.466552734375, -1.2952880859375, -1.1240234375, -0.9527587890625, -0.781494140625, -0.6102294921875, -0.43896484375, -0.2677001953125, -0.096435546875, 0.0748291015625, 0.24609375, 0.4173583984375, 0.588623046875, 0.7598876953125, 0.93115234375, 1.1024169921875, 1.273681640625, 1.4449462890625, 1.6162109375, 1.7874755859375, 1.958740234375, 2.1300048828125, 2.30126953125, 2.4725341796875, 2.643798828125, 2.8150634765625, 2.986328125, 3.1575927734375, 3.328857421875, 3.5001220703125, 3.67138671875, 3.8426513671875, 4.013916015625, 4.1851806640625, 4.3564453125, 4.5277099609375, 4.698974609375, 4.8702392578125, 5.04150390625, 5.2127685546875, 5.384033203125, 5.5552978515625, 5.7265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 13.0, 14.0, 16.0, 19.0, 30.0, 22.0, 26.0, 23.0, 32.0, 24.0, 28.0, 37.0, 38.0, 47.0, 43.0, 45.0, 50.0, 35.0, 37.0, 41.0, 35.0, 45.0, 25.0, 39.0, 38.0, 23.0, 14.0, 16.0, 21.0, 20.0, 14.0, 10.0, 7.0, 13.0, 3.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.35649490356445, -36.284942626953125, -35.21338653564453, -34.1418342590332, -33.070281982421875, -31.998727798461914, -30.927173614501953, -29.855621337890625, -28.784067153930664, -27.712512969970703, -26.640960693359375, -25.569406509399414, -24.497852325439453, -23.426300048828125, -22.354745864868164, -21.283191680908203, -20.211639404296875, -19.140085220336914, -18.068532943725586, -16.996978759765625, -15.92542552947998, -14.853872299194336, -13.782318115234375, -12.71076488494873, -11.639211654663086, -10.567658424377441, -9.496105194091797, -8.424551010131836, -7.352997779846191, -6.281444549560547, -5.209890842437744, -4.138337135314941, -3.0667800903320312, -1.9952266216278076, -0.923673152923584, 0.14788031578063965, 1.2194337844848633, 2.290987014770508, 3.3625407218933105, 4.434094429016113, 5.505647659301758, 6.577200889587402, 7.648754596710205, 8.720308303833008, 9.791861534118652, 10.863414764404297, 11.934968948364258, 13.006522178649902, 14.078075408935547, 15.149628639221191, 16.221181869506836, 17.292736053466797, 18.364288330078125, 19.435842514038086, 20.507396697998047, 21.578948974609375, 22.650503158569336, 23.722057342529297, 24.793609619140625, 25.865163803100586, 26.936717987060547, 28.008270263671875, 29.079824447631836, 30.151378631591797, 31.222930908203125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 13.0, 11.0, 12.0, 17.0, 20.0, 16.0, 23.0, 27.0, 29.0, 23.0, 28.0, 42.0, 45.0, 27.0, 46.0, 42.0, 32.0, 51.0, 38.0, 39.0, 52.0, 45.0, 24.0, 36.0, 27.0, 38.0, 25.0, 32.0, 14.0, 18.0, 19.0, 12.0, 9.0, 14.0, 8.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.5936164855957, -45.1582145690918, -43.72281265258789, -42.287410736083984, -40.85200881958008, -39.41660690307617, -37.981201171875, -36.545799255371094, -35.11039733886719, -33.67499542236328, -32.239593505859375, -30.80419158935547, -29.368789672851562, -27.933387756347656, -26.497983932495117, -25.06258201599121, -23.627182006835938, -22.19178009033203, -20.756378173828125, -19.32097625732422, -17.885574340820312, -16.450172424316406, -15.014768600463867, -13.579366683959961, -12.143964767456055, -10.708562850952148, -9.273160934448242, -7.8377580642700195, -6.402356147766113, -4.966954231262207, -3.5315513610839844, -2.096149444580078, -0.6607475280761719, 0.7746546268463135, 2.210056781768799, 3.6454591751098633, 5.0808610916137695, 6.516263008117676, 7.951665878295898, 9.387067794799805, 10.822469711303711, 12.257871627807617, 13.693273544311523, 15.128676414489746, 16.56407928466797, 17.999481201171875, 19.43488311767578, 20.870285034179688, 22.305686950683594, 23.7410888671875, 25.176490783691406, 26.611892700195312, 28.04729461669922, 29.482696533203125, 30.918100357055664, 32.35350036621094, 33.788902282714844, 35.22430419921875, 36.659706115722656, 38.09510803222656, 39.53050994873047, 40.965911865234375, 42.40131378173828, 43.83671569824219, 45.27212142944336]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 11.0, 22.0, 28.0, 58.0, 72.0, 151.0, 226.0, 398.0, 656.0, 1047.0, 1610.0, 2578.0, 4109.0, 6505.0, 9713.0, 14865.0, 22231.0, 32378.0, 46729.0, 64682.0, 88245.0, 118969.0, 152407.0, 192165.0, 231216.0, 270810.0, 302796.0, 323496.0, 333971.0, 328128.0, 308708.0, 279572.0, 241849.0, 203273.0, 163806.0, 126329.0, 95611.0, 70618.0, 50282.0, 35145.0, 23749.0, 16075.0, 10515.0, 6937.0, 4384.0, 2846.0, 1654.0, 1017.0, 692.0, 380.0, 231.0, 147.0, 94.0, 44.0, 32.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0], "bins": [-22.03125, -21.33447265625, -20.6376953125, -19.94091796875, -19.244140625, -18.54736328125, -17.8505859375, -17.15380859375, -16.45703125, -15.76025390625, -15.0634765625, -14.36669921875, -13.669921875, -12.97314453125, -12.2763671875, -11.57958984375, -10.8828125, -10.18603515625, -9.4892578125, -8.79248046875, -8.095703125, -7.39892578125, -6.7021484375, -6.00537109375, -5.30859375, -4.61181640625, -3.9150390625, -3.21826171875, -2.521484375, -1.82470703125, -1.1279296875, -0.43115234375, 0.265625, 0.96240234375, 1.6591796875, 2.35595703125, 3.052734375, 3.74951171875, 4.4462890625, 5.14306640625, 5.83984375, 6.53662109375, 7.2333984375, 7.93017578125, 8.626953125, 9.32373046875, 10.0205078125, 10.71728515625, 11.4140625, 12.11083984375, 12.8076171875, 13.50439453125, 14.201171875, 14.89794921875, 15.5947265625, 16.29150390625, 16.98828125, 17.68505859375, 18.3818359375, 19.07861328125, 19.775390625, 20.47216796875, 21.1689453125, 21.86572265625, 22.5625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 4.0, 15.0, 11.0, 13.0, 14.0, 21.0, 18.0, 20.0, 26.0, 26.0, 25.0, 31.0, 37.0, 44.0, 35.0, 31.0, 49.0, 36.0, 47.0, 38.0, 42.0, 44.0, 45.0, 25.0, 33.0, 34.0, 34.0, 27.0, 28.0, 22.0, 14.0, 22.0, 13.0, 10.0, 11.0, 15.0, 3.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.875, -40.583984375, -39.29296875, -38.001953125, -36.7109375, -35.419921875, -34.12890625, -32.837890625, -31.546875, -30.255859375, -28.96484375, -27.673828125, -26.3828125, -25.091796875, -23.80078125, -22.509765625, -21.21875, -19.927734375, -18.63671875, -17.345703125, -16.0546875, -14.763671875, -13.47265625, -12.181640625, -10.890625, -9.599609375, -8.30859375, -7.017578125, -5.7265625, -4.435546875, -3.14453125, -1.853515625, -0.5625, 0.728515625, 2.01953125, 3.310546875, 4.6015625, 5.892578125, 7.18359375, 8.474609375, 9.765625, 11.056640625, 12.34765625, 13.638671875, 14.9296875, 16.220703125, 17.51171875, 18.802734375, 20.09375, 21.384765625, 22.67578125, 23.966796875, 25.2578125, 26.548828125, 27.83984375, 29.130859375, 30.421875, 31.712890625, 33.00390625, 34.294921875, 35.5859375, 36.876953125, 38.16796875, 39.458984375, 40.75]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 19.0, 35.0, 64.0, 169.0, 238.0, 505.0, 969.0, 1739.0, 3342.0, 5904.0, 10238.0, 17064.0, 28313.0, 44189.0, 67939.0, 99267.0, 140249.0, 188489.0, 241819.0, 295047.0, 340422.0, 372575.0, 385123.0, 375999.0, 350043.0, 306286.0, 254770.0, 200687.0, 152338.0, 108571.0, 74701.0, 49728.0, 31538.0, 19264.0, 11678.0, 6692.0, 3847.0, 2112.0, 1092.0, 593.0, 317.0, 155.0, 73.0, 44.0, 27.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.734375, -29.87158203125, -29.0087890625, -28.14599609375, -27.283203125, -26.42041015625, -25.5576171875, -24.69482421875, -23.83203125, -22.96923828125, -22.1064453125, -21.24365234375, -20.380859375, -19.51806640625, -18.6552734375, -17.79248046875, -16.9296875, -16.06689453125, -15.2041015625, -14.34130859375, -13.478515625, -12.61572265625, -11.7529296875, -10.89013671875, -10.02734375, -9.16455078125, -8.3017578125, -7.43896484375, -6.576171875, -5.71337890625, -4.8505859375, -3.98779296875, -3.125, -2.26220703125, -1.3994140625, -0.53662109375, 0.326171875, 1.18896484375, 2.0517578125, 2.91455078125, 3.77734375, 4.64013671875, 5.5029296875, 6.36572265625, 7.228515625, 8.09130859375, 8.9541015625, 9.81689453125, 10.6796875, 11.54248046875, 12.4052734375, 13.26806640625, 14.130859375, 14.99365234375, 15.8564453125, 16.71923828125, 17.58203125, 18.44482421875, 19.3076171875, 20.17041015625, 21.033203125, 21.89599609375, 22.7587890625, 23.62158203125, 24.484375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 12.0, 9.0, 12.0, 13.0, 24.0, 31.0, 48.0, 47.0, 51.0, 63.0, 69.0, 95.0, 97.0, 115.0, 124.0, 136.0, 153.0, 154.0, 154.0, 197.0, 192.0, 174.0, 190.0, 184.0, 183.0, 153.0, 173.0, 163.0, 128.0, 134.0, 122.0, 100.0, 91.0, 95.0, 61.0, 58.0, 56.0, 40.0, 33.0, 35.0, 19.0, 22.0, 7.0, 25.0, 8.0, 6.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.296875, -15.7744140625, -15.251953125, -14.7294921875, -14.20703125, -13.6845703125, -13.162109375, -12.6396484375, -12.1171875, -11.5947265625, -11.072265625, -10.5498046875, -10.02734375, -9.5048828125, -8.982421875, -8.4599609375, -7.9375, -7.4150390625, -6.892578125, -6.3701171875, -5.84765625, -5.3251953125, -4.802734375, -4.2802734375, -3.7578125, -3.2353515625, -2.712890625, -2.1904296875, -1.66796875, -1.1455078125, -0.623046875, -0.1005859375, 0.421875, 0.9443359375, 1.466796875, 1.9892578125, 2.51171875, 3.0341796875, 3.556640625, 4.0791015625, 4.6015625, 5.1240234375, 5.646484375, 6.1689453125, 6.69140625, 7.2138671875, 7.736328125, 8.2587890625, 8.78125, 9.3037109375, 9.826171875, 10.3486328125, 10.87109375, 11.3935546875, 11.916015625, 12.4384765625, 12.9609375, 13.4833984375, 14.005859375, 14.5283203125, 15.05078125, 15.5732421875, 16.095703125, 16.6181640625, 17.140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 3.0, 8.0, 6.0, 6.0, 16.0, 11.0, 13.0, 25.0, 17.0, 29.0, 33.0, 33.0, 27.0, 50.0, 45.0, 30.0, 40.0, 40.0, 43.0, 43.0, 44.0, 40.0, 37.0, 33.0, 39.0, 43.0, 37.0, 30.0, 21.0, 35.0, 19.0, 26.0, 14.0, 7.0, 9.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.42011260986328, -38.20119857788086, -36.98228454589844, -35.76336669921875, -34.54445266723633, -33.325538635253906, -32.10662078857422, -30.887706756591797, -29.668792724609375, -28.449878692626953, -27.2309627532959, -26.012046813964844, -24.793132781982422, -23.57421875, -22.355302810668945, -21.13638687133789, -19.91747283935547, -18.698558807373047, -17.479642868041992, -16.260726928710938, -15.041812896728516, -13.822897911071777, -12.603982925415039, -11.3850679397583, -10.166152954101562, -8.947237968444824, -7.728322982788086, -6.509407997131348, -5.290493011474609, -4.071578025817871, -2.852663040161133, -1.6337480545043945, -0.4148292541503906, 0.8040857315063477, 2.023000717163086, 3.241915702819824, 4.4608306884765625, 5.679745674133301, 6.898660659790039, 8.117575645446777, 9.336490631103516, 10.555405616760254, 11.774320602416992, 12.99323558807373, 14.212150573730469, 15.431065559387207, 16.649980545043945, 17.868896484375, 19.087810516357422, 20.306724548339844, 21.5256404876709, 22.744556427001953, 23.963470458984375, 25.182384490966797, 26.40130043029785, 27.620216369628906, 28.839130401611328, 30.05804443359375, 31.276960372924805, 32.49587631225586, 33.71479034423828, 34.9337043762207, 36.152618408203125, 37.37153625488281, 38.590450286865234]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 6.0, 5.0, 9.0, 11.0, 15.0, 17.0, 20.0, 26.0, 21.0, 22.0, 30.0, 28.0, 28.0, 25.0, 32.0, 34.0, 41.0, 47.0, 43.0, 34.0, 25.0, 39.0, 43.0, 39.0, 32.0, 34.0, 33.0, 26.0, 33.0, 31.0, 25.0, 12.0, 26.0, 16.0, 16.0, 7.0, 11.0, 11.0, 11.0, 12.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.32664108276367, -41.88127136230469, -40.4359016418457, -38.99053192138672, -37.545162200927734, -36.09979248046875, -34.6544189453125, -33.20905303955078, -31.763681411743164, -30.31831169128418, -28.872941970825195, -27.427570343017578, -25.982200622558594, -24.53683090209961, -23.091461181640625, -21.64609146118164, -20.200721740722656, -18.755352020263672, -17.309982299804688, -15.864611625671387, -14.419241905212402, -12.973872184753418, -11.528501510620117, -10.083131790161133, -8.637762069702148, -7.192392349243164, -5.7470221519470215, -4.301651954650879, -2.8562822341918945, -1.4109125137329102, 0.034458160400390625, 1.479827880859375, 2.9251976013183594, 4.370567321777344, 5.815937519073486, 7.261307716369629, 8.706677436828613, 10.152047157287598, 11.597417831420898, 13.042787551879883, 14.488157272338867, 15.933526992797852, 17.378896713256836, 18.824268341064453, 20.269638061523438, 21.715007781982422, 23.160377502441406, 24.60574722290039, 26.051116943359375, 27.49648666381836, 28.941856384277344, 30.387226104736328, 31.832595825195312, 33.2779655456543, 34.72333526611328, 36.16870880126953, 37.61407470703125, 39.059444427490234, 40.50481414794922, 41.9501838684082, 43.39555358886719, 44.84092330932617, 46.286293029785156, 47.731666564941406, 49.17703628540039]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 24.0, 47.0, 57.0, 114.0, 168.0, 311.0, 537.0, 1051.0, 2122.0, 4280.0, 9227.0, 20371.0, 47150.0, 111903.0, 241089.0, 300873.0, 175065.0, 75460.0, 32060.0, 13934.0, 6348.0, 2998.0, 1510.0, 788.0, 428.0, 224.0, 153.0, 84.0, 50.0, 34.0, 16.0, 9.0, 17.0, 9.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8046875, -9.5008544921875, -9.197021484375, -8.8931884765625, -8.58935546875, -8.2855224609375, -7.981689453125, -7.6778564453125, -7.3740234375, -7.0701904296875, -6.766357421875, -6.4625244140625, -6.15869140625, -5.8548583984375, -5.551025390625, -5.2471923828125, -4.943359375, -4.6395263671875, -4.335693359375, -4.0318603515625, -3.72802734375, -3.4241943359375, -3.120361328125, -2.8165283203125, -2.5126953125, -2.2088623046875, -1.905029296875, -1.6011962890625, -1.29736328125, -0.9935302734375, -0.689697265625, -0.3858642578125, -0.08203125, 0.2218017578125, 0.525634765625, 0.8294677734375, 1.13330078125, 1.4371337890625, 1.740966796875, 2.0447998046875, 2.3486328125, 2.6524658203125, 2.956298828125, 3.2601318359375, 3.56396484375, 3.8677978515625, 4.171630859375, 4.4754638671875, 4.779296875, 5.0831298828125, 5.386962890625, 5.6907958984375, 5.99462890625, 6.2984619140625, 6.602294921875, 6.9061279296875, 7.2099609375, 7.5137939453125, 7.817626953125, 8.1214599609375, 8.42529296875, 8.7291259765625, 9.032958984375, 9.3367919921875, 9.640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 20.0, 17.0, 27.0, 22.0, 20.0, 29.0, 31.0, 28.0, 25.0, 27.0, 36.0, 41.0, 48.0, 42.0, 34.0, 27.0, 38.0, 44.0, 36.0, 30.0, 40.0, 31.0, 27.0, 33.0, 31.0, 25.0, 12.0, 27.0, 16.0, 16.0, 8.0, 11.0, 11.0, 10.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.34375, -41.89501953125, -40.4462890625, -38.99755859375, -37.548828125, -36.10009765625, -34.6513671875, -33.20263671875, -31.75390625, -30.30517578125, -28.8564453125, -27.40771484375, -25.958984375, -24.51025390625, -23.0615234375, -21.61279296875, -20.1640625, -18.71533203125, -17.2666015625, -15.81787109375, -14.369140625, -12.92041015625, -11.4716796875, -10.02294921875, -8.57421875, -7.12548828125, -5.6767578125, -4.22802734375, -2.779296875, -1.33056640625, 0.1181640625, 1.56689453125, 3.015625, 4.46435546875, 5.9130859375, 7.36181640625, 8.810546875, 10.25927734375, 11.7080078125, 13.15673828125, 14.60546875, 16.05419921875, 17.5029296875, 18.95166015625, 20.400390625, 21.84912109375, 23.2978515625, 24.74658203125, 26.1953125, 27.64404296875, 29.0927734375, 30.54150390625, 31.990234375, 33.43896484375, 34.8876953125, 36.33642578125, 37.78515625, 39.23388671875, 40.6826171875, 42.13134765625, 43.580078125, 45.02880859375, 46.4775390625, 47.92626953125, 49.375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 13.0, 23.0, 35.0, 53.0, 57.0, 93.0, 152.0, 241.0, 384.0, 668.0, 1041.0, 1765.0, 3315.0, 6194.0, 13326.0, 30415.0, 78767.0, 221955.0, 376292.0, 194117.0, 68285.0, 26672.0, 11802.0, 5729.0, 2987.0, 1621.0, 1015.0, 544.0, 335.0, 238.0, 132.0, 82.0, 47.0, 35.0, 34.0, 17.0, 19.0, 14.0, 7.0, 4.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.1328125, -9.8297119140625, -9.526611328125, -9.2235107421875, -8.92041015625, -8.6173095703125, -8.314208984375, -8.0111083984375, -7.7080078125, -7.4049072265625, -7.101806640625, -6.7987060546875, -6.49560546875, -6.1925048828125, -5.889404296875, -5.5863037109375, -5.283203125, -4.9801025390625, -4.677001953125, -4.3739013671875, -4.07080078125, -3.7677001953125, -3.464599609375, -3.1614990234375, -2.8583984375, -2.5552978515625, -2.252197265625, -1.9490966796875, -1.64599609375, -1.3428955078125, -1.039794921875, -0.7366943359375, -0.43359375, -0.1304931640625, 0.172607421875, 0.4757080078125, 0.77880859375, 1.0819091796875, 1.385009765625, 1.6881103515625, 1.9912109375, 2.2943115234375, 2.597412109375, 2.9005126953125, 3.20361328125, 3.5067138671875, 3.809814453125, 4.1129150390625, 4.416015625, 4.7191162109375, 5.022216796875, 5.3253173828125, 5.62841796875, 5.9315185546875, 6.234619140625, 6.5377197265625, 6.8408203125, 7.1439208984375, 7.447021484375, 7.7501220703125, 8.05322265625, 8.3563232421875, 8.659423828125, 8.9625244140625, 9.265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 10.0, 6.0, 19.0, 17.0, 23.0, 15.0, 27.0, 30.0, 23.0, 24.0, 45.0, 49.0, 33.0, 55.0, 44.0, 49.0, 43.0, 47.0, 48.0, 41.0, 38.0, 40.0, 27.0, 35.0, 32.0, 28.0, 17.0, 16.0, 17.0, 12.0, 14.0, 12.0, 6.0, 10.0, 8.0, 11.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.03125, -36.92529296875, -35.8193359375, -34.71337890625, -33.607421875, -32.50146484375, -31.3955078125, -30.28955078125, -29.18359375, -28.07763671875, -26.9716796875, -25.86572265625, -24.759765625, -23.65380859375, -22.5478515625, -21.44189453125, -20.3359375, -19.22998046875, -18.1240234375, -17.01806640625, -15.912109375, -14.80615234375, -13.7001953125, -12.59423828125, -11.48828125, -10.38232421875, -9.2763671875, -8.17041015625, -7.064453125, -5.95849609375, -4.8525390625, -3.74658203125, -2.640625, -1.53466796875, -0.4287109375, 0.67724609375, 1.783203125, 2.88916015625, 3.9951171875, 5.10107421875, 6.20703125, 7.31298828125, 8.4189453125, 9.52490234375, 10.630859375, 11.73681640625, 12.8427734375, 13.94873046875, 15.0546875, 16.16064453125, 17.2666015625, 18.37255859375, 19.478515625, 20.58447265625, 21.6904296875, 22.79638671875, 23.90234375, 25.00830078125, 26.1142578125, 27.22021484375, 28.326171875, 29.43212890625, 30.5380859375, 31.64404296875, 32.75]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 11.0, 21.0, 17.0, 32.0, 47.0, 67.0, 98.0, 142.0, 199.0, 350.0, 650.0, 1130.0, 1980.0, 3958.0, 8310.0, 19745.0, 57396.0, 278435.0, 517671.0, 103904.0, 30627.0, 12014.0, 5387.0, 2692.0, 1486.0, 861.0, 499.0, 276.0, 206.0, 120.0, 77.0, 53.0, 36.0, 23.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.4114990234375, -4.260498046875, -4.1094970703125, -3.95849609375, -3.8074951171875, -3.656494140625, -3.5054931640625, -3.3544921875, -3.2034912109375, -3.052490234375, -2.9014892578125, -2.75048828125, -2.5994873046875, -2.448486328125, -2.2974853515625, -2.146484375, -1.9954833984375, -1.844482421875, -1.6934814453125, -1.54248046875, -1.3914794921875, -1.240478515625, -1.0894775390625, -0.9384765625, -0.7874755859375, -0.636474609375, -0.4854736328125, -0.33447265625, -0.1834716796875, -0.032470703125, 0.1185302734375, 0.26953125, 0.4205322265625, 0.571533203125, 0.7225341796875, 0.87353515625, 1.0245361328125, 1.175537109375, 1.3265380859375, 1.4775390625, 1.6285400390625, 1.779541015625, 1.9305419921875, 2.08154296875, 2.2325439453125, 2.383544921875, 2.5345458984375, 2.685546875, 2.8365478515625, 2.987548828125, 3.1385498046875, 3.28955078125, 3.4405517578125, 3.591552734375, 3.7425537109375, 3.8935546875, 4.0445556640625, 4.195556640625, 4.3465576171875, 4.49755859375, 4.6485595703125, 4.799560546875, 4.9505615234375, 5.1015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 8.0, 1.0, 13.0, 18.0, 18.0, 18.0, 23.0, 28.0, 43.0, 27.0, 35.0, 44.0, 31.0, 56.0, 43.0, 60.0, 61.0, 44.0, 41.0, 41.0, 55.0, 47.0, 33.0, 40.0, 30.0, 20.0, 18.0, 15.0, 16.0, 12.0, 13.0, 10.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016450881958007812, -0.00015909597277641296, -0.0001536831259727478, -0.00014827027916908264, -0.00014285743236541748, -0.00013744458556175232, -0.00013203173875808716, -0.000126618891954422, -0.00012120604515075684, -0.00011579319834709167, -0.00011038035154342651, -0.00010496750473976135, -9.955465793609619e-05, -9.414181113243103e-05, -8.872896432876587e-05, -8.331611752510071e-05, -7.790327072143555e-05, -7.249042391777039e-05, -6.707757711410522e-05, -6.166473031044006e-05, -5.62518835067749e-05, -5.083903670310974e-05, -4.542618989944458e-05, -4.001334309577942e-05, -3.460049629211426e-05, -2.9187649488449097e-05, -2.3774802684783936e-05, -1.8361955881118774e-05, -1.2949109077453613e-05, -7.536262273788452e-06, -2.123415470123291e-06, 3.28943133354187e-06, 8.702278137207031e-06, 1.4115124940872192e-05, 1.9527971744537354e-05, 2.4940818548202515e-05, 3.0353665351867676e-05, 3.576651215553284e-05, 4.1179358959198e-05, 4.659220576286316e-05, 5.200505256652832e-05, 5.741789937019348e-05, 6.283074617385864e-05, 6.82435929775238e-05, 7.365643978118896e-05, 7.906928658485413e-05, 8.448213338851929e-05, 8.989498019218445e-05, 9.530782699584961e-05, 0.00010072067379951477, 0.00010613352060317993, 0.00011154636740684509, 0.00011695921421051025, 0.00012237206101417542, 0.00012778490781784058, 0.00013319775462150574, 0.0001386106014251709, 0.00014402344822883606, 0.00014943629503250122, 0.00015484914183616638, 0.00016026198863983154, 0.0001656748354434967, 0.00017108768224716187, 0.00017650052905082703, 0.0001819133758544922]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 8.0, 9.0, 9.0, 20.0, 32.0, 55.0, 68.0, 103.0, 140.0, 217.0, 322.0, 505.0, 715.0, 1239.0, 1896.0, 3135.0, 5052.0, 8337.0, 14201.0, 24988.0, 45772.0, 83527.0, 148188.0, 219006.0, 203156.0, 127100.0, 70095.0, 38404.0, 21477.0, 12232.0, 7191.0, 4249.0, 2463.0, 1624.0, 1068.0, 653.0, 407.0, 292.0, 218.0, 112.0, 83.0, 54.0, 41.0, 29.0, 20.0, 13.0, 11.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.716796875, -3.603668212890625, -3.49053955078125, -3.377410888671875, -3.2642822265625, -3.151153564453125, -3.03802490234375, -2.924896240234375, -2.811767578125, -2.698638916015625, -2.58551025390625, -2.472381591796875, -2.3592529296875, -2.246124267578125, -2.13299560546875, -2.019866943359375, -1.90673828125, -1.793609619140625, -1.68048095703125, -1.567352294921875, -1.4542236328125, -1.341094970703125, -1.22796630859375, -1.114837646484375, -1.001708984375, -0.888580322265625, -0.77545166015625, -0.662322998046875, -0.5491943359375, -0.436065673828125, -0.32293701171875, -0.209808349609375, -0.0966796875, 0.016448974609375, 0.12957763671875, 0.242706298828125, 0.3558349609375, 0.468963623046875, 0.58209228515625, 0.695220947265625, 0.808349609375, 0.921478271484375, 1.03460693359375, 1.147735595703125, 1.2608642578125, 1.373992919921875, 1.48712158203125, 1.600250244140625, 1.71337890625, 1.826507568359375, 1.93963623046875, 2.052764892578125, 2.1658935546875, 2.279022216796875, 2.39215087890625, 2.505279541015625, 2.618408203125, 2.731536865234375, 2.84466552734375, 2.957794189453125, 3.0709228515625, 3.184051513671875, 3.29718017578125, 3.410308837890625, 3.5234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 15.0, 17.0, 24.0, 32.0, 62.0, 48.0, 75.0, 89.0, 96.0, 86.0, 71.0, 63.0, 66.0, 44.0, 43.0, 29.0, 21.0, 14.0, 19.0, 10.0, 9.0, 3.0, 9.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.013671875, -2.919097900390625, -2.82452392578125, -2.729949951171875, -2.6353759765625, -2.540802001953125, -2.44622802734375, -2.351654052734375, -2.257080078125, -2.162506103515625, -2.06793212890625, -1.973358154296875, -1.8787841796875, -1.784210205078125, -1.68963623046875, -1.595062255859375, -1.50048828125, -1.405914306640625, -1.31134033203125, -1.216766357421875, -1.1221923828125, -1.027618408203125, -0.93304443359375, -0.838470458984375, -0.743896484375, -0.649322509765625, -0.55474853515625, -0.460174560546875, -0.3656005859375, -0.271026611328125, -0.17645263671875, -0.081878662109375, 0.0126953125, 0.107269287109375, 0.20184326171875, 0.296417236328125, 0.3909912109375, 0.485565185546875, 0.58013916015625, 0.674713134765625, 0.769287109375, 0.863861083984375, 0.95843505859375, 1.053009033203125, 1.1475830078125, 1.242156982421875, 1.33673095703125, 1.431304931640625, 1.52587890625, 1.620452880859375, 1.71502685546875, 1.809600830078125, 1.9041748046875, 1.998748779296875, 2.09332275390625, 2.187896728515625, 2.282470703125, 2.377044677734375, 2.47161865234375, 2.566192626953125, 2.6607666015625, 2.755340576171875, 2.84991455078125, 2.944488525390625, 3.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 4.0, 8.0, 9.0, 16.0, 13.0, 20.0, 21.0, 26.0, 28.0, 27.0, 35.0, 38.0, 50.0, 36.0, 35.0, 47.0, 36.0, 46.0, 38.0, 42.0, 41.0, 41.0, 34.0, 40.0, 42.0, 31.0, 24.0, 30.0, 24.0, 27.0, 13.0, 12.0, 12.0, 8.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.04429626464844, -37.81381607055664, -36.58333206176758, -35.35285186767578, -34.12236785888672, -32.89188766479492, -31.661407470703125, -30.430925369262695, -29.200443267822266, -27.969961166381836, -26.739479064941406, -25.50899887084961, -24.27851676940918, -23.04803466796875, -21.817554473876953, -20.587072372436523, -19.356590270996094, -18.126108169555664, -16.895626068115234, -15.665145874023438, -14.434663772583008, -13.204181671142578, -11.973700523376465, -10.743219375610352, -9.512737274169922, -8.282255172729492, -7.051774024963379, -5.821292400360107, -4.590810775756836, -3.3603291511535645, -2.129847526550293, -0.8993663787841797, 0.33111572265625, 1.5615973472595215, 2.792078971862793, 4.0225605964660645, 5.253042221069336, 6.483523845672607, 7.714005470275879, 8.944486618041992, 10.174968719482422, 11.405450820922852, 12.635931968688965, 13.866413116455078, 15.096895217895508, 16.327377319335938, 17.557857513427734, 18.788339614868164, 20.018821716308594, 21.249303817749023, 22.479785919189453, 23.71026611328125, 24.94074821472168, 26.17123031616211, 27.401710510253906, 28.632192611694336, 29.862674713134766, 31.093156814575195, 32.323638916015625, 33.55411911010742, 34.78459930419922, 36.01508331298828, 37.24556350708008, 38.476043701171875, 39.70652770996094]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 16.0, 8.0, 16.0, 26.0, 21.0, 22.0, 21.0, 30.0, 30.0, 28.0, 29.0, 31.0, 40.0, 35.0, 47.0, 39.0, 32.0, 31.0, 38.0, 45.0, 37.0, 29.0, 37.0, 29.0, 27.0, 34.0, 32.0, 19.0, 17.0, 22.0, 20.0, 12.0, 7.0, 17.0, 8.0, 9.0, 13.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.920928955078125, -41.475074768066406, -40.02922058105469, -38.58336639404297, -37.13751220703125, -35.69165802001953, -34.24580383300781, -32.799949645996094, -31.354095458984375, -29.908241271972656, -28.462387084960938, -27.01653289794922, -25.5706787109375, -24.12482452392578, -22.678970336914062, -21.233116149902344, -19.787261962890625, -18.341407775878906, -16.895553588867188, -15.449699401855469, -14.00384521484375, -12.557991027832031, -11.112136840820312, -9.666282653808594, -8.220428466796875, -6.774574279785156, -5.3287200927734375, -3.8828659057617188, -2.43701171875, -0.9911575317382812, 0.4546966552734375, 1.9005508422851562, 3.3464088439941406, 4.792263031005859, 6.238117218017578, 7.683971405029297, 9.129825592041016, 10.575679779052734, 12.021533966064453, 13.467388153076172, 14.91324234008789, 16.35909652709961, 17.804950714111328, 19.250804901123047, 20.696659088134766, 22.142513275146484, 23.588367462158203, 25.034221649169922, 26.48007583618164, 27.92593002319336, 29.371784210205078, 30.817638397216797, 32.263492584228516, 33.709346771240234, 35.15520095825195, 36.60105514526367, 38.04690933227539, 39.49276351928711, 40.93861770629883, 42.38447189331055, 43.830326080322266, 45.276180267333984, 46.7220344543457, 48.16788864135742, 49.61374282836914]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 26.0, 30.0, 49.0, 79.0, 143.0, 225.0, 288.0, 521.0, 851.0, 1391.0, 2059.0, 3032.0, 4602.0, 6928.0, 9554.0, 13800.0, 19112.0, 25466.0, 33232.0, 42391.0, 52059.0, 61534.0, 69525.0, 76654.0, 80678.0, 81547.0, 78863.0, 73172.0, 65872.0, 56845.0, 46548.0, 37966.0, 29328.0, 21940.0, 16489.0, 11482.0, 8064.0, 5439.0, 3685.0, 2539.0, 1607.0, 1073.0, 686.0, 429.0, 279.0, 177.0, 100.0, 69.0, 49.0, 27.0, 14.0, 11.0, 8.0, 5.0, 4.0], "bins": [-17.875, -17.35302734375, -16.8310546875, -16.30908203125, -15.787109375, -15.26513671875, -14.7431640625, -14.22119140625, -13.69921875, -13.17724609375, -12.6552734375, -12.13330078125, -11.611328125, -11.08935546875, -10.5673828125, -10.04541015625, -9.5234375, -9.00146484375, -8.4794921875, -7.95751953125, -7.435546875, -6.91357421875, -6.3916015625, -5.86962890625, -5.34765625, -4.82568359375, -4.3037109375, -3.78173828125, -3.259765625, -2.73779296875, -2.2158203125, -1.69384765625, -1.171875, -0.64990234375, -0.1279296875, 0.39404296875, 0.916015625, 1.43798828125, 1.9599609375, 2.48193359375, 3.00390625, 3.52587890625, 4.0478515625, 4.56982421875, 5.091796875, 5.61376953125, 6.1357421875, 6.65771484375, 7.1796875, 7.70166015625, 8.2236328125, 8.74560546875, 9.267578125, 9.78955078125, 10.3115234375, 10.83349609375, 11.35546875, 11.87744140625, 12.3994140625, 12.92138671875, 13.443359375, 13.96533203125, 14.4873046875, 15.00927734375, 15.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 4.0, 12.0, 15.0, 8.0, 17.0, 25.0, 22.0, 21.0, 21.0, 30.0, 35.0, 19.0, 30.0, 35.0, 34.0, 39.0, 44.0, 38.0, 34.0, 32.0, 36.0, 42.0, 39.0, 31.0, 34.0, 28.0, 30.0, 32.0, 36.0, 21.0, 16.0, 22.0, 18.0, 15.0, 8.0, 15.0, 8.0, 9.0, 13.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.89306640625, -39.4736328125, -38.05419921875, -36.634765625, -35.21533203125, -33.7958984375, -32.37646484375, -30.95703125, -29.53759765625, -28.1181640625, -26.69873046875, -25.279296875, -23.85986328125, -22.4404296875, -21.02099609375, -19.6015625, -18.18212890625, -16.7626953125, -15.34326171875, -13.923828125, -12.50439453125, -11.0849609375, -9.66552734375, -8.24609375, -6.82666015625, -5.4072265625, -3.98779296875, -2.568359375, -1.14892578125, 0.2705078125, 1.68994140625, 3.109375, 4.52880859375, 5.9482421875, 7.36767578125, 8.787109375, 10.20654296875, 11.6259765625, 13.04541015625, 14.46484375, 15.88427734375, 17.3037109375, 18.72314453125, 20.142578125, 21.56201171875, 22.9814453125, 24.40087890625, 25.8203125, 27.23974609375, 28.6591796875, 30.07861328125, 31.498046875, 32.91748046875, 34.3369140625, 35.75634765625, 37.17578125, 38.59521484375, 40.0146484375, 41.43408203125, 42.853515625, 44.27294921875, 45.6923828125, 47.11181640625, 48.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 14.0, 21.0, 46.0, 54.0, 100.0, 176.0, 291.0, 456.0, 686.0, 1098.0, 1767.0, 2858.0, 4389.0, 6461.0, 10108.0, 14835.0, 21234.0, 29230.0, 39456.0, 50852.0, 64505.0, 75369.0, 85104.0, 91091.0, 92774.0, 88927.0, 81032.0, 70068.0, 57701.0, 45375.0, 34440.0, 24840.0, 17771.0, 12501.0, 8217.0, 5445.0, 3537.0, 2088.0, 1341.0, 844.0, 519.0, 368.0, 231.0, 135.0, 67.0, 48.0, 33.0, 16.0, 8.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-18.953125, -18.32666015625, -17.7001953125, -17.07373046875, -16.447265625, -15.82080078125, -15.1943359375, -14.56787109375, -13.94140625, -13.31494140625, -12.6884765625, -12.06201171875, -11.435546875, -10.80908203125, -10.1826171875, -9.55615234375, -8.9296875, -8.30322265625, -7.6767578125, -7.05029296875, -6.423828125, -5.79736328125, -5.1708984375, -4.54443359375, -3.91796875, -3.29150390625, -2.6650390625, -2.03857421875, -1.412109375, -0.78564453125, -0.1591796875, 0.46728515625, 1.09375, 1.72021484375, 2.3466796875, 2.97314453125, 3.599609375, 4.22607421875, 4.8525390625, 5.47900390625, 6.10546875, 6.73193359375, 7.3583984375, 7.98486328125, 8.611328125, 9.23779296875, 9.8642578125, 10.49072265625, 11.1171875, 11.74365234375, 12.3701171875, 12.99658203125, 13.623046875, 14.24951171875, 14.8759765625, 15.50244140625, 16.12890625, 16.75537109375, 17.3818359375, 18.00830078125, 18.634765625, 19.26123046875, 19.8876953125, 20.51416015625, 21.140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 4.0, 5.0, 4.0, 9.0, 6.0, 10.0, 13.0, 16.0, 18.0, 15.0, 26.0, 27.0, 33.0, 40.0, 36.0, 34.0, 32.0, 47.0, 34.0, 36.0, 52.0, 44.0, 40.0, 34.0, 37.0, 38.0, 35.0, 38.0, 29.0, 24.0, 30.0, 21.0, 21.0, 11.0, 21.0, 15.0, 14.0, 12.0, 11.0, 3.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.28125, -34.263671875, -33.24609375, -32.228515625, -31.2109375, -30.193359375, -29.17578125, -28.158203125, -27.140625, -26.123046875, -25.10546875, -24.087890625, -23.0703125, -22.052734375, -21.03515625, -20.017578125, -19.0, -17.982421875, -16.96484375, -15.947265625, -14.9296875, -13.912109375, -12.89453125, -11.876953125, -10.859375, -9.841796875, -8.82421875, -7.806640625, -6.7890625, -5.771484375, -4.75390625, -3.736328125, -2.71875, -1.701171875, -0.68359375, 0.333984375, 1.3515625, 2.369140625, 3.38671875, 4.404296875, 5.421875, 6.439453125, 7.45703125, 8.474609375, 9.4921875, 10.509765625, 11.52734375, 12.544921875, 13.5625, 14.580078125, 15.59765625, 16.615234375, 17.6328125, 18.650390625, 19.66796875, 20.685546875, 21.703125, 22.720703125, 23.73828125, 24.755859375, 25.7734375, 26.791015625, 27.80859375, 28.826171875, 29.84375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 12.0, 18.0, 29.0, 56.0, 95.0, 136.0, 230.0, 411.0, 647.0, 1078.0, 1613.0, 2626.0, 4174.0, 6570.0, 10379.0, 15607.0, 23118.0, 33079.0, 45240.0, 58953.0, 73975.0, 87072.0, 96361.0, 100385.0, 97813.0, 89386.0, 77659.0, 62686.0, 48516.0, 35947.0, 25535.0, 17453.0, 11516.0, 7468.0, 4737.0, 3026.0, 1885.0, 1177.0, 750.0, 447.0, 284.0, 161.0, 109.0, 46.0, 40.0, 16.0, 21.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.390625, -10.090576171875, -9.79052734375, -9.490478515625, -9.1904296875, -8.890380859375, -8.59033203125, -8.290283203125, -7.990234375, -7.690185546875, -7.39013671875, -7.090087890625, -6.7900390625, -6.489990234375, -6.18994140625, -5.889892578125, -5.58984375, -5.289794921875, -4.98974609375, -4.689697265625, -4.3896484375, -4.089599609375, -3.78955078125, -3.489501953125, -3.189453125, -2.889404296875, -2.58935546875, -2.289306640625, -1.9892578125, -1.689208984375, -1.38916015625, -1.089111328125, -0.7890625, -0.489013671875, -0.18896484375, 0.111083984375, 0.4111328125, 0.711181640625, 1.01123046875, 1.311279296875, 1.611328125, 1.911376953125, 2.21142578125, 2.511474609375, 2.8115234375, 3.111572265625, 3.41162109375, 3.711669921875, 4.01171875, 4.311767578125, 4.61181640625, 4.911865234375, 5.2119140625, 5.511962890625, 5.81201171875, 6.112060546875, 6.412109375, 6.712158203125, 7.01220703125, 7.312255859375, 7.6123046875, 7.912353515625, 8.21240234375, 8.512451171875, 8.8125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 4.0, 9.0, 10.0, 13.0, 15.0, 6.0, 12.0, 20.0, 25.0, 20.0, 28.0, 25.0, 36.0, 31.0, 33.0, 44.0, 42.0, 45.0, 29.0, 34.0, 41.0, 47.0, 31.0, 47.0, 36.0, 25.0, 42.0, 38.0, 28.0, 24.0, 26.0, 24.0, 17.0, 19.0, 14.0, 6.0, 11.0, 16.0, 7.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010700225830078125, -0.0010326355695724487, -0.000995248556137085, -0.0009578615427017212, -0.0009204745292663574, -0.0008830875158309937, -0.0008457005023956299, -0.0008083134889602661, -0.0007709264755249023, -0.0007335394620895386, -0.0006961524486541748, -0.000658765435218811, -0.0006213784217834473, -0.0005839914083480835, -0.0005466043949127197, -0.000509217381477356, -0.0004718303680419922, -0.0004344433546066284, -0.00039705634117126465, -0.0003596693277359009, -0.0003222823143005371, -0.00028489530086517334, -0.00024750828742980957, -0.0002101212739944458, -0.00017273426055908203, -0.00013534724712371826, -9.796023368835449e-05, -6.057322025299072e-05, -2.3186206817626953e-05, 1.4200806617736816e-05, 5.1587820053100586e-05, 8.897483348846436e-05, 0.00012636184692382812, 0.0001637488603591919, 0.00020113587379455566, 0.00023852288722991943, 0.0002759099006652832, 0.00031329691410064697, 0.00035068392753601074, 0.0003880709409713745, 0.0004254579544067383, 0.00046284496784210205, 0.0005002319812774658, 0.0005376189947128296, 0.0005750060081481934, 0.0006123930215835571, 0.0006497800350189209, 0.0006871670484542847, 0.0007245540618896484, 0.0007619410753250122, 0.000799328088760376, 0.0008367151021957397, 0.0008741021156311035, 0.0009114891290664673, 0.0009488761425018311, 0.0009862631559371948, 0.0010236501693725586, 0.0010610371828079224, 0.0010984241962432861, 0.00113581120967865, 0.0011731982231140137, 0.0012105852365493774, 0.0012479722499847412, 0.001285359263420105, 0.0013227462768554688]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 12.0, 27.0, 47.0, 43.0, 101.0, 165.0, 278.0, 406.0, 683.0, 1119.0, 1661.0, 2753.0, 4418.0, 6808.0, 10459.0, 16110.0, 23410.0, 33444.0, 46420.0, 60753.0, 75403.0, 89069.0, 98500.0, 102128.0, 98403.0, 89154.0, 75702.0, 61015.0, 46558.0, 33986.0, 23654.0, 16337.0, 10640.0, 6883.0, 4468.0, 2877.0, 1748.0, 1099.0, 696.0, 417.0, 275.0, 156.0, 94.0, 54.0, 45.0, 24.0, 18.0, 10.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-10.8671875, -10.532958984375, -10.19873046875, -9.864501953125, -9.5302734375, -9.196044921875, -8.86181640625, -8.527587890625, -8.193359375, -7.859130859375, -7.52490234375, -7.190673828125, -6.8564453125, -6.522216796875, -6.18798828125, -5.853759765625, -5.51953125, -5.185302734375, -4.85107421875, -4.516845703125, -4.1826171875, -3.848388671875, -3.51416015625, -3.179931640625, -2.845703125, -2.511474609375, -2.17724609375, -1.843017578125, -1.5087890625, -1.174560546875, -0.84033203125, -0.506103515625, -0.171875, 0.162353515625, 0.49658203125, 0.830810546875, 1.1650390625, 1.499267578125, 1.83349609375, 2.167724609375, 2.501953125, 2.836181640625, 3.17041015625, 3.504638671875, 3.8388671875, 4.173095703125, 4.50732421875, 4.841552734375, 5.17578125, 5.510009765625, 5.84423828125, 6.178466796875, 6.5126953125, 6.846923828125, 7.18115234375, 7.515380859375, 7.849609375, 8.183837890625, 8.51806640625, 8.852294921875, 9.1865234375, 9.520751953125, 9.85498046875, 10.189208984375, 10.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 10.0, 14.0, 24.0, 20.0, 16.0, 26.0, 31.0, 41.0, 57.0, 49.0, 76.0, 74.0, 51.0, 58.0, 59.0, 68.0, 45.0, 44.0, 54.0, 30.0, 26.0, 27.0, 18.0, 10.0, 9.0, 13.0, 13.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.15142822265625, -6.9200439453125, -6.68865966796875, -6.457275390625, -6.22589111328125, -5.9945068359375, -5.76312255859375, -5.53173828125, -5.30035400390625, -5.0689697265625, -4.83758544921875, -4.606201171875, -4.37481689453125, -4.1434326171875, -3.91204833984375, -3.6806640625, -3.44927978515625, -3.2178955078125, -2.98651123046875, -2.755126953125, -2.52374267578125, -2.2923583984375, -2.06097412109375, -1.82958984375, -1.59820556640625, -1.3668212890625, -1.13543701171875, -0.904052734375, -0.67266845703125, -0.4412841796875, -0.20989990234375, 0.021484375, 0.25286865234375, 0.4842529296875, 0.71563720703125, 0.947021484375, 1.17840576171875, 1.4097900390625, 1.64117431640625, 1.87255859375, 2.10394287109375, 2.3353271484375, 2.56671142578125, 2.798095703125, 3.02947998046875, 3.2608642578125, 3.49224853515625, 3.7236328125, 3.95501708984375, 4.1864013671875, 4.41778564453125, 4.649169921875, 4.88055419921875, 5.1119384765625, 5.34332275390625, 5.57470703125, 5.80609130859375, 6.0374755859375, 6.26885986328125, 6.500244140625, 6.73162841796875, 6.9630126953125, 7.19439697265625, 7.42578125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 2.0, 8.0, 17.0, 12.0, 9.0, 11.0, 13.0, 23.0, 31.0, 15.0, 37.0, 41.0, 50.0, 37.0, 29.0, 59.0, 51.0, 38.0, 38.0, 50.0, 55.0, 43.0, 40.0, 33.0, 33.0, 36.0, 32.0, 26.0, 28.0, 22.0, 19.0, 12.0, 10.0, 3.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.491859436035156, -43.1541862487793, -41.81651306152344, -40.47883605957031, -39.14116287231445, -37.803489685058594, -36.465816497802734, -35.128143310546875, -33.79046630859375, -32.45279312133789, -31.1151180267334, -29.77744483947754, -28.439769744873047, -27.102096557617188, -25.764423370361328, -24.42675018310547, -23.08907699584961, -21.75140380859375, -20.413728713989258, -19.0760555267334, -17.738380432128906, -16.400707244873047, -15.063034057617188, -13.725359916687012, -12.387685775756836, -11.05001163482666, -9.712337493896484, -8.374664306640625, -7.036990165710449, -5.699316024780273, -4.361642837524414, -3.0239686965942383, -1.6862983703613281, -0.34862446784973145, 0.9890494346618652, 2.326723098754883, 3.6643972396850586, 5.002071380615234, 6.339744567871094, 7.6774187088012695, 9.015092849731445, 10.352766990661621, 11.690441131591797, 13.028114318847656, 14.365788459777832, 15.703462600708008, 17.041135787963867, 18.37881088256836, 19.71648406982422, 21.054157257080078, 22.39183235168457, 23.72950553894043, 25.067180633544922, 26.40485382080078, 27.74252700805664, 29.0802001953125, 30.417875289916992, 31.75554847717285, 33.093223571777344, 34.4308967590332, 35.76856994628906, 37.10624694824219, 38.44391632080078, 39.781593322753906, 41.119266510009766]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 6.0, 5.0, 5.0, 9.0, 16.0, 16.0, 22.0, 23.0, 18.0, 23.0, 20.0, 29.0, 27.0, 35.0, 37.0, 38.0, 37.0, 30.0, 34.0, 40.0, 47.0, 42.0, 44.0, 38.0, 43.0, 35.0, 42.0, 39.0, 27.0, 30.0, 26.0, 24.0, 14.0, 11.0, 16.0, 8.0, 8.0, 6.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-63.33000564575195, -61.52952575683594, -59.72904586791992, -57.928565979003906, -56.12808609008789, -54.327606201171875, -52.527122497558594, -50.72664260864258, -48.92616271972656, -47.12568283081055, -45.32520294189453, -43.524723052978516, -41.7242431640625, -39.92375946044922, -38.12328338623047, -36.32279968261719, -34.52232360839844, -32.72184371948242, -30.921363830566406, -29.12088394165039, -27.320402145385742, -25.519922256469727, -23.71944236755371, -21.918960571289062, -20.118480682373047, -18.31800079345703, -16.517520904541016, -14.717040061950684, -12.916559219360352, -11.116079330444336, -9.31559944152832, -7.515118598937988, -5.714637756347656, -3.9141573905944824, -2.1136772632598877, -0.31319713592529297, 1.4872832298278809, 3.2877635955810547, 5.08824348449707, 6.888724327087402, 8.689204216003418, 10.489684104919434, 12.290164947509766, 14.090644836425781, 15.891124725341797, 17.691604614257812, 19.492084503173828, 21.292566299438477, 23.093046188354492, 24.893526077270508, 26.694005966186523, 28.494487762451172, 30.294967651367188, 32.0954475402832, 33.89592742919922, 35.696407318115234, 37.49688720703125, 39.297367095947266, 41.09784698486328, 42.8983268737793, 44.69880676269531, 46.499290466308594, 48.299766540527344, 50.100250244140625, 51.90073013305664]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 14.0, 24.0, 36.0, 73.0, 102.0, 153.0, 262.0, 488.0, 728.0, 1275.0, 1975.0, 3350.0, 5334.0, 8301.0, 13318.0, 20516.0, 30692.0, 46394.0, 67492.0, 94655.0, 130536.0, 172230.0, 217775.0, 266889.0, 310391.0, 345147.0, 364210.0, 363898.0, 344646.0, 310806.0, 266175.0, 218414.0, 170987.0, 128293.0, 93994.0, 65214.0, 45311.0, 30591.0, 19935.0, 12681.0, 8064.0, 5037.0, 3050.0, 1959.0, 1175.0, 668.0, 411.0, 256.0, 129.0, 104.0, 57.0, 27.0, 20.0, 9.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-27.265625, -26.385498046875, -25.50537109375, -24.625244140625, -23.7451171875, -22.864990234375, -21.98486328125, -21.104736328125, -20.224609375, -19.344482421875, -18.46435546875, -17.584228515625, -16.7041015625, -15.823974609375, -14.94384765625, -14.063720703125, -13.18359375, -12.303466796875, -11.42333984375, -10.543212890625, -9.6630859375, -8.782958984375, -7.90283203125, -7.022705078125, -6.142578125, -5.262451171875, -4.38232421875, -3.502197265625, -2.6220703125, -1.741943359375, -0.86181640625, 0.018310546875, 0.8984375, 1.778564453125, 2.65869140625, 3.538818359375, 4.4189453125, 5.299072265625, 6.17919921875, 7.059326171875, 7.939453125, 8.819580078125, 9.69970703125, 10.579833984375, 11.4599609375, 12.340087890625, 13.22021484375, 14.100341796875, 14.98046875, 15.860595703125, 16.74072265625, 17.620849609375, 18.5009765625, 19.381103515625, 20.26123046875, 21.141357421875, 22.021484375, 22.901611328125, 23.78173828125, 24.661865234375, 25.5419921875, 26.422119140625, 27.30224609375, 28.182373046875, 29.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 1.0, 6.0, 9.0, 18.0, 13.0, 25.0, 19.0, 18.0, 24.0, 26.0, 22.0, 31.0, 34.0, 38.0, 36.0, 37.0, 30.0, 40.0, 40.0, 44.0, 39.0, 41.0, 40.0, 42.0, 40.0, 41.0, 36.0, 27.0, 29.0, 24.0, 23.0, 16.0, 11.0, 16.0, 9.0, 6.0, 9.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-60.4375, -58.7158203125, -56.994140625, -55.2724609375, -53.55078125, -51.8291015625, -50.107421875, -48.3857421875, -46.6640625, -44.9423828125, -43.220703125, -41.4990234375, -39.77734375, -38.0556640625, -36.333984375, -34.6123046875, -32.890625, -31.1689453125, -29.447265625, -27.7255859375, -26.00390625, -24.2822265625, -22.560546875, -20.8388671875, -19.1171875, -17.3955078125, -15.673828125, -13.9521484375, -12.23046875, -10.5087890625, -8.787109375, -7.0654296875, -5.34375, -3.6220703125, -1.900390625, -0.1787109375, 1.54296875, 3.2646484375, 4.986328125, 6.7080078125, 8.4296875, 10.1513671875, 11.873046875, 13.5947265625, 15.31640625, 17.0380859375, 18.759765625, 20.4814453125, 22.203125, 23.9248046875, 25.646484375, 27.3681640625, 29.08984375, 30.8115234375, 32.533203125, 34.2548828125, 35.9765625, 37.6982421875, 39.419921875, 41.1416015625, 42.86328125, 44.5849609375, 46.306640625, 48.0283203125, 49.75]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [4.0, 5.0, 14.0, 16.0, 30.0, 45.0, 98.0, 192.0, 251.0, 412.0, 723.0, 1306.0, 1972.0, 3227.0, 4971.0, 7990.0, 12201.0, 18475.0, 27216.0, 38381.0, 54494.0, 74579.0, 99780.0, 129174.0, 162978.0, 198167.0, 233679.0, 264837.0, 290578.0, 306895.0, 313708.0, 307242.0, 293631.0, 266091.0, 234719.0, 199988.0, 163815.0, 130992.0, 100694.0, 75591.0, 55521.0, 39851.0, 27182.0, 18749.0, 12355.0, 7980.0, 5207.0, 3324.0, 1968.0, 1237.0, 697.0, 431.0, 270.0, 156.0, 87.0, 58.0, 31.0, 20.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-24.6875, -23.878662109375, -23.06982421875, -22.260986328125, -21.4521484375, -20.643310546875, -19.83447265625, -19.025634765625, -18.216796875, -17.407958984375, -16.59912109375, -15.790283203125, -14.9814453125, -14.172607421875, -13.36376953125, -12.554931640625, -11.74609375, -10.937255859375, -10.12841796875, -9.319580078125, -8.5107421875, -7.701904296875, -6.89306640625, -6.084228515625, -5.275390625, -4.466552734375, -3.65771484375, -2.848876953125, -2.0400390625, -1.231201171875, -0.42236328125, 0.386474609375, 1.1953125, 2.004150390625, 2.81298828125, 3.621826171875, 4.4306640625, 5.239501953125, 6.04833984375, 6.857177734375, 7.666015625, 8.474853515625, 9.28369140625, 10.092529296875, 10.9013671875, 11.710205078125, 12.51904296875, 13.327880859375, 14.13671875, 14.945556640625, 15.75439453125, 16.563232421875, 17.3720703125, 18.180908203125, 18.98974609375, 19.798583984375, 20.607421875, 21.416259765625, 22.22509765625, 23.033935546875, 23.8427734375, 24.651611328125, 25.46044921875, 26.269287109375, 27.078125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 7.0, 1.0, 3.0, 4.0, 11.0, 11.0, 16.0, 20.0, 16.0, 28.0, 32.0, 33.0, 52.0, 66.0, 81.0, 81.0, 88.0, 109.0, 86.0, 135.0, 124.0, 156.0, 152.0, 173.0, 195.0, 173.0, 164.0, 183.0, 187.0, 168.0, 170.0, 133.0, 175.0, 120.0, 124.0, 100.0, 126.0, 91.0, 88.0, 79.0, 64.0, 49.0, 44.0, 42.0, 27.0, 22.0, 17.0, 14.0, 16.0, 11.0, 4.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.68017578125, -19.0478515625, -18.41552734375, -17.783203125, -17.15087890625, -16.5185546875, -15.88623046875, -15.25390625, -14.62158203125, -13.9892578125, -13.35693359375, -12.724609375, -12.09228515625, -11.4599609375, -10.82763671875, -10.1953125, -9.56298828125, -8.9306640625, -8.29833984375, -7.666015625, -7.03369140625, -6.4013671875, -5.76904296875, -5.13671875, -4.50439453125, -3.8720703125, -3.23974609375, -2.607421875, -1.97509765625, -1.3427734375, -0.71044921875, -0.078125, 0.55419921875, 1.1865234375, 1.81884765625, 2.451171875, 3.08349609375, 3.7158203125, 4.34814453125, 4.98046875, 5.61279296875, 6.2451171875, 6.87744140625, 7.509765625, 8.14208984375, 8.7744140625, 9.40673828125, 10.0390625, 10.67138671875, 11.3037109375, 11.93603515625, 12.568359375, 13.20068359375, 13.8330078125, 14.46533203125, 15.09765625, 15.72998046875, 16.3623046875, 16.99462890625, 17.626953125, 18.25927734375, 18.8916015625, 19.52392578125, 20.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 6.0, 4.0, 10.0, 13.0, 12.0, 13.0, 17.0, 14.0, 34.0, 22.0, 25.0, 34.0, 40.0, 37.0, 30.0, 45.0, 35.0, 38.0, 51.0, 41.0, 35.0, 45.0, 46.0, 48.0, 42.0, 32.0, 28.0, 25.0, 31.0, 17.0, 27.0, 18.0, 13.0, 17.0, 15.0, 8.0, 8.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.42487716674805, -46.97502899169922, -45.525184631347656, -44.07533645629883, -42.62548828125, -41.17564392089844, -39.72579574584961, -38.27594757080078, -36.82610321044922, -35.37625503540039, -33.92641067504883, -32.4765625, -31.026716232299805, -29.57686996459961, -28.12702178955078, -26.677175521850586, -25.227327346801758, -23.777481079101562, -22.327632904052734, -20.87778663635254, -19.427940368652344, -17.978092193603516, -16.52824592590332, -15.078399658203125, -13.628552436828613, -12.178705215454102, -10.728858947753906, -9.279011726379395, -7.829164981842041, -6.3793182373046875, -4.929471015930176, -3.4796247482299805, -2.0297775268554688, -0.5799306631088257, 0.8699162006378174, 2.31976318359375, 3.7696099281311035, 5.219456672668457, 6.669303894042969, 8.119150161743164, 9.568997383117676, 11.018844604492188, 12.468690872192383, 13.918538093566895, 15.368385314941406, 16.8182315826416, 18.268077850341797, 19.717926025390625, 21.16777229309082, 22.617618560791016, 24.067466735839844, 25.51731300354004, 26.967159271240234, 28.417007446289062, 29.866853713989258, 31.316699981689453, 32.76654815673828, 34.21639633178711, 35.66624069213867, 37.1160888671875, 38.56593704223633, 40.01578140258789, 41.46562957763672, 42.91547393798828, 44.36532211303711]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 13.0, 6.0, 12.0, 19.0, 13.0, 17.0, 25.0, 31.0, 31.0, 18.0, 23.0, 34.0, 43.0, 39.0, 53.0, 43.0, 43.0, 35.0, 44.0, 44.0, 47.0, 42.0, 46.0, 42.0, 35.0, 26.0, 25.0, 23.0, 15.0, 18.0, 20.0, 13.0, 12.0, 15.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.95011901855469, -68.76985931396484, -66.589599609375, -64.40933990478516, -62.22907638549805, -60.0488166809082, -57.868553161621094, -55.68829345703125, -53.508033752441406, -51.32777404785156, -49.14751434326172, -46.96725082397461, -44.786991119384766, -42.60673141479492, -40.42646789550781, -38.24620819091797, -36.065948486328125, -33.88568878173828, -31.705427169799805, -29.525165557861328, -27.344905853271484, -25.16464614868164, -22.984384536743164, -20.804122924804688, -18.623863220214844, -16.443603515625, -14.263341903686523, -12.083081245422363, -9.902820587158203, -7.722559928894043, -5.542299270629883, -3.3620386123657227, -1.1817779541015625, 0.9984827041625977, 3.178743362426758, 5.359004020690918, 7.539264678955078, 9.719525337219238, 11.899785995483398, 14.080046653747559, 16.26030731201172, 18.440567016601562, 20.62082862854004, 22.801090240478516, 24.98134994506836, 27.161609649658203, 29.34187126159668, 31.522132873535156, 33.702392578125, 35.882652282714844, 38.06291198730469, 40.2431755065918, 42.42343521118164, 44.603694915771484, 46.783958435058594, 48.96421813964844, 51.14447784423828, 53.324737548828125, 55.50499725341797, 57.68526077270508, 59.86552047729492, 62.045780181884766, 64.22604370117188, 66.40630340576172, 68.58656311035156]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 14.0, 17.0, 21.0, 39.0, 57.0, 114.0, 137.0, 204.0, 292.0, 476.0, 714.0, 1046.0, 1743.0, 2764.0, 4618.0, 7315.0, 12310.0, 20500.0, 34400.0, 57772.0, 95747.0, 146888.0, 186497.0, 170670.0, 119811.0, 74035.0, 44246.0, 26155.0, 15422.0, 9221.0, 5735.0, 3443.0, 2279.0, 1306.0, 904.0, 559.0, 345.0, 231.0, 148.0, 117.0, 70.0, 46.0, 32.0, 26.0, 26.0, 13.0, 8.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.0390625, -6.81005859375, -6.5810546875, -6.35205078125, -6.123046875, -5.89404296875, -5.6650390625, -5.43603515625, -5.20703125, -4.97802734375, -4.7490234375, -4.52001953125, -4.291015625, -4.06201171875, -3.8330078125, -3.60400390625, -3.375, -3.14599609375, -2.9169921875, -2.68798828125, -2.458984375, -2.22998046875, -2.0009765625, -1.77197265625, -1.54296875, -1.31396484375, -1.0849609375, -0.85595703125, -0.626953125, -0.39794921875, -0.1689453125, 0.06005859375, 0.2890625, 0.51806640625, 0.7470703125, 0.97607421875, 1.205078125, 1.43408203125, 1.6630859375, 1.89208984375, 2.12109375, 2.35009765625, 2.5791015625, 2.80810546875, 3.037109375, 3.26611328125, 3.4951171875, 3.72412109375, 3.953125, 4.18212890625, 4.4111328125, 4.64013671875, 4.869140625, 5.09814453125, 5.3271484375, 5.55615234375, 5.78515625, 6.01416015625, 6.2431640625, 6.47216796875, 6.701171875, 6.93017578125, 7.1591796875, 7.38818359375, 7.6171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 6.0, 13.0, 18.0, 13.0, 16.0, 28.0, 29.0, 33.0, 19.0, 22.0, 32.0, 46.0, 39.0, 54.0, 43.0, 42.0, 34.0, 48.0, 42.0, 46.0, 44.0, 43.0, 40.0, 36.0, 26.0, 23.0, 24.0, 14.0, 19.0, 19.0, 14.0, 11.0, 15.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.4375, -68.2568359375, -66.076171875, -63.8955078125, -61.71484375, -59.5341796875, -57.353515625, -55.1728515625, -52.9921875, -50.8115234375, -48.630859375, -46.4501953125, -44.26953125, -42.0888671875, -39.908203125, -37.7275390625, -35.546875, -33.3662109375, -31.185546875, -29.0048828125, -26.82421875, -24.6435546875, -22.462890625, -20.2822265625, -18.1015625, -15.9208984375, -13.740234375, -11.5595703125, -9.37890625, -7.1982421875, -5.017578125, -2.8369140625, -0.65625, 1.5244140625, 3.705078125, 5.8857421875, 8.06640625, 10.2470703125, 12.427734375, 14.6083984375, 16.7890625, 18.9697265625, 21.150390625, 23.3310546875, 25.51171875, 27.6923828125, 29.873046875, 32.0537109375, 34.234375, 36.4150390625, 38.595703125, 40.7763671875, 42.95703125, 45.1376953125, 47.318359375, 49.4990234375, 51.6796875, 53.8603515625, 56.041015625, 58.2216796875, 60.40234375, 62.5830078125, 64.763671875, 66.9443359375, 69.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 4.0, 19.0, 20.0, 23.0, 49.0, 62.0, 116.0, 120.0, 176.0, 237.0, 357.0, 552.0, 841.0, 1284.0, 1972.0, 3243.0, 5204.0, 8793.0, 15882.0, 28766.0, 55930.0, 111197.0, 212504.0, 260990.0, 163093.0, 82012.0, 41869.0, 22180.0, 12312.0, 7062.0, 4092.0, 2604.0, 1704.0, 1067.0, 689.0, 483.0, 323.0, 206.0, 166.0, 116.0, 80.0, 40.0, 38.0, 26.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.1910400390625, -6.936767578125, -6.6824951171875, -6.42822265625, -6.1739501953125, -5.919677734375, -5.6654052734375, -5.4111328125, -5.1568603515625, -4.902587890625, -4.6483154296875, -4.39404296875, -4.1397705078125, -3.885498046875, -3.6312255859375, -3.376953125, -3.1226806640625, -2.868408203125, -2.6141357421875, -2.35986328125, -2.1055908203125, -1.851318359375, -1.5970458984375, -1.3427734375, -1.0885009765625, -0.834228515625, -0.5799560546875, -0.32568359375, -0.0714111328125, 0.182861328125, 0.4371337890625, 0.69140625, 0.9456787109375, 1.199951171875, 1.4542236328125, 1.70849609375, 1.9627685546875, 2.217041015625, 2.4713134765625, 2.7255859375, 2.9798583984375, 3.234130859375, 3.4884033203125, 3.74267578125, 3.9969482421875, 4.251220703125, 4.5054931640625, 4.759765625, 5.0140380859375, 5.268310546875, 5.5225830078125, 5.77685546875, 6.0311279296875, 6.285400390625, 6.5396728515625, 6.7939453125, 7.0482177734375, 7.302490234375, 7.5567626953125, 7.81103515625, 8.0653076171875, 8.319580078125, 8.5738525390625, 8.828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 8.0, 12.0, 17.0, 20.0, 14.0, 21.0, 29.0, 28.0, 33.0, 25.0, 28.0, 45.0, 35.0, 36.0, 45.0, 35.0, 43.0, 38.0, 37.0, 38.0, 49.0, 34.0, 30.0, 36.0, 34.0, 31.0, 33.0, 23.0, 17.0, 18.0, 18.0, 13.0, 12.0, 9.0, 9.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.25, -45.87353515625, -44.4970703125, -43.12060546875, -41.744140625, -40.36767578125, -38.9912109375, -37.61474609375, -36.23828125, -34.86181640625, -33.4853515625, -32.10888671875, -30.732421875, -29.35595703125, -27.9794921875, -26.60302734375, -25.2265625, -23.85009765625, -22.4736328125, -21.09716796875, -19.720703125, -18.34423828125, -16.9677734375, -15.59130859375, -14.21484375, -12.83837890625, -11.4619140625, -10.08544921875, -8.708984375, -7.33251953125, -5.9560546875, -4.57958984375, -3.203125, -1.82666015625, -0.4501953125, 0.92626953125, 2.302734375, 3.67919921875, 5.0556640625, 6.43212890625, 7.80859375, 9.18505859375, 10.5615234375, 11.93798828125, 13.314453125, 14.69091796875, 16.0673828125, 17.44384765625, 18.8203125, 20.19677734375, 21.5732421875, 22.94970703125, 24.326171875, 25.70263671875, 27.0791015625, 28.45556640625, 29.83203125, 31.20849609375, 32.5849609375, 33.96142578125, 35.337890625, 36.71435546875, 38.0908203125, 39.46728515625, 40.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 17.0, 14.0, 14.0, 13.0, 20.0, 34.0, 54.0, 75.0, 86.0, 107.0, 158.0, 217.0, 304.0, 470.0, 776.0, 1167.0, 2074.0, 3855.0, 7460.0, 16000.0, 41213.0, 151159.0, 546750.0, 192258.0, 48170.0, 17917.0, 8195.0, 4114.0, 2209.0, 1265.0, 767.0, 478.0, 339.0, 217.0, 156.0, 100.0, 82.0, 56.0, 48.0, 35.0, 20.0, 31.0, 15.0, 8.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.23046875, -6.0391845703125, -5.847900390625, -5.6566162109375, -5.46533203125, -5.2740478515625, -5.082763671875, -4.8914794921875, -4.7001953125, -4.5089111328125, -4.317626953125, -4.1263427734375, -3.93505859375, -3.7437744140625, -3.552490234375, -3.3612060546875, -3.169921875, -2.9786376953125, -2.787353515625, -2.5960693359375, -2.40478515625, -2.2135009765625, -2.022216796875, -1.8309326171875, -1.6396484375, -1.4483642578125, -1.257080078125, -1.0657958984375, -0.87451171875, -0.6832275390625, -0.491943359375, -0.3006591796875, -0.109375, 0.0819091796875, 0.273193359375, 0.4644775390625, 0.65576171875, 0.8470458984375, 1.038330078125, 1.2296142578125, 1.4208984375, 1.6121826171875, 1.803466796875, 1.9947509765625, 2.18603515625, 2.3773193359375, 2.568603515625, 2.7598876953125, 2.951171875, 3.1424560546875, 3.333740234375, 3.5250244140625, 3.71630859375, 3.9075927734375, 4.098876953125, 4.2901611328125, 4.4814453125, 4.6727294921875, 4.864013671875, 5.0552978515625, 5.24658203125, 5.4378662109375, 5.629150390625, 5.8204345703125, 6.01171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 0.0, 7.0, 6.0, 9.0, 11.0, 10.0, 27.0, 22.0, 20.0, 30.0, 33.0, 37.0, 56.0, 52.0, 56.0, 49.0, 59.0, 55.0, 52.0, 59.0, 62.0, 35.0, 50.0, 29.0, 34.0, 30.0, 17.0, 20.0, 20.0, 17.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00030040740966796875, -0.00029208511114120483, -0.0002837628126144409, -0.000275440514087677, -0.0002671182155609131, -0.00025879591703414917, -0.00025047361850738525, -0.00024215131998062134, -0.00023382902145385742, -0.0002255067229270935, -0.0002171844244003296, -0.00020886212587356567, -0.00020053982734680176, -0.00019221752882003784, -0.00018389523029327393, -0.00017557293176651, -0.0001672506332397461, -0.00015892833471298218, -0.00015060603618621826, -0.00014228373765945435, -0.00013396143913269043, -0.00012563914060592651, -0.0001173168420791626, -0.00010899454355239868, -0.00010067224502563477, -9.234994649887085e-05, -8.402764797210693e-05, -7.570534944534302e-05, -6.73830509185791e-05, -5.9060752391815186e-05, -5.073845386505127e-05, -4.2416155338287354e-05, -3.409385681152344e-05, -2.577155828475952e-05, -1.7449259757995605e-05, -9.12696123123169e-06, -8.046627044677734e-07, 7.517635822296143e-06, 1.583993434906006e-05, 2.4162232875823975e-05, 3.248453140258789e-05, 4.080682992935181e-05, 4.912912845611572e-05, 5.745142698287964e-05, 6.577372550964355e-05, 7.409602403640747e-05, 8.241832256317139e-05, 9.07406210899353e-05, 9.906291961669922e-05, 0.00010738521814346313, 0.00011570751667022705, 0.00012402981519699097, 0.00013235211372375488, 0.0001406744122505188, 0.00014899671077728271, 0.00015731900930404663, 0.00016564130783081055, 0.00017396360635757446, 0.00018228590488433838, 0.0001906082034111023, 0.0001989305019378662, 0.00020725280046463013, 0.00021557509899139404, 0.00022389739751815796, 0.00023221969604492188]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 13.0, 22.0, 35.0, 57.0, 73.0, 115.0, 155.0, 258.0, 391.0, 701.0, 1183.0, 2055.0, 3653.0, 6616.0, 12552.0, 24627.0, 49818.0, 103853.0, 202824.0, 269308.0, 185070.0, 92657.0, 44700.0, 22396.0, 11353.0, 6144.0, 3327.0, 1812.0, 1090.0, 621.0, 364.0, 235.0, 166.0, 94.0, 52.0, 47.0, 27.0, 13.0, 18.0, 12.0, 6.0, 8.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.703125, -4.53765869140625, -4.3721923828125, -4.20672607421875, -4.041259765625, -3.87579345703125, -3.7103271484375, -3.54486083984375, -3.37939453125, -3.21392822265625, -3.0484619140625, -2.88299560546875, -2.717529296875, -2.55206298828125, -2.3865966796875, -2.22113037109375, -2.0556640625, -1.89019775390625, -1.7247314453125, -1.55926513671875, -1.393798828125, -1.22833251953125, -1.0628662109375, -0.89739990234375, -0.73193359375, -0.56646728515625, -0.4010009765625, -0.23553466796875, -0.070068359375, 0.09539794921875, 0.2608642578125, 0.42633056640625, 0.591796875, 0.75726318359375, 0.9227294921875, 1.08819580078125, 1.253662109375, 1.41912841796875, 1.5845947265625, 1.75006103515625, 1.91552734375, 2.08099365234375, 2.2464599609375, 2.41192626953125, 2.577392578125, 2.74285888671875, 2.9083251953125, 3.07379150390625, 3.2392578125, 3.40472412109375, 3.5701904296875, 3.73565673828125, 3.901123046875, 4.06658935546875, 4.2320556640625, 4.39752197265625, 4.56298828125, 4.72845458984375, 4.8939208984375, 5.05938720703125, 5.224853515625, 5.39031982421875, 5.5557861328125, 5.72125244140625, 5.88671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 2.0, 6.0, 8.0, 12.0, 29.0, 34.0, 42.0, 54.0, 70.0, 76.0, 82.0, 93.0, 79.0, 87.0, 75.0, 50.0, 41.0, 32.0, 26.0, 26.0, 16.0, 7.0, 15.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.728515625, -3.588531494140625, -3.44854736328125, -3.308563232421875, -3.1685791015625, -3.028594970703125, -2.88861083984375, -2.748626708984375, -2.608642578125, -2.468658447265625, -2.32867431640625, -2.188690185546875, -2.0487060546875, -1.908721923828125, -1.76873779296875, -1.628753662109375, -1.48876953125, -1.348785400390625, -1.20880126953125, -1.068817138671875, -0.9288330078125, -0.788848876953125, -0.64886474609375, -0.508880615234375, -0.368896484375, -0.228912353515625, -0.08892822265625, 0.051055908203125, 0.1910400390625, 0.331024169921875, 0.47100830078125, 0.610992431640625, 0.7509765625, 0.890960693359375, 1.03094482421875, 1.170928955078125, 1.3109130859375, 1.450897216796875, 1.59088134765625, 1.730865478515625, 1.870849609375, 2.010833740234375, 2.15081787109375, 2.290802001953125, 2.4307861328125, 2.570770263671875, 2.71075439453125, 2.850738525390625, 2.99072265625, 3.130706787109375, 3.27069091796875, 3.410675048828125, 3.5506591796875, 3.690643310546875, 3.83062744140625, 3.970611572265625, 4.110595703125, 4.250579833984375, 4.39056396484375, 4.530548095703125, 4.6705322265625, 4.810516357421875, 4.95050048828125, 5.090484619140625, 5.23046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 9.0, 5.0, 13.0, 15.0, 15.0, 13.0, 21.0, 27.0, 28.0, 22.0, 34.0, 44.0, 39.0, 37.0, 43.0, 41.0, 36.0, 39.0, 48.0, 42.0, 47.0, 44.0, 47.0, 35.0, 34.0, 23.0, 28.0, 31.0, 23.0, 26.0, 11.0, 14.0, 18.0, 7.0, 10.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.803672790527344, -47.32434844970703, -45.84502410888672, -44.365699768066406, -42.886375427246094, -41.40705490112305, -39.927730560302734, -38.44840621948242, -36.96908187866211, -35.4897575378418, -34.010433197021484, -32.53110885620117, -31.051786422729492, -29.57246208190918, -28.0931396484375, -26.613815307617188, -25.134490966796875, -23.655166625976562, -22.17584228515625, -20.69651985168457, -19.217195510864258, -17.737871170043945, -16.258548736572266, -14.779224395751953, -13.29990005493164, -11.820575714111328, -10.341252326965332, -8.861928939819336, -7.382604598999023, -5.903280735015869, -4.423956871032715, -2.9446334838867188, -1.4653053283691406, 0.014018535614013672, 1.493342399597168, 2.9726662635803223, 4.451990127563477, 5.931313991546631, 7.410637855529785, 8.889961242675781, 10.369285583496094, 11.848609924316406, 13.327933311462402, 14.807256698608398, 16.28658103942871, 17.765905380249023, 19.245227813720703, 20.724552154541016, 22.203876495361328, 23.68320083618164, 25.162525177001953, 26.641847610473633, 28.121171951293945, 29.600496292114258, 31.079818725585938, 32.55914306640625, 34.03846740722656, 35.517791748046875, 36.99711608886719, 38.4764404296875, 39.95576477050781, 41.43508529663086, 42.91440963745117, 44.393733978271484, 45.8730583190918]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 6.0, 10.0, 10.0, 11.0, 14.0, 12.0, 20.0, 19.0, 25.0, 27.0, 28.0, 28.0, 21.0, 36.0, 42.0, 41.0, 52.0, 47.0, 35.0, 38.0, 49.0, 43.0, 41.0, 53.0, 38.0, 40.0, 36.0, 24.0, 21.0, 25.0, 15.0, 19.0, 17.0, 14.0, 12.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.67494201660156, -68.4756088256836, -66.27627563476562, -64.07693481445312, -61.877601623535156, -59.67826843261719, -57.47893524169922, -55.279598236083984, -53.08026123046875, -50.88092803955078, -48.68159103393555, -46.48225784301758, -44.282920837402344, -42.083587646484375, -39.884254455566406, -37.68491744995117, -35.4855842590332, -33.286251068115234, -31.0869140625, -28.88758087158203, -26.688243865966797, -24.488910675048828, -22.289575576782227, -20.090240478515625, -17.890905380249023, -15.691570281982422, -13.49223518371582, -11.292901039123535, -9.093565940856934, -6.894230842590332, -4.694896697998047, -2.4955615997314453, -0.29622650146484375, 1.9031083583831787, 4.102443218231201, 6.3017778396606445, 8.501112937927246, 10.700448036193848, 12.899782180786133, 15.099117279052734, 17.298452377319336, 19.497787475585938, 21.69712257385254, 23.89645767211914, 26.09579086303711, 28.295127868652344, 30.494461059570312, 32.69379425048828, 34.893131256103516, 37.092464447021484, 39.29180145263672, 41.49113464355469, 43.69047164916992, 45.88980484008789, 48.089141845703125, 50.288475036621094, 52.48780822753906, 54.68714141845703, 56.886478424072266, 59.085811614990234, 61.28514862060547, 63.48448181152344, 65.6838150024414, 67.88314819335938, 70.08248901367188]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 16.0, 16.0, 20.0, 40.0, 49.0, 91.0, 130.0, 197.0, 284.0, 497.0, 730.0, 1136.0, 1888.0, 3085.0, 4863.0, 8065.0, 13501.0, 21709.0, 34146.0, 50712.0, 71553.0, 93629.0, 112269.0, 122030.0, 120105.0, 108332.0, 87928.0, 65625.0, 45958.0, 30236.0, 19388.0, 11837.0, 7146.0, 4371.0, 2505.0, 1606.0, 1002.0, 656.0, 428.0, 259.0, 178.0, 128.0, 74.0, 49.0, 32.0, 20.0, 11.0, 11.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-30.859375, -29.859619140625, -28.85986328125, -27.860107421875, -26.8603515625, -25.860595703125, -24.86083984375, -23.861083984375, -22.861328125, -21.861572265625, -20.86181640625, -19.862060546875, -18.8623046875, -17.862548828125, -16.86279296875, -15.863037109375, -14.86328125, -13.863525390625, -12.86376953125, -11.864013671875, -10.8642578125, -9.864501953125, -8.86474609375, -7.864990234375, -6.865234375, -5.865478515625, -4.86572265625, -3.865966796875, -2.8662109375, -1.866455078125, -0.86669921875, 0.133056640625, 1.1328125, 2.132568359375, 3.13232421875, 4.132080078125, 5.1318359375, 6.131591796875, 7.13134765625, 8.131103515625, 9.130859375, 10.130615234375, 11.13037109375, 12.130126953125, 13.1298828125, 14.129638671875, 15.12939453125, 16.129150390625, 17.12890625, 18.128662109375, 19.12841796875, 20.128173828125, 21.1279296875, 22.127685546875, 23.12744140625, 24.127197265625, 25.126953125, 26.126708984375, 27.12646484375, 28.126220703125, 29.1259765625, 30.125732421875, 31.12548828125, 32.125244140625, 33.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 10.0, 12.0, 13.0, 13.0, 20.0, 19.0, 27.0, 28.0, 28.0, 25.0, 21.0, 39.0, 43.0, 38.0, 52.0, 50.0, 32.0, 40.0, 48.0, 43.0, 43.0, 49.0, 41.0, 39.0, 34.0, 23.0, 22.0, 24.0, 15.0, 19.0, 17.0, 14.0, 13.0, 14.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -68.4833984375, -66.279296875, -64.0751953125, -61.87109375, -59.6669921875, -57.462890625, -55.2587890625, -53.0546875, -50.8505859375, -48.646484375, -46.4423828125, -44.23828125, -42.0341796875, -39.830078125, -37.6259765625, -35.421875, -33.2177734375, -31.013671875, -28.8095703125, -26.60546875, -24.4013671875, -22.197265625, -19.9931640625, -17.7890625, -15.5849609375, -13.380859375, -11.1767578125, -8.97265625, -6.7685546875, -4.564453125, -2.3603515625, -0.15625, 2.0478515625, 4.251953125, 6.4560546875, 8.66015625, 10.8642578125, 13.068359375, 15.2724609375, 17.4765625, 19.6806640625, 21.884765625, 24.0888671875, 26.29296875, 28.4970703125, 30.701171875, 32.9052734375, 35.109375, 37.3134765625, 39.517578125, 41.7216796875, 43.92578125, 46.1298828125, 48.333984375, 50.5380859375, 52.7421875, 54.9462890625, 57.150390625, 59.3544921875, 61.55859375, 63.7626953125, 65.966796875, 68.1708984375, 70.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 9.0, 11.0, 16.0, 21.0, 25.0, 54.0, 73.0, 99.0, 179.0, 213.0, 352.0, 556.0, 793.0, 1156.0, 1863.0, 2829.0, 4385.0, 7093.0, 11146.0, 17543.0, 28177.0, 43004.0, 63614.0, 87667.0, 111343.0, 127940.0, 128908.0, 116314.0, 93076.0, 68116.0, 47300.0, 30673.0, 19581.0, 12445.0, 7906.0, 4945.0, 3067.0, 2092.0, 1296.0, 880.0, 623.0, 404.0, 260.0, 154.0, 132.0, 68.0, 48.0, 31.0, 23.0, 17.0, 14.0, 10.0, 5.0, 2.0, 4.0, 2.0, 5.0], "bins": [-42.84375, -41.5498046875, -40.255859375, -38.9619140625, -37.66796875, -36.3740234375, -35.080078125, -33.7861328125, -32.4921875, -31.1982421875, -29.904296875, -28.6103515625, -27.31640625, -26.0224609375, -24.728515625, -23.4345703125, -22.140625, -20.8466796875, -19.552734375, -18.2587890625, -16.96484375, -15.6708984375, -14.376953125, -13.0830078125, -11.7890625, -10.4951171875, -9.201171875, -7.9072265625, -6.61328125, -5.3193359375, -4.025390625, -2.7314453125, -1.4375, -0.1435546875, 1.150390625, 2.4443359375, 3.73828125, 5.0322265625, 6.326171875, 7.6201171875, 8.9140625, 10.2080078125, 11.501953125, 12.7958984375, 14.08984375, 15.3837890625, 16.677734375, 17.9716796875, 19.265625, 20.5595703125, 21.853515625, 23.1474609375, 24.44140625, 25.7353515625, 27.029296875, 28.3232421875, 29.6171875, 30.9111328125, 32.205078125, 33.4990234375, 34.79296875, 36.0869140625, 37.380859375, 38.6748046875, 39.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 12.0, 14.0, 16.0, 16.0, 23.0, 17.0, 35.0, 29.0, 32.0, 29.0, 27.0, 28.0, 33.0, 40.0, 38.0, 49.0, 38.0, 38.0, 34.0, 43.0, 31.0, 26.0, 42.0, 32.0, 35.0, 21.0, 22.0, 17.0, 15.0, 17.0, 12.0, 15.0, 12.0, 13.0, 8.0, 6.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-39.6875, -38.4208984375, -37.154296875, -35.8876953125, -34.62109375, -33.3544921875, -32.087890625, -30.8212890625, -29.5546875, -28.2880859375, -27.021484375, -25.7548828125, -24.48828125, -23.2216796875, -21.955078125, -20.6884765625, -19.421875, -18.1552734375, -16.888671875, -15.6220703125, -14.35546875, -13.0888671875, -11.822265625, -10.5556640625, -9.2890625, -8.0224609375, -6.755859375, -5.4892578125, -4.22265625, -2.9560546875, -1.689453125, -0.4228515625, 0.84375, 2.1103515625, 3.376953125, 4.6435546875, 5.91015625, 7.1767578125, 8.443359375, 9.7099609375, 10.9765625, 12.2431640625, 13.509765625, 14.7763671875, 16.04296875, 17.3095703125, 18.576171875, 19.8427734375, 21.109375, 22.3759765625, 23.642578125, 24.9091796875, 26.17578125, 27.4423828125, 28.708984375, 29.9755859375, 31.2421875, 32.5087890625, 33.775390625, 35.0419921875, 36.30859375, 37.5751953125, 38.841796875, 40.1083984375, 41.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 6.0, 14.0, 12.0, 19.0, 25.0, 43.0, 66.0, 86.0, 125.0, 187.0, 241.0, 376.0, 572.0, 859.0, 1358.0, 2135.0, 3600.0, 6005.0, 10056.0, 16664.0, 26851.0, 41991.0, 60955.0, 83831.0, 105127.0, 119271.0, 124373.0, 116012.0, 98603.0, 76939.0, 54939.0, 36828.0, 23474.0, 14546.0, 8817.0, 5142.0, 3066.0, 1900.0, 1147.0, 745.0, 449.0, 356.0, 205.0, 137.0, 123.0, 66.0, 64.0, 46.0, 26.0, 20.0, 15.0, 14.0, 11.0, 7.0, 1.0, 2.0, 3.0, 5.0], "bins": [-13.9921875, -13.5596923828125, -13.127197265625, -12.6947021484375, -12.26220703125, -11.8297119140625, -11.397216796875, -10.9647216796875, -10.5322265625, -10.0997314453125, -9.667236328125, -9.2347412109375, -8.80224609375, -8.3697509765625, -7.937255859375, -7.5047607421875, -7.072265625, -6.6397705078125, -6.207275390625, -5.7747802734375, -5.34228515625, -4.9097900390625, -4.477294921875, -4.0447998046875, -3.6123046875, -3.1798095703125, -2.747314453125, -2.3148193359375, -1.88232421875, -1.4498291015625, -1.017333984375, -0.5848388671875, -0.15234375, 0.2801513671875, 0.712646484375, 1.1451416015625, 1.57763671875, 2.0101318359375, 2.442626953125, 2.8751220703125, 3.3076171875, 3.7401123046875, 4.172607421875, 4.6051025390625, 5.03759765625, 5.4700927734375, 5.902587890625, 6.3350830078125, 6.767578125, 7.2000732421875, 7.632568359375, 8.0650634765625, 8.49755859375, 8.9300537109375, 9.362548828125, 9.7950439453125, 10.2275390625, 10.6600341796875, 11.092529296875, 11.5250244140625, 11.95751953125, 12.3900146484375, 12.822509765625, 13.2550048828125, 13.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 16.0, 16.0, 22.0, 27.0, 39.0, 62.0, 54.0, 44.0, 82.0, 71.0, 72.0, 80.0, 69.0, 58.0, 60.0, 53.0, 47.0, 24.0, 22.0, 16.0, 14.0, 8.0, 8.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002086639404296875, -0.002007126808166504, -0.0019276142120361328, -0.0018481016159057617, -0.0017685890197753906, -0.0016890764236450195, -0.0016095638275146484, -0.0015300512313842773, -0.0014505386352539062, -0.0013710260391235352, -0.001291513442993164, -0.001212000846862793, -0.0011324882507324219, -0.0010529756546020508, -0.0009734630584716797, -0.0008939504623413086, -0.0008144378662109375, -0.0007349252700805664, -0.0006554126739501953, -0.0005759000778198242, -0.0004963874816894531, -0.00041687488555908203, -0.00033736228942871094, -0.00025784969329833984, -0.00017833709716796875, -9.882450103759766e-05, -1.9311904907226562e-05, 6.020069122314453e-05, 0.00013971328735351562, 0.00021922588348388672, 0.0002987384796142578, 0.0003782510757446289, 0.000457763671875, 0.0005372762680053711, 0.0006167888641357422, 0.0006963014602661133, 0.0007758140563964844, 0.0008553266525268555, 0.0009348392486572266, 0.0010143518447875977, 0.0010938644409179688, 0.0011733770370483398, 0.001252889633178711, 0.001332402229309082, 0.0014119148254394531, 0.0014914274215698242, 0.0015709400177001953, 0.0016504526138305664, 0.0017299652099609375, 0.0018094778060913086, 0.0018889904022216797, 0.0019685029983520508, 0.002048015594482422, 0.002127528190612793, 0.002207040786743164, 0.002286553382873535, 0.0023660659790039062, 0.0024455785751342773, 0.0025250911712646484, 0.0026046037673950195, 0.0026841163635253906, 0.0027636289596557617, 0.002843141555786133, 0.002922654151916504, 0.003002166748046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 4.0, 30.0, 41.0, 50.0, 75.0, 102.0, 205.0, 256.0, 409.0, 675.0, 1089.0, 1650.0, 2726.0, 4366.0, 7042.0, 11203.0, 17398.0, 26621.0, 38833.0, 54257.0, 71909.0, 89236.0, 102736.0, 109649.0, 108408.0, 99458.0, 84364.0, 66537.0, 49547.0, 34796.0, 23595.0, 15420.0, 9698.0, 6185.0, 3768.0, 2314.0, 1415.0, 882.0, 570.0, 394.0, 214.0, 164.0, 94.0, 58.0, 47.0, 23.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 3.0], "bins": [-14.234375, -13.825927734375, -13.41748046875, -13.009033203125, -12.6005859375, -12.192138671875, -11.78369140625, -11.375244140625, -10.966796875, -10.558349609375, -10.14990234375, -9.741455078125, -9.3330078125, -8.924560546875, -8.51611328125, -8.107666015625, -7.69921875, -7.290771484375, -6.88232421875, -6.473876953125, -6.0654296875, -5.656982421875, -5.24853515625, -4.840087890625, -4.431640625, -4.023193359375, -3.61474609375, -3.206298828125, -2.7978515625, -2.389404296875, -1.98095703125, -1.572509765625, -1.1640625, -0.755615234375, -0.34716796875, 0.061279296875, 0.4697265625, 0.878173828125, 1.28662109375, 1.695068359375, 2.103515625, 2.511962890625, 2.92041015625, 3.328857421875, 3.7373046875, 4.145751953125, 4.55419921875, 4.962646484375, 5.37109375, 5.779541015625, 6.18798828125, 6.596435546875, 7.0048828125, 7.413330078125, 7.82177734375, 8.230224609375, 8.638671875, 9.047119140625, 9.45556640625, 9.864013671875, 10.2724609375, 10.680908203125, 11.08935546875, 11.497802734375, 11.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 9.0, 6.0, 8.0, 12.0, 11.0, 14.0, 15.0, 20.0, 17.0, 17.0, 25.0, 37.0, 34.0, 25.0, 42.0, 28.0, 31.0, 36.0, 37.0, 53.0, 39.0, 52.0, 44.0, 45.0, 41.0, 36.0, 39.0, 26.0, 34.0, 21.0, 12.0, 18.0, 21.0, 19.0, 10.0, 14.0, 14.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0], "bins": [-7.53125, -7.32574462890625, -7.1202392578125, -6.91473388671875, -6.709228515625, -6.50372314453125, -6.2982177734375, -6.09271240234375, -5.88720703125, -5.68170166015625, -5.4761962890625, -5.27069091796875, -5.065185546875, -4.85968017578125, -4.6541748046875, -4.44866943359375, -4.2431640625, -4.03765869140625, -3.8321533203125, -3.62664794921875, -3.421142578125, -3.21563720703125, -3.0101318359375, -2.80462646484375, -2.59912109375, -2.39361572265625, -2.1881103515625, -1.98260498046875, -1.777099609375, -1.57159423828125, -1.3660888671875, -1.16058349609375, -0.955078125, -0.74957275390625, -0.5440673828125, -0.33856201171875, -0.133056640625, 0.07244873046875, 0.2779541015625, 0.48345947265625, 0.68896484375, 0.89447021484375, 1.0999755859375, 1.30548095703125, 1.510986328125, 1.71649169921875, 1.9219970703125, 2.12750244140625, 2.3330078125, 2.53851318359375, 2.7440185546875, 2.94952392578125, 3.155029296875, 3.36053466796875, 3.5660400390625, 3.77154541015625, 3.97705078125, 4.18255615234375, 4.3880615234375, 4.59356689453125, 4.799072265625, 5.00457763671875, 5.2100830078125, 5.41558837890625, 5.62109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 11.0, 7.0, 14.0, 10.0, 19.0, 21.0, 18.0, 26.0, 27.0, 29.0, 38.0, 27.0, 30.0, 32.0, 37.0, 33.0, 45.0, 55.0, 33.0, 48.0, 44.0, 47.0, 36.0, 39.0, 32.0, 29.0, 29.0, 29.0, 23.0, 20.0, 25.0, 18.0, 14.0, 11.0, 11.0, 8.0, 3.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.345523834228516, -46.852291107177734, -45.35906219482422, -43.86582946777344, -42.372596740722656, -40.879364013671875, -39.386131286621094, -37.89290237426758, -36.3996696472168, -34.906436920166016, -33.4132080078125, -31.91997528076172, -30.426742553710938, -28.933509826660156, -27.440279006958008, -25.94704818725586, -24.453815460205078, -22.960582733154297, -21.46735191345215, -19.97412109375, -18.48088836669922, -16.987655639648438, -15.494424819946289, -14.001193046569824, -12.50796127319336, -11.014729499816895, -9.52149772644043, -8.028265953063965, -6.5350341796875, -5.041802406311035, -3.5485706329345703, -2.0553388595581055, -0.562103271484375, 0.9311285018920898, 2.4243602752685547, 3.9175920486450195, 5.410823822021484, 6.904055595397949, 8.397287368774414, 9.890519142150879, 11.383750915527344, 12.876982688903809, 14.370214462280273, 15.863446235656738, 17.356678009033203, 18.849910736083984, 20.343141555786133, 21.83637237548828, 23.329605102539062, 24.822837829589844, 26.316068649291992, 27.80929946899414, 29.302532196044922, 30.795764923095703, 32.28899383544922, 33.7822265625, 35.27545928955078, 36.76869201660156, 38.261924743652344, 39.75515365600586, 41.24838638305664, 42.74161911010742, 44.23484802246094, 45.72808074951172, 47.2213134765625]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 2.0, 14.0, 24.0, 16.0, 17.0, 28.0, 26.0, 29.0, 36.0, 29.0, 35.0, 28.0, 32.0, 28.0, 36.0, 45.0, 45.0, 43.0, 53.0, 47.0, 37.0, 44.0, 42.0, 44.0, 17.0, 21.0, 27.0, 16.0, 30.0, 12.0, 15.0, 10.0, 15.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.1419677734375, -71.64351654052734, -69.14507293701172, -66.64662170410156, -64.14817810058594, -61.64972686767578, -59.151275634765625, -56.652828216552734, -54.154380798339844, -51.65593338012695, -49.15748596191406, -46.659034729003906, -44.160587310791016, -41.662139892578125, -39.16368865966797, -36.66524124145508, -34.16679382324219, -31.668346405029297, -29.169897079467773, -26.67144775390625, -24.17300033569336, -21.67455291748047, -19.176103591918945, -16.677654266357422, -14.179206848144531, -11.680758476257324, -9.182310104370117, -6.68386173248291, -4.185413360595703, -1.686964988708496, 0.8114833831787109, 3.3099327087402344, 5.808387756347656, 8.306836128234863, 10.80528450012207, 13.303732872009277, 15.802181243896484, 18.300628662109375, 20.7990779876709, 23.297527313232422, 25.795974731445312, 28.294422149658203, 30.792871475219727, 33.29132080078125, 35.78976821899414, 38.28821563720703, 40.78666687011719, 43.28511428833008, 45.78356170654297, 48.28200912475586, 50.78045654296875, 53.278907775878906, 55.7773551940918, 58.27580261230469, 60.774253845214844, 63.272701263427734, 65.77114868164062, 68.26959991455078, 70.7680435180664, 73.26649475097656, 75.76493835449219, 78.26338958740234, 80.7618408203125, 83.26028442382812, 85.75873565673828]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 24.0, 34.0, 50.0, 66.0, 90.0, 133.0, 144.0, 192.0, 283.0, 382.0, 458.0, 573.0, 764.0, 894.0, 1182.0, 1383.0, 1657.0, 2026.0, 2361.0, 2685.0, 2842.0, 1012617.0, 2862.0, 2712.0, 2525.0, 2190.0, 1866.0, 1530.0, 1313.0, 1070.0, 828.0, 684.0, 525.0, 416.0, 304.0, 245.0, 183.0, 134.0, 121.0, 85.0, 37.0, 43.0, 29.0, 21.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-383.05731201171875, -370.6102294921875, -358.1631164550781, -345.7160339355469, -333.2689514160156, -320.82183837890625, -308.374755859375, -295.92767333984375, -283.4805908203125, -271.03350830078125, -258.5863952636719, -246.13931274414062, -233.69223022460938, -221.24513244628906, -208.79803466796875, -196.3509521484375, -183.90383911132812, -171.4567413330078, -159.00965881347656, -146.56256103515625, -134.115478515625, -121.66838073730469, -109.22128295898438, -96.7741928100586, -84.32710266113281, -71.88001251220703, -59.432918548583984, -46.98582458496094, -34.538734436035156, -22.091644287109375, -9.644546508789062, 2.8025436401367188, 15.249664306640625, 27.69675636291504, 40.14384841918945, 52.5909423828125, 65.03803253173828, 77.48512268066406, 89.93222045898438, 102.37931060791016, 114.82640075683594, 127.27349090576172, 139.7205810546875, 152.1676788330078, 164.61477661132812, 177.06185913085938, 189.5089569091797, 201.9560546875, 214.40313720703125, 226.85023498535156, 239.2973175048828, 251.74441528320312, 264.1914978027344, 276.63861083984375, 289.085693359375, 301.53277587890625, 313.9798583984375, 326.42694091796875, 338.8740539550781, 351.3211364746094, 363.7682189941406, 376.21533203125, 388.66241455078125, 401.1094970703125, 413.5566101074219]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 15.0, 14.0, 35.0, 32.0, 60.0, 105.0, 145.0, 185.0, 305.0, 450.0, 714.0, 1159.0, 1766.0, 2625.0, 4143.0, 5789.0, 8404.0, 11582.0, 15100.0, 19685.0, 36771.0, 51253180.0, 36742.0, 19663.0, 15029.0, 11387.0, 8496.0, 5920.0, 4035.0, 2669.0, 1809.0, 1150.0, 696.0, 474.0, 328.0, 207.0, 154.0, 94.0, 61.0, 39.0, 34.0, 16.0, 14.0, 10.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.5635681152344, -322.2576904296875, -310.9517822265625, -299.6459045410156, -288.34002685546875, -277.03411865234375, -265.7282409667969, -254.42234802246094, -243.116455078125, -231.81056213378906, -220.50466918945312, -209.19879150390625, -197.8928985595703, -186.58700561523438, -175.2811279296875, -163.97523498535156, -152.66934204101562, -141.3634490966797, -130.05755615234375, -118.75167846679688, -107.44578552246094, -96.139892578125, -84.8340072631836, -73.52812194824219, -62.22222900390625, -50.91633987426758, -39.610450744628906, -28.304561614990234, -16.998672485351562, -5.692783355712891, 5.613105773925781, 16.918991088867188, 28.22491455078125, 39.53080368041992, 50.836692810058594, 62.142581939697266, 73.44847106933594, 84.75436401367188, 96.06024932861328, 107.36613464355469, 118.67202758789062, 129.97792053222656, 141.2838134765625, 152.58969116210938, 163.8955841064453, 175.20147705078125, 186.50735473632812, 197.81324768066406, 209.119140625, 220.42503356933594, 231.73092651367188, 243.03680419921875, 254.3426971435547, 265.6485900878906, 276.9544677734375, 288.2603759765625, 299.5662536621094, 310.87213134765625, 322.17803955078125, 333.4839172363281, 344.789794921875, 356.095703125, 367.4015808105469, 378.70745849609375, 390.01336669921875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 11.0, 14.0, 22.0, 19.0, 28.0, 49.0, 87.0, 103.0, 155.0, 242.0, 353.0, 535.0, 920.0, 1449.0, 2496.0, 4385.0, 8368.0, 16250.0, 35721.0, 92784.0, 289902.0, 1204557.0, 3701703.0, 635767.0, 180877.0, 61994.0, 25565.0, 12017.0, 6285.0, 3504.0, 1949.0, 1160.0, 748.0, 491.0, 295.0, 209.0, 123.0, 92.0, 62.0, 36.0, 24.0, 30.0, 11.0, 10.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-39.8125, -38.580078125, -37.34765625, -36.115234375, -34.8828125, -33.650390625, -32.41796875, -31.185546875, -29.953125, -28.720703125, -27.48828125, -26.255859375, -25.0234375, -23.791015625, -22.55859375, -21.326171875, -20.09375, -18.861328125, -17.62890625, -16.396484375, -15.1640625, -13.931640625, -12.69921875, -11.466796875, -10.234375, -9.001953125, -7.76953125, -6.537109375, -5.3046875, -4.072265625, -2.83984375, -1.607421875, -0.375, 0.857421875, 2.08984375, 3.322265625, 4.5546875, 5.787109375, 7.01953125, 8.251953125, 9.484375, 10.716796875, 11.94921875, 13.181640625, 14.4140625, 15.646484375, 16.87890625, 18.111328125, 19.34375, 20.576171875, 21.80859375, 23.041015625, 24.2734375, 25.505859375, 26.73828125, 27.970703125, 29.203125, 30.435546875, 31.66796875, 32.900390625, 34.1328125, 35.365234375, 36.59765625, 37.830078125, 39.0625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 5.0, 10.0, 14.0, 16.0, 23.0, 26.0, 37.0, 39.0, 68.0, 60.0, 66.0, 78.0, 612.0, 472.0, 80.0, 69.0, 55.0, 50.0, 46.0, 34.0, 34.0, 21.0, 15.0, 17.0, 13.0, 8.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-93.75, -91.068359375, -88.38671875, -85.705078125, -83.0234375, -80.341796875, -77.66015625, -74.978515625, -72.296875, -69.615234375, -66.93359375, -64.251953125, -61.5703125, -58.888671875, -56.20703125, -53.525390625, -50.84375, -48.162109375, -45.48046875, -42.798828125, -40.1171875, -37.435546875, -34.75390625, -32.072265625, -29.390625, -26.708984375, -24.02734375, -21.345703125, -18.6640625, -15.982421875, -13.30078125, -10.619140625, -7.9375, -5.255859375, -2.57421875, 0.107421875, 2.7890625, 5.470703125, 8.15234375, 10.833984375, 13.515625, 16.197265625, 18.87890625, 21.560546875, 24.2421875, 26.923828125, 29.60546875, 32.287109375, 34.96875, 37.650390625, 40.33203125, 43.013671875, 45.6953125, 48.376953125, 51.05859375, 53.740234375, 56.421875, 59.103515625, 61.78515625, 64.466796875, 67.1484375, 69.830078125, 72.51171875, 75.193359375, 77.875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 19.0, 24.0, 53.0, 65.0, 104.0, 130.0, 192.0, 336.0, 466.0, 769.0, 1339.0, 2063.0, 3737.0, 6942.0, 13165.0, 26697.0, 58628.0, 143882.0, 396445.0, 1993532.0, 2911891.0, 448618.0, 158882.0, 63561.0, 28643.0, 13990.0, 7324.0, 4066.0, 2286.0, 1374.0, 800.0, 452.0, 345.0, 188.0, 134.0, 97.0, 58.0, 37.0, 24.0, 17.0, 11.0, 8.0, 1.0, 2.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-29.65625, -28.73095703125, -27.8056640625, -26.88037109375, -25.955078125, -25.02978515625, -24.1044921875, -23.17919921875, -22.25390625, -21.32861328125, -20.4033203125, -19.47802734375, -18.552734375, -17.62744140625, -16.7021484375, -15.77685546875, -14.8515625, -13.92626953125, -13.0009765625, -12.07568359375, -11.150390625, -10.22509765625, -9.2998046875, -8.37451171875, -7.44921875, -6.52392578125, -5.5986328125, -4.67333984375, -3.748046875, -2.82275390625, -1.8974609375, -0.97216796875, -0.046875, 0.87841796875, 1.8037109375, 2.72900390625, 3.654296875, 4.57958984375, 5.5048828125, 6.43017578125, 7.35546875, 8.28076171875, 9.2060546875, 10.13134765625, 11.056640625, 11.98193359375, 12.9072265625, 13.83251953125, 14.7578125, 15.68310546875, 16.6083984375, 17.53369140625, 18.458984375, 19.38427734375, 20.3095703125, 21.23486328125, 22.16015625, 23.08544921875, 24.0107421875, 24.93603515625, 25.861328125, 26.78662109375, 27.7119140625, 28.63720703125, 29.5625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 9.0, 8.0, 12.0, 11.0, 22.0, 25.0, 14.0, 27.0, 22.0, 31.0, 38.0, 50.0, 39.0, 69.0, 117.0, 317.0, 681.0, 99.0, 54.0, 45.0, 41.0, 38.0, 47.0, 38.0, 32.0, 17.0, 21.0, 20.0, 18.0, 16.0, 3.0, 5.0, 6.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-81.375, -79.20068359375, -77.0263671875, -74.85205078125, -72.677734375, -70.50341796875, -68.3291015625, -66.15478515625, -63.98046875, -61.80615234375, -59.6318359375, -57.45751953125, -55.283203125, -53.10888671875, -50.9345703125, -48.76025390625, -46.5859375, -44.41162109375, -42.2373046875, -40.06298828125, -37.888671875, -35.71435546875, -33.5400390625, -31.36572265625, -29.19140625, -27.01708984375, -24.8427734375, -22.66845703125, -20.494140625, -18.31982421875, -16.1455078125, -13.97119140625, -11.796875, -9.62255859375, -7.4482421875, -5.27392578125, -3.099609375, -0.92529296875, 1.2490234375, 3.42333984375, 5.59765625, 7.77197265625, 9.9462890625, 12.12060546875, 14.294921875, 16.46923828125, 18.6435546875, 20.81787109375, 22.9921875, 25.16650390625, 27.3408203125, 29.51513671875, 31.689453125, 33.86376953125, 36.0380859375, 38.21240234375, 40.38671875, 42.56103515625, 44.7353515625, 46.90966796875, 49.083984375, 51.25830078125, 53.4326171875, 55.60693359375, 57.78125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 21.0, 22.0, 14.0, 30.0, 36.0, 36.0, 47.0, 41.0, 70.0, 90.0, 112.0, 170.0, 200.0, 278.0, 372.0, 594.0, 719.0, 1211.0, 1821.0, 3146.0, 5685.0, 12442.0, 30833.0, 120597.0, 5946503.0, 110018.0, 29690.0, 12061.0, 5665.0, 3226.0, 1702.0, 1086.0, 776.0, 503.0, 344.0, 306.0, 218.0, 147.0, 147.0, 102.0, 64.0, 69.0, 28.0, 38.0, 45.0, 29.0, 16.0, 13.0, 5.0, 11.0, 6.0, 11.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-181.5, -175.734375, -169.96875, -164.203125, -158.4375, -152.671875, -146.90625, -141.140625, -135.375, -129.609375, -123.84375, -118.078125, -112.3125, -106.546875, -100.78125, -95.015625, -89.25, -83.484375, -77.71875, -71.953125, -66.1875, -60.421875, -54.65625, -48.890625, -43.125, -37.359375, -31.59375, -25.828125, -20.0625, -14.296875, -8.53125, -2.765625, 3.0, 8.765625, 14.53125, 20.296875, 26.0625, 31.828125, 37.59375, 43.359375, 49.125, 54.890625, 60.65625, 66.421875, 72.1875, 77.953125, 83.71875, 89.484375, 95.25, 101.015625, 106.78125, 112.546875, 118.3125, 124.078125, 129.84375, 135.609375, 141.375, 147.140625, 152.90625, 158.671875, 164.4375, 170.203125, 175.96875, 181.734375, 187.5]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 3.0, 8.0, 5.0, 8.0, 5.0, 12.0, 14.0, 10.0, 22.0, 21.0, 29.0, 24.0, 33.0, 40.0, 50.0, 63.0, 187.0, 760.0, 227.0, 74.0, 56.0, 49.0, 49.0, 46.0, 32.0, 34.0, 36.0, 21.0, 22.0, 16.0, 21.0, 8.0, 3.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-91.375, -88.5927734375, -85.810546875, -83.0283203125, -80.24609375, -77.4638671875, -74.681640625, -71.8994140625, -69.1171875, -66.3349609375, -63.552734375, -60.7705078125, -57.98828125, -55.2060546875, -52.423828125, -49.6416015625, -46.859375, -44.0771484375, -41.294921875, -38.5126953125, -35.73046875, -32.9482421875, -30.166015625, -27.3837890625, -24.6015625, -21.8193359375, -19.037109375, -16.2548828125, -13.47265625, -10.6904296875, -7.908203125, -5.1259765625, -2.34375, 0.4384765625, 3.220703125, 6.0029296875, 8.78515625, 11.5673828125, 14.349609375, 17.1318359375, 19.9140625, 22.6962890625, 25.478515625, 28.2607421875, 31.04296875, 33.8251953125, 36.607421875, 39.3896484375, 42.171875, 44.9541015625, 47.736328125, 50.5185546875, 53.30078125, 56.0830078125, 58.865234375, 61.6474609375, 64.4296875, 67.2119140625, 69.994140625, 72.7763671875, 75.55859375, 78.3408203125, 81.123046875, 83.9052734375, 86.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 22.0, 58.0, 222.0, 620.0, 43.0, 12.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2257.08203125, -2216.116943359375, -2175.15185546875, -2134.186767578125, -2093.2216796875, -2052.256591796875, -2011.29150390625, -1970.326416015625, -1929.361328125, -1888.396240234375, -1847.43115234375, -1806.466064453125, -1765.5009765625, -1724.535888671875, -1683.57080078125, -1642.605712890625, -1601.640625, -1560.675537109375, -1519.71044921875, -1478.745361328125, -1437.7802734375, -1396.815185546875, -1355.85009765625, -1314.885009765625, -1273.9200439453125, -1232.9549560546875, -1191.9898681640625, -1151.0247802734375, -1110.0596923828125, -1069.0946044921875, -1028.1295166015625, -987.1644287109375, -946.19921875, -905.234130859375, -864.26904296875, -823.303955078125, -782.3388671875, -741.373779296875, -700.40869140625, -659.443603515625, -618.4785766601562, -577.5134887695312, -536.5484008789062, -495.58331298828125, -454.61822509765625, -413.65313720703125, -372.6880798339844, -331.7229919433594, -290.7579040527344, -249.79281616210938, -208.82772827148438, -167.86265563964844, -126.89756774902344, -85.93247985839844, -44.9674072265625, -4.0023193359375, 36.9627685546875, 77.9278564453125, 118.89293670654297, 159.85801696777344, 200.82310485839844, 241.78819274902344, 282.7532653808594, 323.7183532714844, 364.6834411621094]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 18.0, 38.0, 59.0, 199.0, 510.0, 66.0, 35.0, 22.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1075.1649169921875, -1030.64794921875, -986.131103515625, -941.6141967773438, -897.0972900390625, -852.5803833007812, -808.0634765625, -763.5465698242188, -719.0296630859375, -674.5127563476562, -629.995849609375, -585.4789428710938, -540.9620361328125, -496.44512939453125, -451.92822265625, -407.41131591796875, -362.8944091796875, -318.37750244140625, -273.860595703125, -229.34368896484375, -184.8267822265625, -140.30987548828125, -95.79296875, -51.27606201171875, -6.7591552734375, 37.75775146484375, 82.274658203125, 126.79156494140625, 171.3084716796875, 215.82537841796875, 260.34228515625, 304.85919189453125, 349.3759765625, 393.89288330078125, 438.4097900390625, 482.92669677734375, 527.443603515625, 571.9605102539062, 616.4774169921875, 660.9943237304688, 705.51123046875, 750.0281372070312, 794.5450439453125, 839.0619506835938, 883.578857421875, 928.0957641601562, 972.6126708984375, 1017.1295776367188, 1061.646484375, 1106.163330078125, 1150.6802978515625, 1195.197265625, 1239.714111328125, 1284.23095703125, 1328.7479248046875, 1373.264892578125, 1417.78173828125, 1462.298583984375, 1506.8155517578125, 1551.33251953125, 1595.849365234375, 1640.3662109375, 1684.8831787109375, 1729.400146484375, 1773.9169921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 11.0, 11.0, 21.0, 43.0, 56.0, 59.0, 102.0, 135.0, 240.0, 306.0, 549.0, 813.0, 1295.0, 2272.0, 3933.0, 8042.0, 18336.0, 68190.0, 3396356.0, 618486.0, 44598.0, 15062.0, 6476.0, 3340.0, 1800.0, 1128.0, 725.0, 509.0, 330.0, 245.0, 202.0, 148.0, 103.0, 88.0, 67.0, 40.0, 38.0, 19.0, 26.0, 20.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.485107421875, -6.24365234375, -6.002197265625, -5.7607421875, -5.519287109375, -5.27783203125, -5.036376953125, -4.794921875, -4.553466796875, -4.31201171875, -4.070556640625, -3.8291015625, -3.587646484375, -3.34619140625, -3.104736328125, -2.86328125, -2.621826171875, -2.38037109375, -2.138916015625, -1.8974609375, -1.656005859375, -1.41455078125, -1.173095703125, -0.931640625, -0.690185546875, -0.44873046875, -0.207275390625, 0.0341796875, 0.275634765625, 0.51708984375, 0.758544921875, 1.0, 1.241455078125, 1.48291015625, 1.724365234375, 1.9658203125, 2.207275390625, 2.44873046875, 2.690185546875, 2.931640625, 3.173095703125, 3.41455078125, 3.656005859375, 3.8974609375, 4.138916015625, 4.38037109375, 4.621826171875, 4.86328125, 5.104736328125, 5.34619140625, 5.587646484375, 5.8291015625, 6.070556640625, 6.31201171875, 6.553466796875, 6.794921875, 7.036376953125, 7.27783203125, 7.519287109375, 7.7607421875, 8.002197265625, 8.24365234375, 8.485107421875, 8.7265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 3.0, 6.0, 14.0, 18.0, 56.0, 214.0, 418.0, 162.0, 30.0, 14.0, 10.0, 13.0, 6.0, 8.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59912109375, -0.5787429809570312, -0.5583648681640625, -0.5379867553710938, -0.517608642578125, -0.49723052978515625, -0.4768524169921875, -0.45647430419921875, -0.43609619140625, -0.41571807861328125, -0.3953399658203125, -0.37496185302734375, -0.354583740234375, -0.33420562744140625, -0.3138275146484375, -0.29344940185546875, -0.2730712890625, -0.25269317626953125, -0.2323150634765625, -0.21193695068359375, -0.191558837890625, -0.17118072509765625, -0.1508026123046875, -0.13042449951171875, -0.11004638671875, -0.08966827392578125, -0.0692901611328125, -0.04891204833984375, -0.028533935546875, -0.00815582275390625, 0.0122222900390625, 0.03260040283203125, 0.052978515625, 0.07335662841796875, 0.0937347412109375, 0.11411285400390625, 0.134490966796875, 0.15486907958984375, 0.1752471923828125, 0.19562530517578125, 0.21600341796875, 0.23638153076171875, 0.2567596435546875, 0.27713775634765625, 0.297515869140625, 0.31789398193359375, 0.3382720947265625, 0.35865020751953125, 0.3790283203125, 0.39940643310546875, 0.4197845458984375, 0.44016265869140625, 0.460540771484375, 0.48091888427734375, 0.5012969970703125, 0.5216751098632812, 0.54205322265625, 0.5624313354492188, 0.5828094482421875, 0.6031875610351562, 0.623565673828125, 0.6439437866210938, 0.6643218994140625, 0.6847000122070312, 0.705078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 15.0, 12.0, 13.0, 14.0, 18.0, 28.0, 36.0, 37.0, 65.0, 89.0, 140.0, 220.0, 251.0, 423.0, 699.0, 1389.0, 2739.0, 6181.0, 18210.0, 79353.0, 1111844.0, 2807632.0, 125721.0, 24316.0, 7797.0, 3225.0, 1566.0, 831.0, 502.0, 281.0, 174.0, 142.0, 82.0, 61.0, 41.0, 28.0, 22.0, 14.0, 16.0, 15.0, 12.0, 7.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.2578125, -7.03179931640625, -6.8057861328125, -6.57977294921875, -6.353759765625, -6.12774658203125, -5.9017333984375, -5.67572021484375, -5.44970703125, -5.22369384765625, -4.9976806640625, -4.77166748046875, -4.545654296875, -4.31964111328125, -4.0936279296875, -3.86761474609375, -3.6416015625, -3.41558837890625, -3.1895751953125, -2.96356201171875, -2.737548828125, -2.51153564453125, -2.2855224609375, -2.05950927734375, -1.83349609375, -1.60748291015625, -1.3814697265625, -1.15545654296875, -0.929443359375, -0.70343017578125, -0.4774169921875, -0.25140380859375, -0.025390625, 0.20062255859375, 0.4266357421875, 0.65264892578125, 0.878662109375, 1.10467529296875, 1.3306884765625, 1.55670166015625, 1.78271484375, 2.00872802734375, 2.2347412109375, 2.46075439453125, 2.686767578125, 2.91278076171875, 3.1387939453125, 3.36480712890625, 3.5908203125, 3.81683349609375, 4.0428466796875, 4.26885986328125, 4.494873046875, 4.72088623046875, 4.9468994140625, 5.17291259765625, 5.39892578125, 5.62493896484375, 5.8509521484375, 6.07696533203125, 6.302978515625, 6.52899169921875, 6.7550048828125, 6.98101806640625, 7.20703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 5.0, 8.0, 9.0, 11.0, 5.0, 9.0, 17.0, 21.0, 23.0, 28.0, 40.0, 46.0, 69.0, 71.0, 87.0, 116.0, 147.0, 206.0, 312.0, 408.0, 657.0, 424.0, 292.0, 207.0, 164.0, 133.0, 98.0, 92.0, 72.0, 60.0, 46.0, 43.0, 23.0, 32.0, 11.0, 9.0, 21.0, 12.0, 8.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.936553955078125, -0.90142822265625, -0.866302490234375, -0.8311767578125, -0.796051025390625, -0.76092529296875, -0.725799560546875, -0.690673828125, -0.655548095703125, -0.62042236328125, -0.585296630859375, -0.5501708984375, -0.515045166015625, -0.47991943359375, -0.444793701171875, -0.40966796875, -0.374542236328125, -0.33941650390625, -0.304290771484375, -0.2691650390625, -0.234039306640625, -0.19891357421875, -0.163787841796875, -0.128662109375, -0.093536376953125, -0.05841064453125, -0.023284912109375, 0.0118408203125, 0.046966552734375, 0.08209228515625, 0.117218017578125, 0.15234375, 0.187469482421875, 0.22259521484375, 0.257720947265625, 0.2928466796875, 0.327972412109375, 0.36309814453125, 0.398223876953125, 0.433349609375, 0.468475341796875, 0.50360107421875, 0.538726806640625, 0.5738525390625, 0.608978271484375, 0.64410400390625, 0.679229736328125, 0.71435546875, 0.749481201171875, 0.78460693359375, 0.819732666015625, 0.8548583984375, 0.889984130859375, 0.92510986328125, 0.960235595703125, 0.995361328125, 1.030487060546875, 1.06561279296875, 1.100738525390625, 1.1358642578125, 1.170989990234375, 1.20611572265625, 1.241241455078125, 1.2763671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 4.0, 4.0, 14.0, 20.0, 44.0, 55.0, 126.0, 195.0, 203.0, 127.0, 70.0, 42.0, 28.0, 15.0, 15.0, 13.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.504745483398438, -10.862683296203613, -10.220622062683105, -9.578559875488281, -8.936498641967773, -8.29443645477295, -7.652374267578125, -7.010312557220459, -6.368250846862793, -5.726189136505127, -5.084127426147461, -4.442065238952637, -3.8000035285949707, -3.1579418182373047, -2.5158798694610596, -1.8738179206848145, -1.2317562103271484, -0.5896943807601929, 0.052367448806762695, 0.6944292783737183, 1.3364911079406738, 1.9785528182983398, 2.620614767074585, 3.26267671585083, 3.904738426208496, 4.546800136566162, 5.188861846923828, 5.830924034118652, 6.472985744476318, 7.115047454833984, 7.757109642028809, 8.399171829223633, 9.04123306274414, 9.683295249938965, 10.325356483459473, 10.967418670654297, 11.609479904174805, 12.251542091369629, 12.893604278564453, 13.535665512084961, 14.177727699279785, 14.81978988647461, 15.461851119995117, 16.103912353515625, 16.745975494384766, 17.388036727905273, 18.03009796142578, 18.672161102294922, 19.31422233581543, 19.956283569335938, 20.598346710205078, 21.240407943725586, 21.882469177246094, 22.524532318115234, 23.166593551635742, 23.80865478515625, 24.45071792602539, 25.0927791595459, 25.73484230041504, 26.376903533935547, 27.018964767456055, 27.661026000976562, 28.303089141845703, 28.94515037536621, 29.58721160888672]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 6.0, 10.0, 10.0, 13.0, 10.0, 14.0, 12.0, 24.0, 27.0, 26.0, 20.0, 32.0, 24.0, 47.0, 45.0, 35.0, 48.0, 42.0, 38.0, 44.0, 33.0, 50.0, 35.0, 36.0, 39.0, 33.0, 40.0, 29.0, 31.0, 22.0, 17.0, 16.0, 13.0, 12.0, 19.0, 9.0, 3.0, 8.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.937492370605469, -8.650494575500488, -8.363497734069824, -8.076499938964844, -7.789502143859863, -7.502504825592041, -7.215507507324219, -6.928509712219238, -6.641512393951416, -6.354515075683594, -6.067517280578613, -5.780519962310791, -5.493522644042969, -5.206524848937988, -4.919527530670166, -4.632530212402344, -4.345532417297363, -4.058535099029541, -3.7715373039245605, -3.4845399856567383, -3.197542428970337, -2.9105448722839355, -2.6235475540161133, -2.336549997329712, -2.0495524406433105, -1.7625548839569092, -1.4755574464797974, -1.1885600090026855, -0.9015624523162842, -0.6145648956298828, -0.327567458152771, -0.04057002067565918, 0.24642658233642578, 0.5334240794181824, 0.820421576499939, 1.1074190139770508, 1.3944165706634521, 1.6814141273498535, 1.9684115648269653, 2.255409002304077, 2.5424065589904785, 2.82940411567688, 3.1164016723632812, 3.4033989906311035, 3.690396547317505, 3.9773941040039062, 4.2643914222717285, 4.551388740539551, 4.838386535644531, 5.1253838539123535, 5.412381649017334, 5.699378967285156, 5.986376762390137, 6.273374080657959, 6.560371398925781, 6.847369194030762, 7.134366512298584, 7.421363830566406, 7.708361625671387, 7.995358943939209, 8.282356262207031, 8.569354057312012, 8.856351852416992, 9.143348693847656, 9.430346488952637]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 12.0, 16.0, 21.0, 19.0, 36.0, 55.0, 62.0, 118.0, 198.0, 358.0, 631.0, 1262.0, 2820.0, 8120.0, 45048.0, 841935.0, 127070.0, 13283.0, 4041.0, 1572.0, 770.0, 421.0, 256.0, 140.0, 95.0, 63.0, 35.0, 31.0, 22.0, 13.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.859375, -8.5882568359375, -8.317138671875, -8.0460205078125, -7.77490234375, -7.5037841796875, -7.232666015625, -6.9615478515625, -6.6904296875, -6.4193115234375, -6.148193359375, -5.8770751953125, -5.60595703125, -5.3348388671875, -5.063720703125, -4.7926025390625, -4.521484375, -4.2503662109375, -3.979248046875, -3.7081298828125, -3.43701171875, -3.1658935546875, -2.894775390625, -2.6236572265625, -2.3525390625, -2.0814208984375, -1.810302734375, -1.5391845703125, -1.26806640625, -0.9969482421875, -0.725830078125, -0.4547119140625, -0.18359375, 0.0875244140625, 0.358642578125, 0.6297607421875, 0.90087890625, 1.1719970703125, 1.443115234375, 1.7142333984375, 1.9853515625, 2.2564697265625, 2.527587890625, 2.7987060546875, 3.06982421875, 3.3409423828125, 3.612060546875, 3.8831787109375, 4.154296875, 4.4254150390625, 4.696533203125, 4.9676513671875, 5.23876953125, 5.5098876953125, 5.781005859375, 6.0521240234375, 6.3232421875, 6.5943603515625, 6.865478515625, 7.1365966796875, 7.40771484375, 7.6788330078125, 7.949951171875, 8.2210693359375, 8.4921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 7.0, 13.0, 14.0, 29.0, 54.0, 112.0, 156.0, 198.0, 174.0, 104.0, 46.0, 30.0, 13.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4892578125, -0.467498779296875, -0.44573974609375, -0.423980712890625, -0.4022216796875, -0.380462646484375, -0.35870361328125, -0.336944580078125, -0.315185546875, -0.293426513671875, -0.27166748046875, -0.249908447265625, -0.2281494140625, -0.206390380859375, -0.18463134765625, -0.162872314453125, -0.14111328125, -0.119354248046875, -0.09759521484375, -0.075836181640625, -0.0540771484375, -0.032318115234375, -0.01055908203125, 0.011199951171875, 0.032958984375, 0.054718017578125, 0.07647705078125, 0.098236083984375, 0.1199951171875, 0.141754150390625, 0.16351318359375, 0.185272216796875, 0.20703125, 0.228790283203125, 0.25054931640625, 0.272308349609375, 0.2940673828125, 0.315826416015625, 0.33758544921875, 0.359344482421875, 0.381103515625, 0.402862548828125, 0.42462158203125, 0.446380615234375, 0.4681396484375, 0.489898681640625, 0.51165771484375, 0.533416748046875, 0.55517578125, 0.576934814453125, 0.59869384765625, 0.620452880859375, 0.6422119140625, 0.663970947265625, 0.68572998046875, 0.707489013671875, 0.729248046875, 0.751007080078125, 0.77276611328125, 0.794525146484375, 0.8162841796875, 0.838043212890625, 0.85980224609375, 0.881561279296875, 0.9033203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 7.0, 7.0, 5.0, 8.0, 6.0, 10.0, 18.0, 24.0, 61.0, 59.0, 102.0, 169.0, 261.0, 477.0, 948.0, 2093.0, 5485.0, 21487.0, 386889.0, 593412.0, 26227.0, 6201.0, 2300.0, 1070.0, 478.0, 263.0, 128.0, 109.0, 83.0, 48.0, 39.0, 24.0, 13.0, 14.0, 12.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.377685546875, -9.07568359375, -8.773681640625, -8.4716796875, -8.169677734375, -7.86767578125, -7.565673828125, -7.263671875, -6.961669921875, -6.65966796875, -6.357666015625, -6.0556640625, -5.753662109375, -5.45166015625, -5.149658203125, -4.84765625, -4.545654296875, -4.24365234375, -3.941650390625, -3.6396484375, -3.337646484375, -3.03564453125, -2.733642578125, -2.431640625, -2.129638671875, -1.82763671875, -1.525634765625, -1.2236328125, -0.921630859375, -0.61962890625, -0.317626953125, -0.015625, 0.286376953125, 0.58837890625, 0.890380859375, 1.1923828125, 1.494384765625, 1.79638671875, 2.098388671875, 2.400390625, 2.702392578125, 3.00439453125, 3.306396484375, 3.6083984375, 3.910400390625, 4.21240234375, 4.514404296875, 4.81640625, 5.118408203125, 5.42041015625, 5.722412109375, 6.0244140625, 6.326416015625, 6.62841796875, 6.930419921875, 7.232421875, 7.534423828125, 7.83642578125, 8.138427734375, 8.4404296875, 8.742431640625, 9.04443359375, 9.346435546875, 9.6484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 7.0, 7.0, 11.0, 13.0, 15.0, 5.0, 13.0, 20.0, 26.0, 29.0, 30.0, 26.0, 40.0, 44.0, 37.0, 46.0, 51.0, 53.0, 32.0, 51.0, 52.0, 42.0, 44.0, 35.0, 39.0, 30.0, 39.0, 29.0, 17.0, 23.0, 19.0, 16.0, 10.0, 14.0, 10.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.853240966796875, -2.76702880859375, -2.680816650390625, -2.5946044921875, -2.508392333984375, -2.42218017578125, -2.335968017578125, -2.249755859375, -2.163543701171875, -2.07733154296875, -1.991119384765625, -1.9049072265625, -1.818695068359375, -1.73248291015625, -1.646270751953125, -1.56005859375, -1.473846435546875, -1.38763427734375, -1.301422119140625, -1.2152099609375, -1.128997802734375, -1.04278564453125, -0.956573486328125, -0.870361328125, -0.784149169921875, -0.69793701171875, -0.611724853515625, -0.5255126953125, -0.439300537109375, -0.35308837890625, -0.266876220703125, -0.1806640625, -0.094451904296875, -0.00823974609375, 0.077972412109375, 0.1641845703125, 0.250396728515625, 0.33660888671875, 0.422821044921875, 0.509033203125, 0.595245361328125, 0.68145751953125, 0.767669677734375, 0.8538818359375, 0.940093994140625, 1.02630615234375, 1.112518310546875, 1.19873046875, 1.284942626953125, 1.37115478515625, 1.457366943359375, 1.5435791015625, 1.629791259765625, 1.71600341796875, 1.802215576171875, 1.888427734375, 1.974639892578125, 2.06085205078125, 2.147064208984375, 2.2332763671875, 2.319488525390625, 2.40570068359375, 2.491912841796875, 2.578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 18.0, 19.0, 25.0, 33.0, 49.0, 77.0, 130.0, 228.0, 500.0, 1240.0, 4260.0, 27318.0, 915246.0, 88248.0, 7844.0, 1894.0, 673.0, 278.0, 162.0, 89.0, 54.0, 47.0, 28.0, 21.0, 12.0, 10.0, 5.0, 11.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5234375, -11.1708984375, -10.818359375, -10.4658203125, -10.11328125, -9.7607421875, -9.408203125, -9.0556640625, -8.703125, -8.3505859375, -7.998046875, -7.6455078125, -7.29296875, -6.9404296875, -6.587890625, -6.2353515625, -5.8828125, -5.5302734375, -5.177734375, -4.8251953125, -4.47265625, -4.1201171875, -3.767578125, -3.4150390625, -3.0625, -2.7099609375, -2.357421875, -2.0048828125, -1.65234375, -1.2998046875, -0.947265625, -0.5947265625, -0.2421875, 0.1103515625, 0.462890625, 0.8154296875, 1.16796875, 1.5205078125, 1.873046875, 2.2255859375, 2.578125, 2.9306640625, 3.283203125, 3.6357421875, 3.98828125, 4.3408203125, 4.693359375, 5.0458984375, 5.3984375, 5.7509765625, 6.103515625, 6.4560546875, 6.80859375, 7.1611328125, 7.513671875, 7.8662109375, 8.21875, 8.5712890625, 8.923828125, 9.2763671875, 9.62890625, 9.9814453125, 10.333984375, 10.6865234375, 11.0390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 9.0, 8.0, 8.0, 6.0, 26.0, 29.0, 35.0, 65.0, 87.0, 116.0, 137.0, 149.0, 107.0, 54.0, 43.0, 21.0, 19.0, 13.0, 10.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0005340576171875, -0.0005208998918533325, -0.000507742166519165, -0.0004945844411849976, -0.0004814267158508301, -0.0004682689905166626, -0.0004551112651824951, -0.00044195353984832764, -0.00042879581451416016, -0.0004156380891799927, -0.0004024803638458252, -0.0003893226385116577, -0.00037616491317749023, -0.00036300718784332275, -0.0003498494625091553, -0.0003366917371749878, -0.0003235340118408203, -0.00031037628650665283, -0.00029721856117248535, -0.00028406083583831787, -0.0002709031105041504, -0.0002577453851699829, -0.00024458765983581543, -0.00023142993450164795, -0.00021827220916748047, -0.000205114483833313, -0.0001919567584991455, -0.00017879903316497803, -0.00016564130783081055, -0.00015248358249664307, -0.00013932585716247559, -0.0001261681318283081, -0.00011301040649414062, -9.985268115997314e-05, -8.669495582580566e-05, -7.353723049163818e-05, -6.03795051574707e-05, -4.722177982330322e-05, -3.406405448913574e-05, -2.0906329154968262e-05, -7.748603820800781e-06, 5.409121513366699e-06, 1.856684684753418e-05, 3.172457218170166e-05, 4.488229751586914e-05, 5.804002285003662e-05, 7.11977481842041e-05, 8.435547351837158e-05, 9.751319885253906e-05, 0.00011067092418670654, 0.00012382864952087402, 0.0001369863748550415, 0.00015014410018920898, 0.00016330182552337646, 0.00017645955085754395, 0.00018961727619171143, 0.0002027750015258789, 0.0002159327268600464, 0.00022909045219421387, 0.00024224817752838135, 0.00025540590286254883, 0.0002685636281967163, 0.0002817213535308838, 0.00029487907886505127, 0.00030803680419921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 18.0, 18.0, 28.0, 55.0, 118.0, 235.0, 608.0, 1878.0, 8366.0, 125529.0, 883904.0, 22573.0, 3478.0, 1007.0, 370.0, 171.0, 79.0, 53.0, 20.0, 21.0, 8.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0667724609375, -10.688232421875, -10.3096923828125, -9.93115234375, -9.5526123046875, -9.174072265625, -8.7955322265625, -8.4169921875, -8.0384521484375, -7.659912109375, -7.2813720703125, -6.90283203125, -6.5242919921875, -6.145751953125, -5.7672119140625, -5.388671875, -5.0101318359375, -4.631591796875, -4.2530517578125, -3.87451171875, -3.4959716796875, -3.117431640625, -2.7388916015625, -2.3603515625, -1.9818115234375, -1.603271484375, -1.2247314453125, -0.84619140625, -0.4676513671875, -0.089111328125, 0.2894287109375, 0.66796875, 1.0465087890625, 1.425048828125, 1.8035888671875, 2.18212890625, 2.5606689453125, 2.939208984375, 3.3177490234375, 3.6962890625, 4.0748291015625, 4.453369140625, 4.8319091796875, 5.21044921875, 5.5889892578125, 5.967529296875, 6.3460693359375, 6.724609375, 7.1031494140625, 7.481689453125, 7.8602294921875, 8.23876953125, 8.6173095703125, 8.995849609375, 9.3743896484375, 9.7529296875, 10.1314697265625, 10.510009765625, 10.8885498046875, 11.26708984375, 11.6456298828125, 12.024169921875, 12.4027099609375, 12.78125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 13.0, 8.0, 15.0, 19.0, 34.0, 31.0, 68.0, 81.0, 116.0, 115.0, 112.0, 114.0, 87.0, 48.0, 40.0, 28.0, 20.0, 9.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6640625, -4.53460693359375, -4.4051513671875, -4.27569580078125, -4.146240234375, -4.01678466796875, -3.8873291015625, -3.75787353515625, -3.62841796875, -3.49896240234375, -3.3695068359375, -3.24005126953125, -3.110595703125, -2.98114013671875, -2.8516845703125, -2.72222900390625, -2.5927734375, -2.46331787109375, -2.3338623046875, -2.20440673828125, -2.074951171875, -1.94549560546875, -1.8160400390625, -1.68658447265625, -1.55712890625, -1.42767333984375, -1.2982177734375, -1.16876220703125, -1.039306640625, -0.90985107421875, -0.7803955078125, -0.65093994140625, -0.521484375, -0.39202880859375, -0.2625732421875, -0.13311767578125, -0.003662109375, 0.12579345703125, 0.2552490234375, 0.38470458984375, 0.51416015625, 0.64361572265625, 0.7730712890625, 0.90252685546875, 1.031982421875, 1.16143798828125, 1.2908935546875, 1.42034912109375, 1.5498046875, 1.67926025390625, 1.8087158203125, 1.93817138671875, 2.067626953125, 2.19708251953125, 2.3265380859375, 2.45599365234375, 2.58544921875, 2.71490478515625, 2.8443603515625, 2.97381591796875, 3.103271484375, 3.23272705078125, 3.3621826171875, 3.49163818359375, 3.62109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 3.0, 10.0, 14.0, 47.0, 109.0, 288.0, 279.0, 120.0, 44.0, 22.0, 18.0, 11.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4100341796875, -32.678707122802734, -30.947376251220703, -29.216049194335938, -27.484718322753906, -25.75339126586914, -24.022062301635742, -22.290733337402344, -20.559404373168945, -18.828075408935547, -17.09674644470215, -15.365418434143066, -13.634089469909668, -11.90276050567627, -10.171432495117188, -8.440103530883789, -6.708774566650391, -4.977445602416992, -3.246117115020752, -1.5147886276245117, 0.21654033660888672, 1.9478693008422852, 3.679197311401367, 5.410526275634766, 7.141855239868164, 8.873184204101562, 10.604513168334961, 12.335841178894043, 14.067170143127441, 15.79849910736084, 17.529827117919922, 19.26115608215332, 20.99248504638672, 22.723814010620117, 24.455142974853516, 26.18647003173828, 27.917800903320312, 29.649127960205078, 31.380456924438477, 33.111785888671875, 34.843116760253906, 36.57444381713867, 38.3057746887207, 40.03710174560547, 41.7684326171875, 43.499759674072266, 45.23108673095703, 46.96241760253906, 48.69374465942383, 50.425071716308594, 52.156402587890625, 53.88772964477539, 55.61906051635742, 57.35038757324219, 59.08171844482422, 60.813045501708984, 62.54437255859375, 64.27570343017578, 66.00702667236328, 67.73835754394531, 69.46968841552734, 71.20101928710938, 72.93234252929688, 74.6636734008789, 76.39500427246094]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 7.0, 0.0, 2.0, 5.0, 3.0, 13.0, 10.0, 25.0, 41.0, 64.0, 82.0, 118.0, 122.0, 128.0, 125.0, 83.0, 65.0, 41.0, 15.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-64.34403991699219, -62.69165802001953, -61.039276123046875, -59.38689422607422, -57.73451614379883, -56.08213424682617, -54.429752349853516, -52.77737045288086, -51.12499237060547, -49.47261047363281, -47.820228576660156, -46.1678466796875, -44.51546859741211, -42.86308670043945, -41.2107048034668, -39.55832290649414, -37.905941009521484, -36.25355911254883, -34.60117721557617, -32.94879913330078, -31.296417236328125, -29.64403533935547, -27.991653442382812, -26.339271545410156, -24.686891555786133, -23.034509658813477, -21.382129669189453, -19.729747772216797, -18.07736587524414, -16.424985885620117, -14.772603988647461, -13.120223045349121, -11.467842102050781, -9.815461158752441, -8.163080215454102, -6.510698318481445, -4.8583173751831055, -3.2059364318847656, -1.5535545349121094, 0.09882640838623047, 1.7512073516845703, 3.4035885334014893, 5.055969715118408, 6.708351135253906, 8.360732078552246, 10.013113021850586, 11.665494918823242, 13.317875862121582, 14.970256805419922, 16.622638702392578, 18.2750186920166, 19.927400588989258, 21.57978057861328, 23.232162475585938, 24.884544372558594, 26.53692626953125, 28.189306259155273, 29.84168815612793, 31.494068145751953, 33.14645004272461, 34.798831939697266, 36.451210021972656, 38.10359191894531, 39.75597381591797, 41.408355712890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 7.0, 11.0, 22.0, 34.0, 57.0, 265.0, 8338.0, 4175632.0, 9395.0, 334.0, 65.0, 28.0, 20.0, 13.0, 8.0, 5.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5, -95.5595703125, -92.619140625, -89.6787109375, -86.73828125, -83.7978515625, -80.857421875, -77.9169921875, -74.9765625, -72.0361328125, -69.095703125, -66.1552734375, -63.21484375, -60.2744140625, -57.333984375, -54.3935546875, -51.453125, -48.5126953125, -45.572265625, -42.6318359375, -39.69140625, -36.7509765625, -33.810546875, -30.8701171875, -27.9296875, -24.9892578125, -22.048828125, -19.1083984375, -16.16796875, -13.2275390625, -10.287109375, -7.3466796875, -4.40625, -1.4658203125, 1.474609375, 4.4150390625, 7.35546875, 10.2958984375, 13.236328125, 16.1767578125, 19.1171875, 22.0576171875, 24.998046875, 27.9384765625, 30.87890625, 33.8193359375, 36.759765625, 39.7001953125, 42.640625, 45.5810546875, 48.521484375, 51.4619140625, 54.40234375, 57.3427734375, 60.283203125, 63.2236328125, 66.1640625, 69.1044921875, 72.044921875, 74.9853515625, 77.92578125, 80.8662109375, 83.806640625, 86.7470703125, 89.6875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 3.0, 9.0, 9.0, 12.0, 15.0, 17.0, 36.0, 54.0, 73.0, 87.0, 88.0, 104.0, 99.0, 102.0, 80.0, 54.0, 55.0, 23.0, 11.0, 11.0, 11.0, 8.0, 7.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36083984375, -0.34632110595703125, -0.3318023681640625, -0.31728363037109375, -0.302764892578125, -0.28824615478515625, -0.2737274169921875, -0.25920867919921875, -0.24468994140625, -0.23017120361328125, -0.2156524658203125, -0.20113372802734375, -0.186614990234375, -0.17209625244140625, -0.1575775146484375, -0.14305877685546875, -0.1285400390625, -0.11402130126953125, -0.0995025634765625, -0.08498382568359375, -0.070465087890625, -0.05594635009765625, -0.0414276123046875, -0.02690887451171875, -0.01239013671875, 0.00212860107421875, 0.0166473388671875, 0.03116607666015625, 0.045684814453125, 0.06020355224609375, 0.0747222900390625, 0.08924102783203125, 0.103759765625, 0.11827850341796875, 0.1327972412109375, 0.14731597900390625, 0.161834716796875, 0.17635345458984375, 0.1908721923828125, 0.20539093017578125, 0.21990966796875, 0.23442840576171875, 0.2489471435546875, 0.26346588134765625, 0.277984619140625, 0.29250335693359375, 0.3070220947265625, 0.32154083251953125, 0.3360595703125, 0.35057830810546875, 0.3650970458984375, 0.37961578369140625, 0.394134521484375, 0.40865325927734375, 0.4231719970703125, 0.43769073486328125, 0.45220947265625, 0.46672821044921875, 0.4812469482421875, 0.49576568603515625, 0.510284423828125, 0.5248031616210938, 0.5393218994140625, 0.5538406372070312, 0.568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 14.0, 30.0, 93.0, 236.0, 1937.0, 314737.0, 3872608.0, 3713.0, 510.0, 205.0, 95.0, 49.0, 28.0, 20.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -11.918701171875, -10.44677734375, -8.974853515625, -7.5029296875, -6.031005859375, -4.55908203125, -3.087158203125, -1.615234375, -0.143310546875, 1.32861328125, 2.800537109375, 4.2724609375, 5.744384765625, 7.21630859375, 8.688232421875, 10.16015625, 11.632080078125, 13.10400390625, 14.575927734375, 16.0478515625, 17.519775390625, 18.99169921875, 20.463623046875, 21.935546875, 23.407470703125, 24.87939453125, 26.351318359375, 27.8232421875, 29.295166015625, 30.76708984375, 32.239013671875, 33.7109375, 35.182861328125, 36.65478515625, 38.126708984375, 39.5986328125, 41.070556640625, 42.54248046875, 44.014404296875, 45.486328125, 46.958251953125, 48.43017578125, 49.902099609375, 51.3740234375, 52.845947265625, 54.31787109375, 55.789794921875, 57.26171875, 58.733642578125, 60.20556640625, 61.677490234375, 63.1494140625, 64.621337890625, 66.09326171875, 67.565185546875, 69.037109375, 70.509033203125, 71.98095703125, 73.452880859375, 74.9248046875, 76.396728515625, 77.86865234375, 79.340576171875, 80.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 9.0, 8.0, 7.0, 12.0, 16.0, 13.0, 14.0, 29.0, 30.0, 53.0, 57.0, 67.0, 110.0, 162.0, 337.0, 1055.0, 868.0, 470.0, 235.0, 138.0, 87.0, 51.0, 35.0, 39.0, 16.0, 22.0, 18.0, 14.0, 17.0, 10.0, 10.0, 9.0, 5.0, 5.0, 1.0, 7.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.78955078125, -0.7655563354492188, -0.7415618896484375, -0.7175674438476562, -0.693572998046875, -0.6695785522460938, -0.6455841064453125, -0.6215896606445312, -0.59759521484375, -0.5736007690429688, -0.5496063232421875, -0.5256118774414062, -0.501617431640625, -0.47762298583984375, -0.4536285400390625, -0.42963409423828125, -0.4056396484375, -0.38164520263671875, -0.3576507568359375, -0.33365631103515625, -0.309661865234375, -0.28566741943359375, -0.2616729736328125, -0.23767852783203125, -0.21368408203125, -0.18968963623046875, -0.1656951904296875, -0.14170074462890625, -0.117706298828125, -0.09371185302734375, -0.0697174072265625, -0.04572296142578125, -0.021728515625, 0.00226593017578125, 0.0262603759765625, 0.05025482177734375, 0.074249267578125, 0.09824371337890625, 0.1222381591796875, 0.14623260498046875, 0.17022705078125, 0.19422149658203125, 0.2182159423828125, 0.24221038818359375, 0.266204833984375, 0.29019927978515625, 0.3141937255859375, 0.33818817138671875, 0.3621826171875, 0.38617706298828125, 0.4101715087890625, 0.43416595458984375, 0.458160400390625, 0.48215484619140625, 0.5061492919921875, 0.5301437377929688, 0.55413818359375, 0.5781326293945312, 0.6021270751953125, 0.6261215209960938, 0.650115966796875, 0.6741104125976562, 0.6981048583984375, 0.7220993041992188, 0.74609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 904.0, 99.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.41563606262207, -8.240530014038086, -3.0654239654541016, 2.109682083129883, 7.284788131713867, 12.459894180297852, 17.635000228881836, 22.81010627746582, 27.985212326049805, 33.160316467285156, 38.335426330566406, 43.510528564453125, 48.685638427734375, 53.860740661621094, 59.035850524902344, 64.21095275878906, 69.38606262207031, 74.56117248535156, 79.73627471923828, 84.911376953125, 90.08648681640625, 95.2615966796875, 100.43669891357422, 105.61180114746094, 110.78691101074219, 115.96202087402344, 121.13712310791016, 126.31222534179688, 131.48733520507812, 136.66244506835938, 141.83755493164062, 147.0126495361328, 152.187744140625, 157.36285400390625, 162.5379638671875, 167.7130584716797, 172.88816833496094, 178.0632781982422, 183.23837280273438, 188.41348266601562, 193.58859252929688, 198.76370239257812, 203.93881225585938, 209.11390686035156, 214.2890167236328, 219.46412658691406, 224.63922119140625, 229.8143310546875, 234.98944091796875, 240.16455078125, 245.33966064453125, 250.51475524902344, 255.6898651123047, 260.8649597167969, 266.0400695800781, 271.2151794433594, 276.3902893066406, 281.5653991699219, 286.7405090332031, 291.9156188964844, 297.0906982421875, 302.26580810546875, 307.44091796875, 312.61602783203125, 317.7911376953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 3.0, 11.0, 14.0, 16.0, 33.0, 58.0, 62.0, 105.0, 102.0, 109.0, 103.0, 98.0, 91.0, 70.0, 42.0, 38.0, 21.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.060612201690674, -6.711625576019287, -6.3626389503479, -6.013652801513672, -5.664666175842285, -5.315679550170898, -4.966692924499512, -4.617706298828125, -4.268719673156738, -3.9197330474853516, -3.570746660232544, -3.2217600345611572, -2.8727736473083496, -2.523787021636963, -2.174800395965576, -1.8258140087127686, -1.476827621459961, -1.1278411149978638, -0.7788545489311218, -0.4298679828643799, -0.08088147640228271, 0.26810503005981445, 0.6170916557312012, 0.9660780429840088, 1.3150646686553955, 1.6640511751174927, 2.01303768157959, 2.3620243072509766, 2.7110109329223633, 3.059997320175171, 3.4089839458465576, 3.7579703330993652, 4.10695743560791, 4.455944061279297, 4.804930686950684, 5.15391731262207, 5.502903461456299, 5.8518900871276855, 6.200876712799072, 6.549862861633301, 6.8988494873046875, 7.247836112976074, 7.596822738647461, 7.945809364318848, 8.294795989990234, 8.643781661987305, 8.992769241333008, 9.341754913330078, 9.690742492675781, 10.039729118347168, 10.388715744018555, 10.737702369689941, 11.086688995361328, 11.435674667358398, 11.784662246704102, 12.133647918701172, 12.482634544372559, 12.831621170043945, 13.180607795715332, 13.529594421386719, 13.878581047058105, 14.227567672729492, 14.576553344726562, 14.92553997039795, 15.274526596069336]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 2.0, 4.0, 10.0, 7.0, 14.0, 21.0, 33.0, 49.0, 65.0, 146.0, 318.0, 899.0, 2558.0, 9876.0, 62380.0, 751077.0, 193986.0, 20197.0, 4544.0, 1302.0, 531.0, 220.0, 114.0, 66.0, 33.0, 21.0, 26.0, 12.0, 11.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.40625, -14.0029296875, -13.599609375, -13.1962890625, -12.79296875, -12.3896484375, -11.986328125, -11.5830078125, -11.1796875, -10.7763671875, -10.373046875, -9.9697265625, -9.56640625, -9.1630859375, -8.759765625, -8.3564453125, -7.953125, -7.5498046875, -7.146484375, -6.7431640625, -6.33984375, -5.9365234375, -5.533203125, -5.1298828125, -4.7265625, -4.3232421875, -3.919921875, -3.5166015625, -3.11328125, -2.7099609375, -2.306640625, -1.9033203125, -1.5, -1.0966796875, -0.693359375, -0.2900390625, 0.11328125, 0.5166015625, 0.919921875, 1.3232421875, 1.7265625, 2.1298828125, 2.533203125, 2.9365234375, 3.33984375, 3.7431640625, 4.146484375, 4.5498046875, 4.953125, 5.3564453125, 5.759765625, 6.1630859375, 6.56640625, 6.9697265625, 7.373046875, 7.7763671875, 8.1796875, 8.5830078125, 8.986328125, 9.3896484375, 9.79296875, 10.1962890625, 10.599609375, 11.0029296875, 11.40625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 19.0, 19.0, 38.0, 61.0, 86.0, 147.0, 144.0, 127.0, 119.0, 82.0, 48.0, 40.0, 25.0, 17.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0498313903808594, -1.0264205932617188, -1.0030097961425781, -0.9795989990234375, -0.9561882019042969, -0.9327774047851562, -0.9093666076660156, -0.885955810546875, -0.8625450134277344, -0.8391342163085938, -0.8157234191894531, -0.7923126220703125, -0.7689018249511719, -0.7454910278320312, -0.7220802307128906, -0.69866943359375, -0.6752586364746094, -0.6518478393554688, -0.6284370422363281, -0.6050262451171875, -0.5816154479980469, -0.5582046508789062, -0.5347938537597656, -0.511383056640625, -0.4879722595214844, -0.46456146240234375, -0.4411506652832031, -0.4177398681640625, -0.3943290710449219, -0.37091827392578125, -0.3475074768066406, -0.3240966796875, -0.3006858825683594, -0.27727508544921875, -0.2538642883300781, -0.2304534912109375, -0.20704269409179688, -0.18363189697265625, -0.16022109985351562, -0.136810302734375, -0.11339950561523438, -0.08998870849609375, -0.06657791137695312, -0.0431671142578125, -0.019756317138671875, 0.00365447998046875, 0.027065277099609375, 0.05047607421875, 0.07388687133789062, 0.09729766845703125, 0.12070846557617188, 0.1441192626953125, 0.16753005981445312, 0.19094085693359375, 0.21435165405273438, 0.237762451171875, 0.2611732482910156, 0.28458404541015625, 0.3079948425292969, 0.3314056396484375, 0.3548164367675781, 0.37822723388671875, 0.4016380310058594, 0.425048828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 4.0, 11.0, 18.0, 17.0, 19.0, 19.0, 13.0, 28.0, 80.0, 273.0, 2358.0, 188570.0, 852173.0, 4344.0, 345.0, 75.0, 35.0, 22.0, 15.0, 18.0, 9.0, 13.0, 11.0, 11.0, 6.0, 5.0, 9.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.828125, -27.012451171875, -26.19677734375, -25.381103515625, -24.5654296875, -23.749755859375, -22.93408203125, -22.118408203125, -21.302734375, -20.487060546875, -19.67138671875, -18.855712890625, -18.0400390625, -17.224365234375, -16.40869140625, -15.593017578125, -14.77734375, -13.961669921875, -13.14599609375, -12.330322265625, -11.5146484375, -10.698974609375, -9.88330078125, -9.067626953125, -8.251953125, -7.436279296875, -6.62060546875, -5.804931640625, -4.9892578125, -4.173583984375, -3.35791015625, -2.542236328125, -1.7265625, -0.910888671875, -0.09521484375, 0.720458984375, 1.5361328125, 2.351806640625, 3.16748046875, 3.983154296875, 4.798828125, 5.614501953125, 6.43017578125, 7.245849609375, 8.0615234375, 8.877197265625, 9.69287109375, 10.508544921875, 11.32421875, 12.139892578125, 12.95556640625, 13.771240234375, 14.5869140625, 15.402587890625, 16.21826171875, 17.033935546875, 17.849609375, 18.665283203125, 19.48095703125, 20.296630859375, 21.1123046875, 21.927978515625, 22.74365234375, 23.559326171875, 24.375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 9.0, 10.0, 13.0, 19.0, 14.0, 21.0, 18.0, 31.0, 26.0, 37.0, 34.0, 44.0, 38.0, 37.0, 38.0, 40.0, 49.0, 43.0, 41.0, 41.0, 44.0, 45.0, 43.0, 41.0, 35.0, 23.0, 25.0, 27.0, 20.0, 19.0, 16.0, 8.0, 11.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.046875, -1.9837188720703125, -1.920562744140625, -1.8574066162109375, -1.79425048828125, -1.7310943603515625, -1.667938232421875, -1.6047821044921875, -1.5416259765625, -1.4784698486328125, -1.415313720703125, -1.3521575927734375, -1.28900146484375, -1.2258453369140625, -1.162689208984375, -1.0995330810546875, -1.036376953125, -0.9732208251953125, -0.910064697265625, -0.8469085693359375, -0.78375244140625, -0.7205963134765625, -0.657440185546875, -0.5942840576171875, -0.5311279296875, -0.4679718017578125, -0.404815673828125, -0.3416595458984375, -0.27850341796875, -0.2153472900390625, -0.152191162109375, -0.0890350341796875, -0.02587890625, 0.0372772216796875, 0.100433349609375, 0.1635894775390625, 0.22674560546875, 0.2899017333984375, 0.353057861328125, 0.4162139892578125, 0.4793701171875, 0.5425262451171875, 0.605682373046875, 0.6688385009765625, 0.73199462890625, 0.7951507568359375, 0.858306884765625, 0.9214630126953125, 0.984619140625, 1.0477752685546875, 1.110931396484375, 1.1740875244140625, 1.23724365234375, 1.3003997802734375, 1.363555908203125, 1.4267120361328125, 1.4898681640625, 1.5530242919921875, 1.616180419921875, 1.6793365478515625, 1.74249267578125, 1.8056488037109375, 1.868804931640625, 1.9319610595703125, 1.9951171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 21.0, 51.0, 170.0, 1534.0, 1043486.0, 2954.0, 221.0, 52.0, 23.0, 12.0, 3.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.375, -120.30859375, -116.2421875, -112.17578125, -108.109375, -104.04296875, -99.9765625, -95.91015625, -91.84375, -87.77734375, -83.7109375, -79.64453125, -75.578125, -71.51171875, -67.4453125, -63.37890625, -59.3125, -55.24609375, -51.1796875, -47.11328125, -43.046875, -38.98046875, -34.9140625, -30.84765625, -26.78125, -22.71484375, -18.6484375, -14.58203125, -10.515625, -6.44921875, -2.3828125, 1.68359375, 5.75, 9.81640625, 13.8828125, 17.94921875, 22.015625, 26.08203125, 30.1484375, 34.21484375, 38.28125, 42.34765625, 46.4140625, 50.48046875, 54.546875, 58.61328125, 62.6796875, 66.74609375, 70.8125, 74.87890625, 78.9453125, 83.01171875, 87.078125, 91.14453125, 95.2109375, 99.27734375, 103.34375, 107.41015625, 111.4765625, 115.54296875, 119.609375, 123.67578125, 127.7421875, 131.80859375, 135.875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 3.0, 8.0, 5.0, 10.0, 5.0, 19.0, 16.0, 16.0, 15.0, 15.0, 25.0, 27.0, 38.0, 38.0, 56.0, 76.0, 103.0, 101.0, 94.0, 62.0, 41.0, 35.0, 32.0, 19.0, 18.0, 24.0, 9.0, 14.0, 10.0, 10.0, 8.0, 5.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008368492126464844, -0.0008098185062408447, -0.0007827877998352051, -0.0007557570934295654, -0.0007287263870239258, -0.0007016956806182861, -0.0006746649742126465, -0.0006476342678070068, -0.0006206035614013672, -0.0005935728549957275, -0.0005665421485900879, -0.0005395114421844482, -0.0005124807357788086, -0.00048545002937316895, -0.0004584193229675293, -0.00043138861656188965, -0.00040435791015625, -0.00037732720375061035, -0.0003502964973449707, -0.00032326579093933105, -0.0002962350845336914, -0.00026920437812805176, -0.0002421736717224121, -0.00021514296531677246, -0.0001881122589111328, -0.00016108155250549316, -0.00013405084609985352, -0.00010702013969421387, -7.998943328857422e-05, -5.295872688293457e-05, -2.5928020477294922e-05, 1.1026859283447266e-06, 2.8133392333984375e-05, 5.5164098739624023e-05, 8.219480514526367e-05, 0.00010922551155090332, 0.00013625621795654297, 0.00016328692436218262, 0.00019031763076782227, 0.00021734833717346191, 0.00024437904357910156, 0.0002714097499847412, 0.00029844045639038086, 0.0003254711627960205, 0.00035250186920166016, 0.0003795325756072998, 0.00040656328201293945, 0.0004335939884185791, 0.00046062469482421875, 0.0004876554012298584, 0.000514686107635498, 0.0005417168140411377, 0.0005687475204467773, 0.000595778226852417, 0.0006228089332580566, 0.0006498396396636963, 0.0006768703460693359, 0.0007039010524749756, 0.0007309317588806152, 0.0007579624652862549, 0.0007849931716918945, 0.0008120238780975342, 0.0008390545845031738, 0.0008660852909088135, 0.0008931159973144531]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 7.0, 7.0, 24.0, 28.0, 22.0, 34.0, 40.0, 66.0, 101.0, 147.0, 252.0, 426.0, 730.0, 1712.0, 4251.0, 13401.0, 62114.0, 729740.0, 196809.0, 26033.0, 7275.0, 2717.0, 1157.0, 625.0, 301.0, 178.0, 129.0, 61.0, 46.0, 29.0, 18.0, 17.0, 4.0, 9.0, 10.0, 2.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.609375, -16.1312255859375, -15.653076171875, -15.1749267578125, -14.69677734375, -14.2186279296875, -13.740478515625, -13.2623291015625, -12.7841796875, -12.3060302734375, -11.827880859375, -11.3497314453125, -10.87158203125, -10.3934326171875, -9.915283203125, -9.4371337890625, -8.958984375, -8.4808349609375, -8.002685546875, -7.5245361328125, -7.04638671875, -6.5682373046875, -6.090087890625, -5.6119384765625, -5.1337890625, -4.6556396484375, -4.177490234375, -3.6993408203125, -3.22119140625, -2.7430419921875, -2.264892578125, -1.7867431640625, -1.30859375, -0.8304443359375, -0.352294921875, 0.1258544921875, 0.60400390625, 1.0821533203125, 1.560302734375, 2.0384521484375, 2.5166015625, 2.9947509765625, 3.472900390625, 3.9510498046875, 4.42919921875, 4.9073486328125, 5.385498046875, 5.8636474609375, 6.341796875, 6.8199462890625, 7.298095703125, 7.7762451171875, 8.25439453125, 8.7325439453125, 9.210693359375, 9.6888427734375, 10.1669921875, 10.6451416015625, 11.123291015625, 11.6014404296875, 12.07958984375, 12.5577392578125, 13.035888671875, 13.5140380859375, 13.9921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 7.0, 21.0, 36.0, 49.0, 90.0, 165.0, 228.0, 179.0, 87.0, 56.0, 32.0, 22.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.71875, -13.4100341796875, -13.101318359375, -12.7926025390625, -12.48388671875, -12.1751708984375, -11.866455078125, -11.5577392578125, -11.2490234375, -10.9403076171875, -10.631591796875, -10.3228759765625, -10.01416015625, -9.7054443359375, -9.396728515625, -9.0880126953125, -8.779296875, -8.4705810546875, -8.161865234375, -7.8531494140625, -7.54443359375, -7.2357177734375, -6.927001953125, -6.6182861328125, -6.3095703125, -6.0008544921875, -5.692138671875, -5.3834228515625, -5.07470703125, -4.7659912109375, -4.457275390625, -4.1485595703125, -3.83984375, -3.5311279296875, -3.222412109375, -2.9136962890625, -2.60498046875, -2.2962646484375, -1.987548828125, -1.6788330078125, -1.3701171875, -1.0614013671875, -0.752685546875, -0.4439697265625, -0.13525390625, 0.1734619140625, 0.482177734375, 0.7908935546875, 1.099609375, 1.4083251953125, 1.717041015625, 2.0257568359375, 2.33447265625, 2.6431884765625, 2.951904296875, 3.2606201171875, 3.5693359375, 3.8780517578125, 4.186767578125, 4.4954833984375, 4.80419921875, 5.1129150390625, 5.421630859375, 5.7303466796875, 6.0390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 10.0, 37.0, 81.0, 173.0, 290.0, 226.0, 96.0, 34.0, 12.0, 15.0, 6.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.779842376708984, -42.96872329711914, -41.1576042175293, -39.34648895263672, -37.535369873046875, -35.72425079345703, -33.91313171386719, -32.102012634277344, -30.290895462036133, -28.47977638244629, -26.668659210205078, -24.857540130615234, -23.04642105102539, -21.23530387878418, -19.424184799194336, -17.613067626953125, -15.801948547363281, -13.990830421447754, -12.179712295532227, -10.368593215942383, -8.557475090026855, -6.746356964111328, -4.935237884521484, -3.124119758605957, -1.3130016326904297, 0.49811673164367676, 2.309235095977783, 4.120353698730469, 5.931471824645996, 7.742589950561523, 9.553709030151367, 11.364827156066895, 13.175949096679688, 14.987067222595215, 16.798185348510742, 18.609304428100586, 20.420421600341797, 22.23154067993164, 24.042659759521484, 25.853778839111328, 27.66489601135254, 29.476015090942383, 31.287132263183594, 33.09825134277344, 34.90937042236328, 36.720489501953125, 38.53160858154297, 40.34272384643555, 42.15384292602539, 43.964962005615234, 45.77608108520508, 47.587196350097656, 49.3983154296875, 51.209434509277344, 53.02055358886719, 54.83167266845703, 56.642791748046875, 58.45391082763672, 60.26502990722656, 62.076148986816406, 63.887264251708984, 65.69837951660156, 67.50950622558594, 69.32061767578125, 71.1317367553711]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 9.0, 11.0, 25.0, 22.0, 48.0, 53.0, 60.0, 78.0, 98.0, 90.0, 74.0, 89.0, 69.0, 57.0, 49.0, 42.0, 31.0, 21.0, 23.0, 7.0, 7.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.773853302001953, -23.75680160522461, -22.739749908447266, -21.722698211669922, -20.705646514892578, -19.688594818115234, -18.671545028686523, -17.65449333190918, -16.637441635131836, -15.620389938354492, -14.603338241577148, -13.586287498474121, -12.569235801696777, -11.552184104919434, -10.535133361816406, -9.518081665039062, -8.501029968261719, -7.483978271484375, -6.4669270515441895, -5.449875831604004, -4.43282413482666, -3.4157724380493164, -2.398721218109131, -1.3816699981689453, -0.36461830139160156, 0.6524331569671631, 1.6694846153259277, 2.6865360736846924, 3.703587532043457, 4.720639228820801, 5.737690448760986, 6.754741668701172, 7.77178955078125, 8.788841247558594, 9.805892944335938, 10.822943687438965, 11.839995384216309, 12.857047080993652, 13.87409782409668, 14.891149520874023, 15.908201217651367, 16.92525291442871, 17.942304611206055, 18.9593563079834, 19.97640609741211, 20.993457794189453, 22.010509490966797, 23.02756118774414, 24.044612884521484, 25.061664581298828, 26.078716278076172, 27.095767974853516, 28.11281967163086, 29.129871368408203, 30.146921157836914, 31.163972854614258, 32.18102264404297, 33.19807434082031, 34.215126037597656, 35.232177734375, 36.249229431152344, 37.26628112792969, 38.28333282470703, 39.300384521484375, 40.31743621826172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 8.0, 0.0, 8.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 10.0, 2.0, 12.0, 20.0, 2.0, 26.0, 23.0, 27.0, 54.0, 409.0, 8044.0, 4133207.0, 50964.0, 1053.0, 193.0, 60.0, 35.0, 23.0, 14.0, 4.0, 8.0, 16.0, 14.0, 4.0, 4.0, 4.0, 2.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-48.15625, -46.28173828125, -44.4072265625, -42.53271484375, -40.658203125, -38.78369140625, -36.9091796875, -35.03466796875, -33.16015625, -31.28564453125, -29.4111328125, -27.53662109375, -25.662109375, -23.78759765625, -21.9130859375, -20.03857421875, -18.1640625, -16.28955078125, -14.4150390625, -12.54052734375, -10.666015625, -8.79150390625, -6.9169921875, -5.04248046875, -3.16796875, -1.29345703125, 0.5810546875, 2.45556640625, 4.330078125, 6.20458984375, 8.0791015625, 9.95361328125, 11.828125, 13.70263671875, 15.5771484375, 17.45166015625, 19.326171875, 21.20068359375, 23.0751953125, 24.94970703125, 26.82421875, 28.69873046875, 30.5732421875, 32.44775390625, 34.322265625, 36.19677734375, 38.0712890625, 39.94580078125, 41.8203125, 43.69482421875, 45.5693359375, 47.44384765625, 49.318359375, 51.19287109375, 53.0673828125, 54.94189453125, 56.81640625, 58.69091796875, 60.5654296875, 62.43994140625, 64.314453125, 66.18896484375, 68.0634765625, 69.93798828125, 71.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 12.0, 12.0, 22.0, 27.0, 21.0, 32.0, 37.0, 45.0, 59.0, 58.0, 48.0, 61.0, 58.0, 62.0, 54.0, 54.0, 44.0, 37.0, 35.0, 40.0, 30.0, 21.0, 16.0, 14.0, 17.0, 18.0, 11.0, 3.0, 3.0, 7.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3305320739746094, -0.31853485107421875, -0.3065376281738281, -0.2945404052734375, -0.2825431823730469, -0.27054595947265625, -0.2585487365722656, -0.246551513671875, -0.23455429077148438, -0.22255706787109375, -0.21055984497070312, -0.1985626220703125, -0.18656539916992188, -0.17456817626953125, -0.16257095336914062, -0.15057373046875, -0.13857650756835938, -0.12657928466796875, -0.11458206176757812, -0.1025848388671875, -0.09058761596679688, -0.07859039306640625, -0.06659317016601562, -0.054595947265625, -0.042598724365234375, -0.03060150146484375, -0.018604278564453125, -0.0066070556640625, 0.005390167236328125, 0.01738739013671875, 0.029384613037109375, 0.0413818359375, 0.053379058837890625, 0.06537628173828125, 0.07737350463867188, 0.0893707275390625, 0.10136795043945312, 0.11336517333984375, 0.12536239624023438, 0.137359619140625, 0.14935684204101562, 0.16135406494140625, 0.17335128784179688, 0.1853485107421875, 0.19734573364257812, 0.20934295654296875, 0.22134017944335938, 0.23333740234375, 0.24533462524414062, 0.25733184814453125, 0.2693290710449219, 0.2813262939453125, 0.2933235168457031, 0.30532073974609375, 0.3173179626464844, 0.329315185546875, 0.3413124084472656, 0.35330963134765625, 0.3653068542480469, 0.3773040771484375, 0.3893013000488281, 0.40129852294921875, 0.4132957458496094, 0.42529296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 40.0, 93.0, 375.0, 15239.0, 4177200.0, 1187.0, 90.0, 41.0, 12.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.125, -170.91796875, -167.7109375, -164.50390625, -161.296875, -158.08984375, -154.8828125, -151.67578125, -148.46875, -145.26171875, -142.0546875, -138.84765625, -135.640625, -132.43359375, -129.2265625, -126.01953125, -122.8125, -119.60546875, -116.3984375, -113.19140625, -109.984375, -106.77734375, -103.5703125, -100.36328125, -97.15625, -93.94921875, -90.7421875, -87.53515625, -84.328125, -81.12109375, -77.9140625, -74.70703125, -71.5, -68.29296875, -65.0859375, -61.87890625, -58.671875, -55.46484375, -52.2578125, -49.05078125, -45.84375, -42.63671875, -39.4296875, -36.22265625, -33.015625, -29.80859375, -26.6015625, -23.39453125, -20.1875, -16.98046875, -13.7734375, -10.56640625, -7.359375, -4.15234375, -0.9453125, 2.26171875, 5.46875, 8.67578125, 11.8828125, 15.08984375, 18.296875, 21.50390625, 24.7109375, 27.91796875, 31.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 14.0, 23.0, 28.0, 52.0, 76.0, 135.0, 231.0, 588.0, 1887.0, 487.0, 202.0, 110.0, 81.0, 47.0, 37.0, 11.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2982635498046875, -2.235198974609375, -2.1721343994140625, -2.10906982421875, -2.0460052490234375, -1.982940673828125, -1.9198760986328125, -1.8568115234375, -1.7937469482421875, -1.730682373046875, -1.6676177978515625, -1.60455322265625, -1.5414886474609375, -1.478424072265625, -1.4153594970703125, -1.352294921875, -1.2892303466796875, -1.226165771484375, -1.1631011962890625, -1.10003662109375, -1.0369720458984375, -0.973907470703125, -0.9108428955078125, -0.8477783203125, -0.7847137451171875, -0.721649169921875, -0.6585845947265625, -0.59552001953125, -0.5324554443359375, -0.469390869140625, -0.4063262939453125, -0.34326171875, -0.2801971435546875, -0.217132568359375, -0.1540679931640625, -0.09100341796875, -0.0279388427734375, 0.035125732421875, 0.0981903076171875, 0.1612548828125, 0.2243194580078125, 0.287384033203125, 0.3504486083984375, 0.41351318359375, 0.4765777587890625, 0.539642333984375, 0.6027069091796875, 0.665771484375, 0.7288360595703125, 0.791900634765625, 0.8549652099609375, 0.91802978515625, 0.9810943603515625, 1.044158935546875, 1.1072235107421875, 1.1702880859375, 1.2333526611328125, 1.296417236328125, 1.3594818115234375, 1.42254638671875, 1.4856109619140625, 1.548675537109375, 1.6117401123046875, 1.6748046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 906.0, 108.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-430.1242370605469, -422.2818908691406, -414.4395446777344, -406.5971984863281, -398.7548522949219, -390.9125061035156, -383.0701599121094, -375.2278137207031, -367.3854675292969, -359.5431213378906, -351.7007751464844, -343.8584289550781, -336.0160827636719, -328.1737365722656, -320.3313903808594, -312.4890441894531, -304.6466979980469, -296.8043518066406, -288.9620056152344, -281.1196594238281, -273.2773132324219, -265.4349670410156, -257.5926208496094, -249.75027465820312, -241.9079132080078, -234.06556701660156, -226.2232208251953, -218.38087463378906, -210.5385284423828, -202.69618225097656, -194.8538360595703, -187.01148986816406, -179.16912841796875, -171.3267822265625, -163.48443603515625, -155.64208984375, -147.79974365234375, -139.9573974609375, -132.11505126953125, -124.272705078125, -116.43035888671875, -108.5880126953125, -100.74566650390625, -92.9033203125, -85.06097412109375, -77.2186279296875, -69.37628173828125, -61.533931732177734, -53.69158935546875, -45.8492431640625, -38.00689697265625, -30.164548873901367, -22.322202682495117, -14.479854583740234, -6.637508392333984, 1.2048377990722656, 9.047183990478516, 16.889530181884766, 24.731876373291016, 32.57422637939453, 40.41657257080078, 48.25891876220703, 56.10126495361328, 63.94361114501953, 71.78595733642578]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 19.0, 15.0, 31.0, 48.0, 62.0, 69.0, 109.0, 95.0, 105.0, 88.0, 88.0, 72.0, 58.0, 43.0, 24.0, 27.0, 17.0, 9.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.358285903930664, -20.849388122558594, -20.340490341186523, -19.831592559814453, -19.322694778442383, -18.813796997070312, -18.304899215698242, -17.796001434326172, -17.2871036529541, -16.77820587158203, -16.26930809020996, -15.76041030883789, -15.25151252746582, -14.74261474609375, -14.23371696472168, -13.72481918334961, -13.215920448303223, -12.707022666931152, -12.198124885559082, -11.689227104187012, -11.180329322814941, -10.671431541442871, -10.162532806396484, -9.653635025024414, -9.144737243652344, -8.635839462280273, -8.126941680908203, -7.618043899536133, -7.1091461181640625, -6.600248336791992, -6.091350078582764, -5.582452297210693, -5.073554992675781, -4.564657211303711, -4.055759429931641, -3.546861410140991, -3.037963628768921, -2.5290658473968506, -2.020167827606201, -1.5112700462341309, -1.0023722648620605, -0.49347442388534546, 0.015423417091369629, 0.5243213176727295, 1.0332190990447998, 1.5421168804168701, 2.0510149002075195, 2.55991268157959, 3.06881046295166, 3.5777082443237305, 4.086606025695801, 4.595503807067871, 5.104401588439941, 5.613299369812012, 6.12219762802124, 6.6310954093933105, 7.139993190765381, 7.648890972137451, 8.15778923034668, 8.66668701171875, 9.17558479309082, 9.68448257446289, 10.193380355834961, 10.702278137207031, 11.211175918579102]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 12.0, 11.0, 15.0, 18.0, 21.0, 25.0, 32.0, 48.0, 49.0, 68.0, 97.0, 372.0, 12238.0, 743638.0, 287306.0, 4004.0, 214.0, 82.0, 53.0, 54.0, 49.0, 22.0, 20.0, 26.0, 17.0, 15.0, 12.0, 6.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.98681640625, -19.3173828125, -18.64794921875, -17.978515625, -17.30908203125, -16.6396484375, -15.97021484375, -15.30078125, -14.63134765625, -13.9619140625, -13.29248046875, -12.623046875, -11.95361328125, -11.2841796875, -10.61474609375, -9.9453125, -9.27587890625, -8.6064453125, -7.93701171875, -7.267578125, -6.59814453125, -5.9287109375, -5.25927734375, -4.58984375, -3.92041015625, -3.2509765625, -2.58154296875, -1.912109375, -1.24267578125, -0.5732421875, 0.09619140625, 0.765625, 1.43505859375, 2.1044921875, 2.77392578125, 3.443359375, 4.11279296875, 4.7822265625, 5.45166015625, 6.12109375, 6.79052734375, 7.4599609375, 8.12939453125, 8.798828125, 9.46826171875, 10.1376953125, 10.80712890625, 11.4765625, 12.14599609375, 12.8154296875, 13.48486328125, 14.154296875, 14.82373046875, 15.4931640625, 16.16259765625, 16.83203125, 17.50146484375, 18.1708984375, 18.84033203125, 19.509765625, 20.17919921875, 20.8486328125, 21.51806640625, 22.1875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 19.0, 41.0, 84.0, 151.0, 211.0, 214.0, 157.0, 79.0, 43.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8424072265625, -2.780517578125, -2.7186279296875, -2.65673828125, -2.5948486328125, -2.532958984375, -2.4710693359375, -2.4091796875, -2.3472900390625, -2.285400390625, -2.2235107421875, -2.16162109375, -2.0997314453125, -2.037841796875, -1.9759521484375, -1.9140625, -1.8521728515625, -1.790283203125, -1.7283935546875, -1.66650390625, -1.6046142578125, -1.542724609375, -1.4808349609375, -1.4189453125, -1.3570556640625, -1.295166015625, -1.2332763671875, -1.17138671875, -1.1094970703125, -1.047607421875, -0.9857177734375, -0.923828125, -0.8619384765625, -0.800048828125, -0.7381591796875, -0.67626953125, -0.6143798828125, -0.552490234375, -0.4906005859375, -0.4287109375, -0.3668212890625, -0.304931640625, -0.2430419921875, -0.18115234375, -0.1192626953125, -0.057373046875, 0.0045166015625, 0.06640625, 0.1282958984375, 0.190185546875, 0.2520751953125, 0.31396484375, 0.3758544921875, 0.437744140625, 0.4996337890625, 0.5615234375, 0.6234130859375, 0.685302734375, 0.7471923828125, 0.80908203125, 0.8709716796875, 0.932861328125, 0.9947509765625, 1.056640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 18.0, 18.0, 31.0, 30.0, 57.0, 80.0, 150.0, 254.0, 517.0, 1239.0, 3550.0, 14416.0, 81017.0, 468533.0, 395708.0, 65330.0, 12210.0, 3148.0, 1120.0, 444.0, 252.0, 134.0, 86.0, 49.0, 38.0, 30.0, 16.0, 18.0, 8.0, 12.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5079345703125, -8.203369140625, -7.8988037109375, -7.59423828125, -7.2896728515625, -6.985107421875, -6.6805419921875, -6.3759765625, -6.0714111328125, -5.766845703125, -5.4622802734375, -5.15771484375, -4.8531494140625, -4.548583984375, -4.2440185546875, -3.939453125, -3.6348876953125, -3.330322265625, -3.0257568359375, -2.72119140625, -2.4166259765625, -2.112060546875, -1.8074951171875, -1.5029296875, -1.1983642578125, -0.893798828125, -0.5892333984375, -0.28466796875, 0.0198974609375, 0.324462890625, 0.6290283203125, 0.93359375, 1.2381591796875, 1.542724609375, 1.8472900390625, 2.15185546875, 2.4564208984375, 2.760986328125, 3.0655517578125, 3.3701171875, 3.6746826171875, 3.979248046875, 4.2838134765625, 4.58837890625, 4.8929443359375, 5.197509765625, 5.5020751953125, 5.806640625, 6.1112060546875, 6.415771484375, 6.7203369140625, 7.02490234375, 7.3294677734375, 7.634033203125, 7.9385986328125, 8.2431640625, 8.5477294921875, 8.852294921875, 9.1568603515625, 9.46142578125, 9.7659912109375, 10.070556640625, 10.3751220703125, 10.6796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 4.0, 8.0, 6.0, 7.0, 19.0, 13.0, 24.0, 34.0, 25.0, 31.0, 33.0, 40.0, 52.0, 38.0, 47.0, 36.0, 47.0, 50.0, 44.0, 42.0, 48.0, 42.0, 32.0, 32.0, 41.0, 41.0, 33.0, 22.0, 18.0, 27.0, 11.0, 9.0, 8.0, 11.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.23114013671875, -3.1165771484375, -3.00201416015625, -2.887451171875, -2.77288818359375, -2.6583251953125, -2.54376220703125, -2.42919921875, -2.31463623046875, -2.2000732421875, -2.08551025390625, -1.970947265625, -1.85638427734375, -1.7418212890625, -1.62725830078125, -1.5126953125, -1.39813232421875, -1.2835693359375, -1.16900634765625, -1.054443359375, -0.93988037109375, -0.8253173828125, -0.71075439453125, -0.59619140625, -0.48162841796875, -0.3670654296875, -0.25250244140625, -0.137939453125, -0.02337646484375, 0.0911865234375, 0.20574951171875, 0.3203125, 0.43487548828125, 0.5494384765625, 0.66400146484375, 0.778564453125, 0.89312744140625, 1.0076904296875, 1.12225341796875, 1.23681640625, 1.35137939453125, 1.4659423828125, 1.58050537109375, 1.695068359375, 1.80963134765625, 1.9241943359375, 2.03875732421875, 2.1533203125, 2.26788330078125, 2.3824462890625, 2.49700927734375, 2.611572265625, 2.72613525390625, 2.8406982421875, 2.95526123046875, 3.06982421875, 3.18438720703125, 3.2989501953125, 3.41351318359375, 3.528076171875, 3.64263916015625, 3.7572021484375, 3.87176513671875, 3.986328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 16.0, 22.0, 29.0, 44.0, 70.0, 145.0, 292.0, 611.0, 1740.0, 5526.0, 24582.0, 169231.0, 644694.0, 168601.0, 24238.0, 5653.0, 1747.0, 605.0, 299.0, 142.0, 80.0, 38.0, 30.0, 30.0, 18.0, 7.0, 12.0, 8.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5660400390625, -7.280517578125, -6.9949951171875, -6.70947265625, -6.4239501953125, -6.138427734375, -5.8529052734375, -5.5673828125, -5.2818603515625, -4.996337890625, -4.7108154296875, -4.42529296875, -4.1397705078125, -3.854248046875, -3.5687255859375, -3.283203125, -2.9976806640625, -2.712158203125, -2.4266357421875, -2.14111328125, -1.8555908203125, -1.570068359375, -1.2845458984375, -0.9990234375, -0.7135009765625, -0.427978515625, -0.1424560546875, 0.14306640625, 0.4285888671875, 0.714111328125, 0.9996337890625, 1.28515625, 1.5706787109375, 1.856201171875, 2.1417236328125, 2.42724609375, 2.7127685546875, 2.998291015625, 3.2838134765625, 3.5693359375, 3.8548583984375, 4.140380859375, 4.4259033203125, 4.71142578125, 4.9969482421875, 5.282470703125, 5.5679931640625, 5.853515625, 6.1390380859375, 6.424560546875, 6.7100830078125, 6.99560546875, 7.2811279296875, 7.566650390625, 7.8521728515625, 8.1376953125, 8.4232177734375, 8.708740234375, 8.9942626953125, 9.27978515625, 9.5653076171875, 9.850830078125, 10.1363525390625, 10.421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 14.0, 21.0, 23.0, 38.0, 33.0, 51.0, 53.0, 74.0, 60.0, 103.0, 82.0, 73.0, 61.0, 64.0, 46.0, 38.0, 22.0, 30.0, 18.0, 15.0, 6.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00069427490234375, -0.0006744042038917542, -0.0006545335054397583, -0.0006346628069877625, -0.0006147921085357666, -0.0005949214100837708, -0.0005750507116317749, -0.000555180013179779, -0.0005353093147277832, -0.0005154386162757874, -0.0004955679178237915, -0.00047569721937179565, -0.0004558265209197998, -0.00043595582246780396, -0.0004160851240158081, -0.00039621442556381226, -0.0003763437271118164, -0.00035647302865982056, -0.0003366023302078247, -0.00031673163175582886, -0.000296860933303833, -0.00027699023485183716, -0.0002571195363998413, -0.00023724883794784546, -0.0002173781394958496, -0.00019750744104385376, -0.0001776367425918579, -0.00015776604413986206, -0.0001378953456878662, -0.00011802464723587036, -9.815394878387451e-05, -7.828325033187866e-05, -5.841255187988281e-05, -3.854185342788696e-05, -1.8671154975891113e-05, 1.1995434761047363e-06, 2.1070241928100586e-05, 4.0940940380096436e-05, 6.0811638832092285e-05, 8.068233728408813e-05, 0.00010055303573608398, 0.00012042373418807983, 0.00014029443264007568, 0.00016016513109207153, 0.00018003582954406738, 0.00019990652799606323, 0.00021977722644805908, 0.00023964792490005493, 0.0002595186233520508, 0.00027938932180404663, 0.0002992600202560425, 0.00031913071870803833, 0.0003390014171600342, 0.00035887211561203003, 0.0003787428140640259, 0.00039861351251602173, 0.0004184842109680176, 0.00043835490942001343, 0.0004582256078720093, 0.0004780963063240051, 0.000497967004776001, 0.0005178377032279968, 0.0005377084016799927, 0.0005575791001319885, 0.0005774497985839844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 2.0, 3.0, 5.0, 10.0, 12.0, 22.0, 24.0, 40.0, 57.0, 102.0, 139.0, 227.0, 407.0, 791.0, 1854.0, 5468.0, 25368.0, 181190.0, 630168.0, 170067.0, 23919.0, 5239.0, 1809.0, 716.0, 349.0, 204.0, 113.0, 74.0, 50.0, 32.0, 22.0, 21.0, 4.0, 9.0, 10.0, 3.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1953125, -7.926513671875, -7.65771484375, -7.388916015625, -7.1201171875, -6.851318359375, -6.58251953125, -6.313720703125, -6.044921875, -5.776123046875, -5.50732421875, -5.238525390625, -4.9697265625, -4.700927734375, -4.43212890625, -4.163330078125, -3.89453125, -3.625732421875, -3.35693359375, -3.088134765625, -2.8193359375, -2.550537109375, -2.28173828125, -2.012939453125, -1.744140625, -1.475341796875, -1.20654296875, -0.937744140625, -0.6689453125, -0.400146484375, -0.13134765625, 0.137451171875, 0.40625, 0.675048828125, 0.94384765625, 1.212646484375, 1.4814453125, 1.750244140625, 2.01904296875, 2.287841796875, 2.556640625, 2.825439453125, 3.09423828125, 3.363037109375, 3.6318359375, 3.900634765625, 4.16943359375, 4.438232421875, 4.70703125, 4.975830078125, 5.24462890625, 5.513427734375, 5.7822265625, 6.051025390625, 6.31982421875, 6.588623046875, 6.857421875, 7.126220703125, 7.39501953125, 7.663818359375, 7.9326171875, 8.201416015625, 8.47021484375, 8.739013671875, 9.0078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 4.0, 15.0, 21.0, 33.0, 38.0, 75.0, 89.0, 101.0, 117.0, 92.0, 99.0, 68.0, 60.0, 57.0, 38.0, 23.0, 19.0, 15.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.86328125, -5.724822998046875, -5.58636474609375, -5.447906494140625, -5.3094482421875, -5.170989990234375, -5.03253173828125, -4.894073486328125, -4.755615234375, -4.617156982421875, -4.47869873046875, -4.340240478515625, -4.2017822265625, -4.063323974609375, -3.92486572265625, -3.786407470703125, -3.64794921875, -3.509490966796875, -3.37103271484375, -3.232574462890625, -3.0941162109375, -2.955657958984375, -2.81719970703125, -2.678741455078125, -2.540283203125, -2.401824951171875, -2.26336669921875, -2.124908447265625, -1.9864501953125, -1.847991943359375, -1.70953369140625, -1.571075439453125, -1.4326171875, -1.294158935546875, -1.15570068359375, -1.017242431640625, -0.8787841796875, -0.740325927734375, -0.60186767578125, -0.463409423828125, -0.324951171875, -0.186492919921875, -0.04803466796875, 0.090423583984375, 0.2288818359375, 0.367340087890625, 0.50579833984375, 0.644256591796875, 0.78271484375, 0.921173095703125, 1.05963134765625, 1.198089599609375, 1.3365478515625, 1.475006103515625, 1.61346435546875, 1.751922607421875, 1.890380859375, 2.028839111328125, 2.16729736328125, 2.305755615234375, 2.4442138671875, 2.582672119140625, 2.72113037109375, 2.859588623046875, 2.998046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 12.0, 76.0, 507.0, 357.0, 44.0, 9.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.2283935546875, -262.7335510253906, -257.23870849609375, -251.7438507080078, -246.24900817871094, -240.75416564941406, -235.2593231201172, -229.76446533203125, -224.26962280273438, -218.7747802734375, -213.27993774414062, -207.7850799560547, -202.2902374267578, -196.79539489746094, -191.30055236816406, -185.80569458007812, -180.31085205078125, -174.81600952148438, -169.3211669921875, -163.82630920410156, -158.3314666748047, -152.8366241455078, -147.34178161621094, -141.846923828125, -136.3520965576172, -130.8572540283203, -125.3624038696289, -119.86756134033203, -114.37271118164062, -108.87786865234375, -103.38302612304688, -97.88817596435547, -92.39332580566406, -86.89848327636719, -81.40363311767578, -75.9087905883789, -70.4139404296875, -64.91909790039062, -59.424251556396484, -53.929405212402344, -48.4345588684082, -42.93971252441406, -37.44486618041992, -31.950021743774414, -26.455175399780273, -20.960329055786133, -15.465484619140625, -9.970638275146484, -4.475791931152344, 1.0190539360046387, 6.513899803161621, 12.008745193481445, 17.503591537475586, 22.998437881469727, 28.493282318115234, 33.988128662109375, 39.482975006103516, 44.977821350097656, 50.4726676940918, 55.96751403808594, 61.46235656738281, 66.95720672607422, 72.4520492553711, 77.9468994140625, 83.44174194335938]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 10.0, 5.0, 9.0, 18.0, 17.0, 32.0, 28.0, 52.0, 45.0, 58.0, 73.0, 66.0, 67.0, 65.0, 79.0, 73.0, 79.0, 51.0, 43.0, 32.0, 30.0, 23.0, 13.0, 13.0, 11.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.706134796142578, -27.579944610595703, -26.453752517700195, -25.32756233215332, -24.201370239257812, -23.075180053710938, -21.948989868164062, -20.822799682617188, -19.69660758972168, -18.570417404174805, -17.444225311279297, -16.318035125732422, -15.19184398651123, -14.065652847290039, -12.939462661743164, -11.813271522521973, -10.687080383300781, -9.56088924407959, -8.434698104858398, -7.308507919311523, -6.182316780090332, -5.056125640869141, -3.9299349784851074, -2.803744316101074, -1.6775531768798828, -0.5513622760772705, 0.5748286247253418, 1.701019525527954, 2.8272104263305664, 3.953401565551758, 5.079592227935791, 6.205782890319824, 7.331977844238281, 8.458168983459473, 9.584360122680664, 10.710550308227539, 11.83674144744873, 12.962932586669922, 14.089122772216797, 15.215313911437988, 16.34150505065918, 17.467695236206055, 18.593887329101562, 19.720077514648438, 20.846267700195312, 21.97245979309082, 23.098649978637695, 24.224842071533203, 25.351032257080078, 26.477222442626953, 27.60341453552246, 28.729604721069336, 29.855796813964844, 30.98198699951172, 32.108177185058594, 33.23436737060547, 34.360557556152344, 35.48674774169922, 36.612937927246094, 37.739131927490234, 38.86532211303711, 39.991512298583984, 41.11770248413086, 42.243892669677734, 43.370086669921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 9.0, 23.0, 51.0, 129.0, 348.0, 2011.0, 4034860.0, 155469.0, 1151.0, 168.0, 48.0, 10.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-130.0, -127.3408203125, -124.681640625, -122.0224609375, -119.36328125, -116.7041015625, -114.044921875, -111.3857421875, -108.7265625, -106.0673828125, -103.408203125, -100.7490234375, -98.08984375, -95.4306640625, -92.771484375, -90.1123046875, -87.453125, -84.7939453125, -82.134765625, -79.4755859375, -76.81640625, -74.1572265625, -71.498046875, -68.8388671875, -66.1796875, -63.5205078125, -60.861328125, -58.2021484375, -55.54296875, -52.8837890625, -50.224609375, -47.5654296875, -44.90625, -42.2470703125, -39.587890625, -36.9287109375, -34.26953125, -31.6103515625, -28.951171875, -26.2919921875, -23.6328125, -20.9736328125, -18.314453125, -15.6552734375, -12.99609375, -10.3369140625, -7.677734375, -5.0185546875, -2.359375, 0.2998046875, 2.958984375, 5.6181640625, 8.27734375, 10.9365234375, 13.595703125, 16.2548828125, 18.9140625, 21.5732421875, 24.232421875, 26.8916015625, 29.55078125, 32.2099609375, 34.869140625, 37.5283203125, 40.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 11.0, 40.0, 78.0, 145.0, 164.0, 207.0, 176.0, 109.0, 46.0, 24.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.1002197265625, -3.028564453125, -2.9569091796875, -2.88525390625, -2.8135986328125, -2.741943359375, -2.6702880859375, -2.5986328125, -2.5269775390625, -2.455322265625, -2.3836669921875, -2.31201171875, -2.2403564453125, -2.168701171875, -2.0970458984375, -2.025390625, -1.9537353515625, -1.882080078125, -1.8104248046875, -1.73876953125, -1.6671142578125, -1.595458984375, -1.5238037109375, -1.4521484375, -1.3804931640625, -1.308837890625, -1.2371826171875, -1.16552734375, -1.0938720703125, -1.022216796875, -0.9505615234375, -0.87890625, -0.8072509765625, -0.735595703125, -0.6639404296875, -0.59228515625, -0.5206298828125, -0.448974609375, -0.3773193359375, -0.3056640625, -0.2340087890625, -0.162353515625, -0.0906982421875, -0.01904296875, 0.0526123046875, 0.124267578125, 0.1959228515625, 0.267578125, 0.3392333984375, 0.410888671875, 0.4825439453125, 0.55419921875, 0.6258544921875, 0.697509765625, 0.7691650390625, 0.8408203125, 0.9124755859375, 0.984130859375, 1.0557861328125, 1.12744140625, 1.1990966796875, 1.270751953125, 1.3424072265625, 1.4140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 20.0, 34.0, 66.0, 99.0, 176.0, 357.0, 4581.0, 4187377.0, 987.0, 270.0, 140.0, 90.0, 46.0, 24.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.625, -212.14453125, -207.6640625, -203.18359375, -198.703125, -194.22265625, -189.7421875, -185.26171875, -180.78125, -176.30078125, -171.8203125, -167.33984375, -162.859375, -158.37890625, -153.8984375, -149.41796875, -144.9375, -140.45703125, -135.9765625, -131.49609375, -127.015625, -122.53515625, -118.0546875, -113.57421875, -109.09375, -104.61328125, -100.1328125, -95.65234375, -91.171875, -86.69140625, -82.2109375, -77.73046875, -73.25, -68.76953125, -64.2890625, -59.80859375, -55.328125, -50.84765625, -46.3671875, -41.88671875, -37.40625, -32.92578125, -28.4453125, -23.96484375, -19.484375, -15.00390625, -10.5234375, -6.04296875, -1.5625, 2.91796875, 7.3984375, 11.87890625, 16.359375, 20.83984375, 25.3203125, 29.80078125, 34.28125, 38.76171875, 43.2421875, 47.72265625, 52.203125, 56.68359375, 61.1640625, 65.64453125, 70.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 12.0, 44.0, 158.0, 913.0, 2595.0, 249.0, 65.0, 26.0, 11.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7265625, -13.47320556640625, -13.2198486328125, -12.96649169921875, -12.713134765625, -12.45977783203125, -12.2064208984375, -11.95306396484375, -11.69970703125, -11.44635009765625, -11.1929931640625, -10.93963623046875, -10.686279296875, -10.43292236328125, -10.1795654296875, -9.92620849609375, -9.6728515625, -9.41949462890625, -9.1661376953125, -8.91278076171875, -8.659423828125, -8.40606689453125, -8.1527099609375, -7.89935302734375, -7.64599609375, -7.39263916015625, -7.1392822265625, -6.88592529296875, -6.632568359375, -6.37921142578125, -6.1258544921875, -5.87249755859375, -5.619140625, -5.36578369140625, -5.1124267578125, -4.85906982421875, -4.605712890625, -4.35235595703125, -4.0989990234375, -3.84564208984375, -3.59228515625, -3.33892822265625, -3.0855712890625, -2.83221435546875, -2.578857421875, -2.32550048828125, -2.0721435546875, -1.81878662109375, -1.5654296875, -1.31207275390625, -1.0587158203125, -0.80535888671875, -0.552001953125, -0.29864501953125, -0.0452880859375, 0.20806884765625, 0.46142578125, 0.71478271484375, 0.9681396484375, 1.22149658203125, 1.474853515625, 1.72821044921875, 1.9815673828125, 2.23492431640625, 2.48828125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 59.0, 837.0, 97.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.95411682128906, -245.8665771484375, -238.77903747558594, -231.69149780273438, -224.6039581298828, -217.51641845703125, -210.42889404296875, -203.34133911132812, -196.25381469726562, -189.16627502441406, -182.0787353515625, -174.99119567871094, -167.90365600585938, -160.8161163330078, -153.72857666015625, -146.64105224609375, -139.55349731445312, -132.46595764160156, -125.37841796875, -118.29087829589844, -111.20333862304688, -104.11579895019531, -97.02826690673828, -89.94072723388672, -82.85318756103516, -75.7656478881836, -68.67810821533203, -61.590572357177734, -54.50303268432617, -47.41549301147461, -40.32795715332031, -33.24041748046875, -26.152877807617188, -19.065338134765625, -11.977800369262695, -4.890262603759766, 2.197277069091797, 9.28481674194336, 16.372352600097656, 23.45989227294922, 30.54743194580078, 37.634971618652344, 44.722511291503906, 51.8100471496582, 58.897586822509766, 65.98512268066406, 73.07266235351562, 80.16020202636719, 87.24774169921875, 94.33528137207031, 101.42282104492188, 108.51036071777344, 115.597900390625, 122.68544006347656, 129.77297973632812, 136.86050415039062, 143.94805908203125, 151.0355987548828, 158.12313842773438, 165.21067810058594, 172.2982177734375, 179.38575744628906, 186.47329711914062, 193.56082153320312, 200.6483612060547]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 11.0, 24.0, 37.0, 50.0, 90.0, 95.0, 137.0, 131.0, 130.0, 107.0, 83.0, 39.0, 31.0, 16.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.93144989013672, -29.90447235107422, -28.87749481201172, -27.85051727294922, -26.82353973388672, -25.79656219482422, -24.769582748413086, -23.742605209350586, -22.715627670288086, -21.688650131225586, -20.661672592163086, -19.634695053100586, -18.607715606689453, -17.580738067626953, -16.553760528564453, -15.526782989501953, -14.499805450439453, -13.472827911376953, -12.445850372314453, -11.418871879577637, -10.391894340515137, -9.364916801452637, -8.33793830871582, -7.31096076965332, -6.28398323059082, -5.25700569152832, -4.230027675628662, -3.203049898147583, -2.176072120666504, -1.149094581604004, -0.1221165657043457, 0.9048614501953125, 1.9318389892578125, 2.9588167667388916, 3.9857945442199707, 5.012772560119629, 6.039750099182129, 7.066727638244629, 8.093706130981445, 9.120683670043945, 10.147661209106445, 11.174638748168945, 12.201616287231445, 13.228594779968262, 14.255572319030762, 15.282549858093262, 16.309528350830078, 17.336505889892578, 18.363483428955078, 19.390460968017578, 20.417438507080078, 21.444416046142578, 22.471393585205078, 23.498371124267578, 24.52535057067871, 25.55232810974121, 26.57930564880371, 27.60628318786621, 28.63326072692871, 29.66023826599121, 30.687217712402344, 31.714195251464844, 32.741172790527344, 33.768150329589844, 34.795127868652344]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 10.0, 17.0, 15.0, 31.0, 22.0, 47.0, 93.0, 129.0, 283.0, 662.0, 2057.0, 12946.0, 326219.0, 675372.0, 25870.0, 3037.0, 884.0, 354.0, 185.0, 97.0, 55.0, 38.0, 32.0, 24.0, 13.0, 18.0, 13.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.9375, -30.081298828125, -29.22509765625, -28.368896484375, -27.5126953125, -26.656494140625, -25.80029296875, -24.944091796875, -24.087890625, -23.231689453125, -22.37548828125, -21.519287109375, -20.6630859375, -19.806884765625, -18.95068359375, -18.094482421875, -17.23828125, -16.382080078125, -15.52587890625, -14.669677734375, -13.8134765625, -12.957275390625, -12.10107421875, -11.244873046875, -10.388671875, -9.532470703125, -8.67626953125, -7.820068359375, -6.9638671875, -6.107666015625, -5.25146484375, -4.395263671875, -3.5390625, -2.682861328125, -1.82666015625, -0.970458984375, -0.1142578125, 0.741943359375, 1.59814453125, 2.454345703125, 3.310546875, 4.166748046875, 5.02294921875, 5.879150390625, 6.7353515625, 7.591552734375, 8.44775390625, 9.303955078125, 10.16015625, 11.016357421875, 11.87255859375, 12.728759765625, 13.5849609375, 14.441162109375, 15.29736328125, 16.153564453125, 17.009765625, 17.865966796875, 18.72216796875, 19.578369140625, 20.4345703125, 21.290771484375, 22.14697265625, 23.003173828125, 23.859375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 34.0, 73.0, 101.0, 144.0, 159.0, 175.0, 145.0, 85.0, 40.0, 18.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.478851318359375, -3.39129638671875, -3.303741455078125, -3.2161865234375, -3.128631591796875, -3.04107666015625, -2.953521728515625, -2.865966796875, -2.778411865234375, -2.69085693359375, -2.603302001953125, -2.5157470703125, -2.428192138671875, -2.34063720703125, -2.253082275390625, -2.16552734375, -2.077972412109375, -1.99041748046875, -1.902862548828125, -1.8153076171875, -1.727752685546875, -1.64019775390625, -1.552642822265625, -1.465087890625, -1.377532958984375, -1.28997802734375, -1.202423095703125, -1.1148681640625, -1.027313232421875, -0.93975830078125, -0.852203369140625, -0.7646484375, -0.677093505859375, -0.58953857421875, -0.501983642578125, -0.4144287109375, -0.326873779296875, -0.23931884765625, -0.151763916015625, -0.064208984375, 0.023345947265625, 0.11090087890625, 0.198455810546875, 0.2860107421875, 0.373565673828125, 0.46112060546875, 0.548675537109375, 0.63623046875, 0.723785400390625, 0.81134033203125, 0.898895263671875, 0.9864501953125, 1.074005126953125, 1.16156005859375, 1.249114990234375, 1.336669921875, 1.424224853515625, 1.51177978515625, 1.599334716796875, 1.6868896484375, 1.774444580078125, 1.86199951171875, 1.949554443359375, 2.037109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 9.0, 11.0, 20.0, 24.0, 26.0, 36.0, 52.0, 68.0, 83.0, 159.0, 303.0, 722.0, 2333.0, 12671.0, 167358.0, 763582.0, 89718.0, 8307.0, 1796.0, 563.0, 244.0, 136.0, 96.0, 59.0, 41.0, 24.0, 28.0, 15.0, 15.0, 16.0, 2.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.7818603515625, -18.251220703125, -17.7205810546875, -17.18994140625, -16.6593017578125, -16.128662109375, -15.5980224609375, -15.0673828125, -14.5367431640625, -14.006103515625, -13.4754638671875, -12.94482421875, -12.4141845703125, -11.883544921875, -11.3529052734375, -10.822265625, -10.2916259765625, -9.760986328125, -9.2303466796875, -8.69970703125, -8.1690673828125, -7.638427734375, -7.1077880859375, -6.5771484375, -6.0465087890625, -5.515869140625, -4.9852294921875, -4.45458984375, -3.9239501953125, -3.393310546875, -2.8626708984375, -2.33203125, -1.8013916015625, -1.270751953125, -0.7401123046875, -0.20947265625, 0.3211669921875, 0.851806640625, 1.3824462890625, 1.9130859375, 2.4437255859375, 2.974365234375, 3.5050048828125, 4.03564453125, 4.5662841796875, 5.096923828125, 5.6275634765625, 6.158203125, 6.6888427734375, 7.219482421875, 7.7501220703125, 8.28076171875, 8.8114013671875, 9.342041015625, 9.8726806640625, 10.4033203125, 10.9339599609375, 11.464599609375, 11.9952392578125, 12.52587890625, 13.0565185546875, 13.587158203125, 14.1177978515625, 14.6484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 3.0, 12.0, 10.0, 12.0, 16.0, 19.0, 43.0, 23.0, 37.0, 44.0, 44.0, 48.0, 50.0, 39.0, 67.0, 64.0, 55.0, 58.0, 42.0, 45.0, 53.0, 36.0, 23.0, 23.0, 29.0, 19.0, 20.0, 13.0, 10.0, 6.0, 11.0, 3.0, 3.0, 8.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.4140625, -6.237548828125, -6.06103515625, -5.884521484375, -5.7080078125, -5.531494140625, -5.35498046875, -5.178466796875, -5.001953125, -4.825439453125, -4.64892578125, -4.472412109375, -4.2958984375, -4.119384765625, -3.94287109375, -3.766357421875, -3.58984375, -3.413330078125, -3.23681640625, -3.060302734375, -2.8837890625, -2.707275390625, -2.53076171875, -2.354248046875, -2.177734375, -2.001220703125, -1.82470703125, -1.648193359375, -1.4716796875, -1.295166015625, -1.11865234375, -0.942138671875, -0.765625, -0.589111328125, -0.41259765625, -0.236083984375, -0.0595703125, 0.116943359375, 0.29345703125, 0.469970703125, 0.646484375, 0.822998046875, 0.99951171875, 1.176025390625, 1.3525390625, 1.529052734375, 1.70556640625, 1.882080078125, 2.05859375, 2.235107421875, 2.41162109375, 2.588134765625, 2.7646484375, 2.941162109375, 3.11767578125, 3.294189453125, 3.470703125, 3.647216796875, 3.82373046875, 4.000244140625, 4.1767578125, 4.353271484375, 4.52978515625, 4.706298828125, 4.8828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 15.0, 19.0, 24.0, 38.0, 64.0, 116.0, 203.0, 409.0, 863.0, 2160.0, 7030.0, 37347.0, 388940.0, 542942.0, 54581.0, 9076.0, 2645.0, 1017.0, 455.0, 254.0, 111.0, 78.0, 48.0, 36.0, 13.0, 5.0, 11.0, 4.0, 12.0, 5.0, 1.0, 2.0, 2.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.9638671875, -7.646484375, -7.3291015625, -7.01171875, -6.6943359375, -6.376953125, -6.0595703125, -5.7421875, -5.4248046875, -5.107421875, -4.7900390625, -4.47265625, -4.1552734375, -3.837890625, -3.5205078125, -3.203125, -2.8857421875, -2.568359375, -2.2509765625, -1.93359375, -1.6162109375, -1.298828125, -0.9814453125, -0.6640625, -0.3466796875, -0.029296875, 0.2880859375, 0.60546875, 0.9228515625, 1.240234375, 1.5576171875, 1.875, 2.1923828125, 2.509765625, 2.8271484375, 3.14453125, 3.4619140625, 3.779296875, 4.0966796875, 4.4140625, 4.7314453125, 5.048828125, 5.3662109375, 5.68359375, 6.0009765625, 6.318359375, 6.6357421875, 6.953125, 7.2705078125, 7.587890625, 7.9052734375, 8.22265625, 8.5400390625, 8.857421875, 9.1748046875, 9.4921875, 9.8095703125, 10.126953125, 10.4443359375, 10.76171875, 11.0791015625, 11.396484375, 11.7138671875, 12.03125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 7.0, 6.0, 11.0, 13.0, 30.0, 29.0, 53.0, 60.0, 81.0, 96.0, 95.0, 93.0, 97.0, 74.0, 60.0, 43.0, 32.0, 44.0, 20.0, 16.0, 5.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009002685546875, -0.0008752793073654175, -0.000850290060043335, -0.0008253008127212524, -0.0008003115653991699, -0.0007753223180770874, -0.0007503330707550049, -0.0007253438234329224, -0.0007003545761108398, -0.0006753653287887573, -0.0006503760814666748, -0.0006253868341445923, -0.0006003975868225098, -0.0005754083395004272, -0.0005504190921783447, -0.0005254298448562622, -0.0005004405975341797, -0.00047545135021209717, -0.00045046210289001465, -0.00042547285556793213, -0.0004004836082458496, -0.0003754943609237671, -0.00035050511360168457, -0.00032551586627960205, -0.00030052661895751953, -0.000275537371635437, -0.0002505481243133545, -0.00022555887699127197, -0.00020056962966918945, -0.00017558038234710693, -0.00015059113502502441, -0.0001256018877029419, -0.00010061264038085938, -7.562339305877686e-05, -5.0634145736694336e-05, -2.5644898414611816e-05, -6.556510925292969e-07, 2.4333596229553223e-05, 4.932284355163574e-05, 7.431209087371826e-05, 9.930133819580078e-05, 0.0001242905855178833, 0.00014927983283996582, 0.00017426908016204834, 0.00019925832748413086, 0.00022424757480621338, 0.0002492368221282959, 0.0002742260694503784, 0.00029921531677246094, 0.00032420456409454346, 0.000349193811416626, 0.0003741830587387085, 0.000399172306060791, 0.00042416155338287354, 0.00044915080070495605, 0.0004741400480270386, 0.0004991292953491211, 0.0005241185426712036, 0.0005491077899932861, 0.0005740970373153687, 0.0005990862846374512, 0.0006240755319595337, 0.0006490647792816162, 0.0006740540266036987, 0.0006990432739257812]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 16.0, 24.0, 22.0, 30.0, 46.0, 62.0, 99.0, 191.0, 351.0, 798.0, 1860.0, 6770.0, 41559.0, 383626.0, 532001.0, 66832.0, 9798.0, 2466.0, 985.0, 409.0, 200.0, 122.0, 61.0, 56.0, 41.0, 16.0, 18.0, 14.0, 5.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.3125, -9.0224609375, -8.732421875, -8.4423828125, -8.15234375, -7.8623046875, -7.572265625, -7.2822265625, -6.9921875, -6.7021484375, -6.412109375, -6.1220703125, -5.83203125, -5.5419921875, -5.251953125, -4.9619140625, -4.671875, -4.3818359375, -4.091796875, -3.8017578125, -3.51171875, -3.2216796875, -2.931640625, -2.6416015625, -2.3515625, -2.0615234375, -1.771484375, -1.4814453125, -1.19140625, -0.9013671875, -0.611328125, -0.3212890625, -0.03125, 0.2587890625, 0.548828125, 0.8388671875, 1.12890625, 1.4189453125, 1.708984375, 1.9990234375, 2.2890625, 2.5791015625, 2.869140625, 3.1591796875, 3.44921875, 3.7392578125, 4.029296875, 4.3193359375, 4.609375, 4.8994140625, 5.189453125, 5.4794921875, 5.76953125, 6.0595703125, 6.349609375, 6.6396484375, 6.9296875, 7.2197265625, 7.509765625, 7.7998046875, 8.08984375, 8.3798828125, 8.669921875, 8.9599609375, 9.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 5.0, 10.0, 5.0, 8.0, 12.0, 19.0, 14.0, 25.0, 30.0, 26.0, 52.0, 48.0, 47.0, 60.0, 82.0, 79.0, 57.0, 72.0, 51.0, 57.0, 57.0, 37.0, 35.0, 21.0, 17.0, 14.0, 15.0, 9.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.661895751953125, -3.54254150390625, -3.423187255859375, -3.3038330078125, -3.184478759765625, -3.06512451171875, -2.945770263671875, -2.826416015625, -2.707061767578125, -2.58770751953125, -2.468353271484375, -2.3489990234375, -2.229644775390625, -2.11029052734375, -1.990936279296875, -1.87158203125, -1.752227783203125, -1.63287353515625, -1.513519287109375, -1.3941650390625, -1.274810791015625, -1.15545654296875, -1.036102294921875, -0.916748046875, -0.797393798828125, -0.67803955078125, -0.558685302734375, -0.4393310546875, -0.319976806640625, -0.20062255859375, -0.081268310546875, 0.0380859375, 0.157440185546875, 0.27679443359375, 0.396148681640625, 0.5155029296875, 0.634857177734375, 0.75421142578125, 0.873565673828125, 0.992919921875, 1.112274169921875, 1.23162841796875, 1.350982666015625, 1.4703369140625, 1.589691162109375, 1.70904541015625, 1.828399658203125, 1.94775390625, 2.067108154296875, 2.18646240234375, 2.305816650390625, 2.4251708984375, 2.544525146484375, 2.66387939453125, 2.783233642578125, 2.902587890625, 3.021942138671875, 3.14129638671875, 3.260650634765625, 3.3800048828125, 3.499359130859375, 3.61871337890625, 3.738067626953125, 3.857421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 15.0, 68.0, 353.0, 412.0, 103.0, 42.0, 11.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.497636795043945, -26.170827865600586, -20.84402084350586, -15.5172119140625, -10.19040298461914, -4.863594055175781, 0.4632129669189453, 5.790021896362305, 11.116830825805664, 16.443639755249023, 21.77044677734375, 27.09725570678711, 32.42406463623047, 37.75087356567383, 43.07768249511719, 48.40448760986328, 53.731300354003906, 59.058109283447266, 64.38491821289062, 69.71172332763672, 75.03853607177734, 80.36534118652344, 85.69215393066406, 91.01895904541016, 96.34576416015625, 101.67256927490234, 106.99938201904297, 112.32618713378906, 117.65299987792969, 122.97980499267578, 128.30661010742188, 133.6334228515625, 138.96022033691406, 144.2870330810547, 149.61383056640625, 154.94064331054688, 160.2674560546875, 165.59426879882812, 170.9210662841797, 176.2478790283203, 181.57469177246094, 186.90150451660156, 192.22830200195312, 197.55511474609375, 202.88192749023438, 208.208740234375, 213.53553771972656, 218.8623504638672, 224.18914794921875, 229.51596069335938, 234.84275817871094, 240.16957092285156, 245.4963836669922, 250.8231964111328, 256.1499938964844, 261.476806640625, 266.8036193847656, 272.13043212890625, 277.4572448730469, 282.7840576171875, 288.11083984375, 293.4376525878906, 298.76446533203125, 304.0912780761719, 309.4180908203125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 14.0, 8.0, 14.0, 8.0, 21.0, 25.0, 26.0, 31.0, 40.0, 41.0, 53.0, 58.0, 56.0, 44.0, 70.0, 62.0, 52.0, 48.0, 49.0, 58.0, 33.0, 30.0, 25.0, 19.0, 26.0, 20.0, 12.0, 10.0, 6.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.592987060546875, -38.282344818115234, -36.97170639038086, -35.66106414794922, -34.350425720214844, -33.0397834777832, -31.729143142700195, -30.418502807617188, -29.10786247253418, -27.797222137451172, -26.486581802368164, -25.175941467285156, -23.865299224853516, -22.55466079711914, -21.2440185546875, -19.933378219604492, -18.622737884521484, -17.312097549438477, -16.00145721435547, -14.690815925598145, -13.380175590515137, -12.069535255432129, -10.758893966674805, -9.448253631591797, -8.137613296508789, -6.826972961425781, -5.516332149505615, -4.205691337585449, -2.8950510025024414, -1.5844106674194336, -0.2737698554992676, 1.0368709564208984, 2.3475112915039062, 3.658151865005493, 4.96879243850708, 6.279433250427246, 7.590073585510254, 8.900713920593262, 10.211355209350586, 11.521995544433594, 12.832635879516602, 14.14327621459961, 15.453916549682617, 16.764556884765625, 18.075199127197266, 19.38583755493164, 20.69647979736328, 22.00712013244629, 23.317760467529297, 24.628400802612305, 25.939041137695312, 27.24968147277832, 28.560321807861328, 29.87096405029297, 31.181604385375977, 32.492244720458984, 33.802886962890625, 35.113529205322266, 36.42416763305664, 37.73480987548828, 39.045448303222656, 40.3560905456543, 41.66672897338867, 42.97737121582031, 44.28800964355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 15.0, 17.0, 30.0, 47.0, 96.0, 146.0, 394.0, 1762.0, 50196.0, 4123663.0, 16616.0, 963.0, 205.0, 77.0, 16.0, 22.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -74.361328125, -72.72265625, -71.083984375, -69.4453125, -67.806640625, -66.16796875, -64.529296875, -62.890625, -61.251953125, -59.61328125, -57.974609375, -56.3359375, -54.697265625, -53.05859375, -51.419921875, -49.78125, -48.142578125, -46.50390625, -44.865234375, -43.2265625, -41.587890625, -39.94921875, -38.310546875, -36.671875, -35.033203125, -33.39453125, -31.755859375, -30.1171875, -28.478515625, -26.83984375, -25.201171875, -23.5625, -21.923828125, -20.28515625, -18.646484375, -17.0078125, -15.369140625, -13.73046875, -12.091796875, -10.453125, -8.814453125, -7.17578125, -5.537109375, -3.8984375, -2.259765625, -0.62109375, 1.017578125, 2.65625, 4.294921875, 5.93359375, 7.572265625, 9.2109375, 10.849609375, 12.48828125, 14.126953125, 15.765625, 17.404296875, 19.04296875, 20.681640625, 22.3203125, 23.958984375, 25.59765625, 27.236328125, 28.875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 17.0, 32.0, 58.0, 100.0, 122.0, 161.0, 171.0, 127.0, 92.0, 60.0, 26.0, 19.0, 5.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.816925048828125, -3.72369384765625, -3.630462646484375, -3.5372314453125, -3.444000244140625, -3.35076904296875, -3.257537841796875, -3.164306640625, -3.071075439453125, -2.97784423828125, -2.884613037109375, -2.7913818359375, -2.698150634765625, -2.60491943359375, -2.511688232421875, -2.41845703125, -2.325225830078125, -2.23199462890625, -2.138763427734375, -2.0455322265625, -1.952301025390625, -1.85906982421875, -1.765838623046875, -1.672607421875, -1.579376220703125, -1.48614501953125, -1.392913818359375, -1.2996826171875, -1.206451416015625, -1.11322021484375, -1.019989013671875, -0.9267578125, -0.833526611328125, -0.74029541015625, -0.647064208984375, -0.5538330078125, -0.460601806640625, -0.36737060546875, -0.274139404296875, -0.180908203125, -0.087677001953125, 0.00555419921875, 0.098785400390625, 0.1920166015625, 0.285247802734375, 0.37847900390625, 0.471710205078125, 0.56494140625, 0.658172607421875, 0.75140380859375, 0.844635009765625, 0.9378662109375, 1.031097412109375, 1.12432861328125, 1.217559814453125, 1.310791015625, 1.404022216796875, 1.49725341796875, 1.590484619140625, 1.6837158203125, 1.776947021484375, 1.87017822265625, 1.963409423828125, 2.056640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 9.0, 23.0, 38.0, 59.0, 117.0, 248.0, 574.0, 2827.0, 4023252.0, 164987.0, 1427.0, 396.0, 171.0, 66.0, 40.0, 17.0, 12.0, 10.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-125.5, -122.9326171875, -120.365234375, -117.7978515625, -115.23046875, -112.6630859375, -110.095703125, -107.5283203125, -104.9609375, -102.3935546875, -99.826171875, -97.2587890625, -94.69140625, -92.1240234375, -89.556640625, -86.9892578125, -84.421875, -81.8544921875, -79.287109375, -76.7197265625, -74.15234375, -71.5849609375, -69.017578125, -66.4501953125, -63.8828125, -61.3154296875, -58.748046875, -56.1806640625, -53.61328125, -51.0458984375, -48.478515625, -45.9111328125, -43.34375, -40.7763671875, -38.208984375, -35.6416015625, -33.07421875, -30.5068359375, -27.939453125, -25.3720703125, -22.8046875, -20.2373046875, -17.669921875, -15.1025390625, -12.53515625, -9.9677734375, -7.400390625, -4.8330078125, -2.265625, 0.3017578125, 2.869140625, 5.4365234375, 8.00390625, 10.5712890625, 13.138671875, 15.7060546875, 18.2734375, 20.8408203125, 23.408203125, 25.9755859375, 28.54296875, 31.1103515625, 33.677734375, 36.2451171875, 38.8125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 15.0, 26.0, 47.0, 138.0, 544.0, 2554.0, 517.0, 122.0, 58.0, 26.0, 13.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.61602783203125, -9.3726806640625, -9.12933349609375, -8.885986328125, -8.64263916015625, -8.3992919921875, -8.15594482421875, -7.91259765625, -7.66925048828125, -7.4259033203125, -7.18255615234375, -6.939208984375, -6.69586181640625, -6.4525146484375, -6.20916748046875, -5.9658203125, -5.72247314453125, -5.4791259765625, -5.23577880859375, -4.992431640625, -4.74908447265625, -4.5057373046875, -4.26239013671875, -4.01904296875, -3.77569580078125, -3.5323486328125, -3.28900146484375, -3.045654296875, -2.80230712890625, -2.5589599609375, -2.31561279296875, -2.072265625, -1.82891845703125, -1.5855712890625, -1.34222412109375, -1.098876953125, -0.85552978515625, -0.6121826171875, -0.36883544921875, -0.12548828125, 0.11785888671875, 0.3612060546875, 0.60455322265625, 0.847900390625, 1.09124755859375, 1.3345947265625, 1.57794189453125, 1.8212890625, 2.06463623046875, 2.3079833984375, 2.55133056640625, 2.794677734375, 3.03802490234375, 3.2813720703125, 3.52471923828125, 3.76806640625, 4.01141357421875, 4.2547607421875, 4.49810791015625, 4.741455078125, 4.98480224609375, 5.2281494140625, 5.47149658203125, 5.71484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 27.0, 446.0, 502.0, 22.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.4884490966797, -135.60340881347656, -129.7183837890625, -123.83334350585938, -117.94830322265625, -112.06326293945312, -106.17823028564453, -100.29319763183594, -94.40815734863281, -88.52311706542969, -82.6380844116211, -76.7530517578125, -70.86801147460938, -64.98297119140625, -59.097938537597656, -53.2129020690918, -47.32786560058594, -41.44282913208008, -35.55779266357422, -29.67275619506836, -23.7877197265625, -17.90268325805664, -12.017646789550781, -6.132610321044922, -0.2475738525390625, 5.637462615966797, 11.522499084472656, 17.407535552978516, 23.292572021484375, 29.177608489990234, 35.062644958496094, 40.94768142700195, 46.83270263671875, 52.71773910522461, 58.60277557373047, 64.48780822753906, 70.37284851074219, 76.25788879394531, 82.1429214477539, 88.0279541015625, 93.91299438476562, 99.79803466796875, 105.68306732177734, 111.56809997558594, 117.45314025878906, 123.33818054199219, 129.22320556640625, 135.10824584960938, 140.9932861328125, 146.87832641601562, 152.76336669921875, 158.6483917236328, 164.53343200683594, 170.41847229003906, 176.30349731445312, 182.18853759765625, 188.07357788085938, 193.9586181640625, 199.84365844726562, 205.7286834716797, 211.6137237548828, 217.49876403808594, 223.3837890625, 229.26882934570312, 235.15386962890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 19.0, 35.0, 43.0, 49.0, 57.0, 61.0, 71.0, 82.0, 87.0, 100.0, 79.0, 72.0, 49.0, 39.0, 45.0, 35.0, 20.0, 14.0, 5.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.530033111572266, -28.667436599731445, -27.804840087890625, -26.942245483398438, -26.079648971557617, -25.217052459716797, -24.354455947875977, -23.491859436035156, -22.62926483154297, -21.76666831970215, -20.904071807861328, -20.04147720336914, -19.17888069152832, -18.3162841796875, -17.45368766784668, -16.59109115600586, -15.728494644165039, -14.865898132324219, -14.003302574157715, -13.140706062316895, -12.27811050415039, -11.41551399230957, -10.55291748046875, -9.69032096862793, -8.827725410461426, -7.965129375457764, -7.102533340454102, -6.239936828613281, -5.377340793609619, -4.514744758605957, -3.6521482467651367, -2.7895522117614746, -1.9269580841064453, -1.0643619298934937, -0.201765775680542, 0.6608304977416992, 1.5234265327453613, 2.3860225677490234, 3.2486190795898438, 4.111215114593506, 4.973811149597168, 5.83640718460083, 6.699003219604492, 7.5615997314453125, 8.424196243286133, 9.286791801452637, 10.149388313293457, 11.011983871459961, 11.874580383300781, 12.737176895141602, 13.599772453308105, 14.462368965148926, 15.32496452331543, 16.18756103515625, 17.05015754699707, 17.91275405883789, 18.775348663330078, 19.6379451751709, 20.50054168701172, 21.363136291503906, 22.225732803344727, 23.088329315185547, 23.950925827026367, 24.813522338867188, 25.676118850708008]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 9.0, 4.0, 10.0, 15.0, 14.0, 16.0, 26.0, 36.0, 54.0, 70.0, 110.0, 124.0, 214.0, 339.0, 578.0, 1176.0, 2947.0, 10095.0, 52548.0, 371704.0, 509122.0, 78751.0, 13668.0, 3685.0, 1381.0, 677.0, 355.0, 230.0, 157.0, 118.0, 74.0, 62.0, 41.0, 27.0, 35.0, 16.0, 13.0, 11.0, 14.0, 10.0, 5.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4847412109375, -12.024169921875, -11.5635986328125, -11.10302734375, -10.6424560546875, -10.181884765625, -9.7213134765625, -9.2607421875, -8.8001708984375, -8.339599609375, -7.8790283203125, -7.41845703125, -6.9578857421875, -6.497314453125, -6.0367431640625, -5.576171875, -5.1156005859375, -4.655029296875, -4.1944580078125, -3.73388671875, -3.2733154296875, -2.812744140625, -2.3521728515625, -1.8916015625, -1.4310302734375, -0.970458984375, -0.5098876953125, -0.04931640625, 0.4112548828125, 0.871826171875, 1.3323974609375, 1.79296875, 2.2535400390625, 2.714111328125, 3.1746826171875, 3.63525390625, 4.0958251953125, 4.556396484375, 5.0169677734375, 5.4775390625, 5.9381103515625, 6.398681640625, 6.8592529296875, 7.31982421875, 7.7803955078125, 8.240966796875, 8.7015380859375, 9.162109375, 9.6226806640625, 10.083251953125, 10.5438232421875, 11.00439453125, 11.4649658203125, 11.925537109375, 12.3861083984375, 12.8466796875, 13.3072509765625, 13.767822265625, 14.2283935546875, 14.68896484375, 15.1495361328125, 15.610107421875, 16.0706787109375, 16.53125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 9.0, 23.0, 29.0, 51.0, 55.0, 100.0, 114.0, 101.0, 115.0, 99.0, 93.0, 53.0, 54.0, 39.0, 28.0, 12.0, 10.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.36883544921875, -3.2825927734375, -3.19635009765625, -3.110107421875, -3.02386474609375, -2.9376220703125, -2.85137939453125, -2.76513671875, -2.67889404296875, -2.5926513671875, -2.50640869140625, -2.420166015625, -2.33392333984375, -2.2476806640625, -2.16143798828125, -2.0751953125, -1.98895263671875, -1.9027099609375, -1.81646728515625, -1.730224609375, -1.64398193359375, -1.5577392578125, -1.47149658203125, -1.38525390625, -1.29901123046875, -1.2127685546875, -1.12652587890625, -1.040283203125, -0.95404052734375, -0.8677978515625, -0.78155517578125, -0.6953125, -0.60906982421875, -0.5228271484375, -0.43658447265625, -0.350341796875, -0.26409912109375, -0.1778564453125, -0.09161376953125, -0.00537109375, 0.08087158203125, 0.1671142578125, 0.25335693359375, 0.339599609375, 0.42584228515625, 0.5120849609375, 0.59832763671875, 0.6845703125, 0.77081298828125, 0.8570556640625, 0.94329833984375, 1.029541015625, 1.11578369140625, 1.2020263671875, 1.28826904296875, 1.37451171875, 1.46075439453125, 1.5469970703125, 1.63323974609375, 1.719482421875, 1.80572509765625, 1.8919677734375, 1.97821044921875, 2.064453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 15.0, 11.0, 31.0, 36.0, 49.0, 104.0, 213.0, 403.0, 1055.0, 4259.0, 47452.0, 849423.0, 135160.0, 7789.0, 1515.0, 526.0, 221.0, 109.0, 61.0, 42.0, 20.0, 14.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.493408203125, -16.78369140625, -16.073974609375, -15.3642578125, -14.654541015625, -13.94482421875, -13.235107421875, -12.525390625, -11.815673828125, -11.10595703125, -10.396240234375, -9.6865234375, -8.976806640625, -8.26708984375, -7.557373046875, -6.84765625, -6.137939453125, -5.42822265625, -4.718505859375, -4.0087890625, -3.299072265625, -2.58935546875, -1.879638671875, -1.169921875, -0.460205078125, 0.24951171875, 0.959228515625, 1.6689453125, 2.378662109375, 3.08837890625, 3.798095703125, 4.5078125, 5.217529296875, 5.92724609375, 6.636962890625, 7.3466796875, 8.056396484375, 8.76611328125, 9.475830078125, 10.185546875, 10.895263671875, 11.60498046875, 12.314697265625, 13.0244140625, 13.734130859375, 14.44384765625, 15.153564453125, 15.86328125, 16.572998046875, 17.28271484375, 17.992431640625, 18.7021484375, 19.411865234375, 20.12158203125, 20.831298828125, 21.541015625, 22.250732421875, 22.96044921875, 23.670166015625, 24.3798828125, 25.089599609375, 25.79931640625, 26.509033203125, 27.21875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 8.0, 8.0, 5.0, 14.0, 16.0, 13.0, 25.0, 43.0, 36.0, 35.0, 59.0, 42.0, 50.0, 60.0, 57.0, 62.0, 73.0, 63.0, 44.0, 50.0, 50.0, 28.0, 41.0, 33.0, 28.0, 12.0, 13.0, 9.0, 5.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.89752197265625, -6.6427001953125, -6.38787841796875, -6.133056640625, -5.87823486328125, -5.6234130859375, -5.36859130859375, -5.11376953125, -4.85894775390625, -4.6041259765625, -4.34930419921875, -4.094482421875, -3.83966064453125, -3.5848388671875, -3.33001708984375, -3.0751953125, -2.82037353515625, -2.5655517578125, -2.31072998046875, -2.055908203125, -1.80108642578125, -1.5462646484375, -1.29144287109375, -1.03662109375, -0.78179931640625, -0.5269775390625, -0.27215576171875, -0.017333984375, 0.23748779296875, 0.4923095703125, 0.74713134765625, 1.001953125, 1.25677490234375, 1.5115966796875, 1.76641845703125, 2.021240234375, 2.27606201171875, 2.5308837890625, 2.78570556640625, 3.04052734375, 3.29534912109375, 3.5501708984375, 3.80499267578125, 4.059814453125, 4.31463623046875, 4.5694580078125, 4.82427978515625, 5.0791015625, 5.33392333984375, 5.5887451171875, 5.84356689453125, 6.098388671875, 6.35321044921875, 6.6080322265625, 6.86285400390625, 7.11767578125, 7.37249755859375, 7.6273193359375, 7.88214111328125, 8.136962890625, 8.39178466796875, 8.6466064453125, 8.90142822265625, 9.15625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 10.0, 25.0, 35.0, 58.0, 106.0, 216.0, 494.0, 1184.0, 3515.0, 14871.0, 98618.0, 613166.0, 273755.0, 32639.0, 6452.0, 1990.0, 733.0, 317.0, 145.0, 84.0, 45.0, 29.0, 26.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.1221923828125, -5.916259765625, -5.7103271484375, -5.50439453125, -5.2984619140625, -5.092529296875, -4.8865966796875, -4.6806640625, -4.4747314453125, -4.268798828125, -4.0628662109375, -3.85693359375, -3.6510009765625, -3.445068359375, -3.2391357421875, -3.033203125, -2.8272705078125, -2.621337890625, -2.4154052734375, -2.20947265625, -2.0035400390625, -1.797607421875, -1.5916748046875, -1.3857421875, -1.1798095703125, -0.973876953125, -0.7679443359375, -0.56201171875, -0.3560791015625, -0.150146484375, 0.0557861328125, 0.26171875, 0.4676513671875, 0.673583984375, 0.8795166015625, 1.08544921875, 1.2913818359375, 1.497314453125, 1.7032470703125, 1.9091796875, 2.1151123046875, 2.321044921875, 2.5269775390625, 2.73291015625, 2.9388427734375, 3.144775390625, 3.3507080078125, 3.556640625, 3.7625732421875, 3.968505859375, 4.1744384765625, 4.38037109375, 4.5863037109375, 4.792236328125, 4.9981689453125, 5.2041015625, 5.4100341796875, 5.615966796875, 5.8218994140625, 6.02783203125, 6.2337646484375, 6.439697265625, 6.6456298828125, 6.8515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 4.0, 12.0, 3.0, 21.0, 24.0, 21.0, 38.0, 41.0, 51.0, 83.0, 96.0, 113.0, 99.0, 77.0, 69.0, 48.0, 58.0, 35.0, 30.0, 14.0, 20.0, 10.0, 8.0, 5.0, 4.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005918741226196289, -0.0005757808685302734, -0.000559687614440918, -0.0005435943603515625, -0.000527501106262207, -0.0005114078521728516, -0.0004953145980834961, -0.0004792213439941406, -0.00046312808990478516, -0.0004470348358154297, -0.0004309415817260742, -0.00041484832763671875, -0.0003987550735473633, -0.0003826618194580078, -0.00036656856536865234, -0.0003504753112792969, -0.0003343820571899414, -0.00031828880310058594, -0.00030219554901123047, -0.000286102294921875, -0.00027000904083251953, -0.00025391578674316406, -0.0002378225326538086, -0.00022172927856445312, -0.00020563602447509766, -0.0001895427703857422, -0.00017344951629638672, -0.00015735626220703125, -0.00014126300811767578, -0.0001251697540283203, -0.00010907649993896484, -9.298324584960938e-05, -7.68899917602539e-05, -6.079673767089844e-05, -4.470348358154297e-05, -2.86102294921875e-05, -1.2516975402832031e-05, 3.5762786865234375e-06, 1.9669532775878906e-05, 3.5762786865234375e-05, 5.1856040954589844e-05, 6.794929504394531e-05, 8.404254913330078e-05, 0.00010013580322265625, 0.00011622905731201172, 0.0001323223114013672, 0.00014841556549072266, 0.00016450881958007812, 0.0001806020736694336, 0.00019669532775878906, 0.00021278858184814453, 0.0002288818359375, 0.00024497509002685547, 0.00026106834411621094, 0.0002771615982055664, 0.0002932548522949219, 0.00030934810638427734, 0.0003254413604736328, 0.0003415346145629883, 0.00035762786865234375, 0.0003737211227416992, 0.0003898143768310547, 0.00040590763092041016, 0.0004220008850097656]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 11.0, 8.0, 21.0, 23.0, 38.0, 71.0, 119.0, 251.0, 620.0, 1770.0, 6314.0, 36881.0, 375119.0, 553421.0, 61253.0, 9009.0, 2147.0, 769.0, 295.0, 163.0, 78.0, 43.0, 39.0, 30.0, 16.0, 5.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3597412109375, -6.133544921875, -5.9073486328125, -5.68115234375, -5.4549560546875, -5.228759765625, -5.0025634765625, -4.7763671875, -4.5501708984375, -4.323974609375, -4.0977783203125, -3.87158203125, -3.6453857421875, -3.419189453125, -3.1929931640625, -2.966796875, -2.7406005859375, -2.514404296875, -2.2882080078125, -2.06201171875, -1.8358154296875, -1.609619140625, -1.3834228515625, -1.1572265625, -0.9310302734375, -0.704833984375, -0.4786376953125, -0.25244140625, -0.0262451171875, 0.199951171875, 0.4261474609375, 0.65234375, 0.8785400390625, 1.104736328125, 1.3309326171875, 1.55712890625, 1.7833251953125, 2.009521484375, 2.2357177734375, 2.4619140625, 2.6881103515625, 2.914306640625, 3.1405029296875, 3.36669921875, 3.5928955078125, 3.819091796875, 4.0452880859375, 4.271484375, 4.4976806640625, 4.723876953125, 4.9500732421875, 5.17626953125, 5.4024658203125, 5.628662109375, 5.8548583984375, 6.0810546875, 6.3072509765625, 6.533447265625, 6.7596435546875, 6.98583984375, 7.2120361328125, 7.438232421875, 7.6644287109375, 7.890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 20.0, 18.0, 19.0, 25.0, 38.0, 62.0, 57.0, 50.0, 96.0, 63.0, 86.0, 77.0, 74.0, 61.0, 46.0, 54.0, 25.0, 21.0, 12.0, 14.0, 12.0, 6.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.779296875, -3.664825439453125, -3.55035400390625, -3.435882568359375, -3.3214111328125, -3.206939697265625, -3.09246826171875, -2.977996826171875, -2.863525390625, -2.749053955078125, -2.63458251953125, -2.520111083984375, -2.4056396484375, -2.291168212890625, -2.17669677734375, -2.062225341796875, -1.94775390625, -1.833282470703125, -1.71881103515625, -1.604339599609375, -1.4898681640625, -1.375396728515625, -1.26092529296875, -1.146453857421875, -1.031982421875, -0.917510986328125, -0.80303955078125, -0.688568115234375, -0.5740966796875, -0.459625244140625, -0.34515380859375, -0.230682373046875, -0.1162109375, -0.001739501953125, 0.11273193359375, 0.227203369140625, 0.3416748046875, 0.456146240234375, 0.57061767578125, 0.685089111328125, 0.799560546875, 0.914031982421875, 1.02850341796875, 1.142974853515625, 1.2574462890625, 1.371917724609375, 1.48638916015625, 1.600860595703125, 1.71533203125, 1.829803466796875, 1.94427490234375, 2.058746337890625, 2.1732177734375, 2.287689208984375, 2.40216064453125, 2.516632080078125, 2.631103515625, 2.745574951171875, 2.86004638671875, 2.974517822265625, 3.0889892578125, 3.203460693359375, 3.31793212890625, 3.432403564453125, 3.546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 17.0, 293.0, 629.0, 59.0, 12.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.71131896972656, -65.57402801513672, -56.436729431152344, -47.2994384765625, -38.16214370727539, -29.02484893798828, -19.887557983398438, -10.750263214111328, -1.6129684448242188, 7.524325370788574, 16.661619186401367, 25.798912048339844, 34.93620681762695, 44.07350158691406, 53.210792541503906, 62.348087310791016, 71.48538208007812, 80.62267303466797, 89.75997161865234, 98.89726257324219, 108.03456115722656, 117.1718521118164, 126.30914306640625, 135.44644165039062, 144.583740234375, 153.72103881835938, 162.8583221435547, 171.99562072753906, 181.13291931152344, 190.27020263671875, 199.40750122070312, 208.5447998046875, 217.68209838867188, 226.81939697265625, 235.95668029785156, 245.09397888183594, 254.2312774658203, 263.3685607910156, 272.505859375, 281.6431579589844, 290.78045654296875, 299.9177551269531, 309.0550537109375, 318.19232177734375, 327.3296203613281, 336.4669189453125, 345.6042175292969, 354.74151611328125, 363.8787841796875, 373.0160827636719, 382.15338134765625, 391.2906494140625, 400.4279479980469, 409.56524658203125, 418.7025451660156, 427.83984375, 436.9771423339844, 446.11444091796875, 455.2517395019531, 464.3890380859375, 473.52630615234375, 482.6636047363281, 491.8009033203125, 500.9382019042969, 510.07550048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 7.0, 24.0, 26.0, 36.0, 32.0, 49.0, 60.0, 59.0, 70.0, 68.0, 69.0, 61.0, 54.0, 56.0, 47.0, 45.0, 43.0, 36.0, 34.0, 25.0, 19.0, 21.0, 6.0, 10.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.18724822998047, -43.58382034301758, -41.98039627075195, -40.37696838378906, -38.77354049682617, -37.17011260986328, -35.566688537597656, -33.963260650634766, -32.359832763671875, -30.756406784057617, -29.152978897094727, -27.54955291748047, -25.946125030517578, -24.34269905090332, -22.739273071289062, -21.135845184326172, -19.532421112060547, -17.92899513244629, -16.3255672454834, -14.72214126586914, -13.118714332580566, -11.515287399291992, -9.911861419677734, -8.30843448638916, -6.705007553100586, -5.101580619812012, -3.4981541633605957, -1.8947277069091797, -0.29130077362060547, 1.3121261596679688, 2.9155521392822266, 4.518979072570801, 6.122406005859375, 7.725832939147949, 9.329259872436523, 10.932685852050781, 12.536112785339355, 14.13953971862793, 15.742965698242188, 17.346393585205078, 18.949819564819336, 20.553245544433594, 22.156673431396484, 23.760099411010742, 25.363525390625, 26.96695327758789, 28.57037925720215, 30.173805236816406, 31.777233123779297, 33.38066101074219, 34.98408508300781, 36.5875129699707, 38.190940856933594, 39.79436492919922, 41.39779281616211, 43.001220703125, 44.604644775390625, 46.208072662353516, 47.81149673461914, 49.41492462158203, 51.01835250854492, 52.62178039550781, 54.22520446777344, 55.82863235473633, 57.43206024169922]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 11.0, 13.0, 18.0, 21.0, 42.0, 56.0, 92.0, 151.0, 253.0, 621.0, 1655.0, 7574.0, 162692.0, 3990109.0, 25948.0, 3441.0, 867.0, 350.0, 155.0, 90.0, 52.0, 19.0, 13.0, 12.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-42.03125, -41.08154296875, -40.1318359375, -39.18212890625, -38.232421875, -37.28271484375, -36.3330078125, -35.38330078125, -34.43359375, -33.48388671875, -32.5341796875, -31.58447265625, -30.634765625, -29.68505859375, -28.7353515625, -27.78564453125, -26.8359375, -25.88623046875, -24.9365234375, -23.98681640625, -23.037109375, -22.08740234375, -21.1376953125, -20.18798828125, -19.23828125, -18.28857421875, -17.3388671875, -16.38916015625, -15.439453125, -14.48974609375, -13.5400390625, -12.59033203125, -11.640625, -10.69091796875, -9.7412109375, -8.79150390625, -7.841796875, -6.89208984375, -5.9423828125, -4.99267578125, -4.04296875, -3.09326171875, -2.1435546875, -1.19384765625, -0.244140625, 0.70556640625, 1.6552734375, 2.60498046875, 3.5546875, 4.50439453125, 5.4541015625, 6.40380859375, 7.353515625, 8.30322265625, 9.2529296875, 10.20263671875, 11.15234375, 12.10205078125, 13.0517578125, 14.00146484375, 14.951171875, 15.90087890625, 16.8505859375, 17.80029296875, 18.75]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 11.0, 10.0, 17.0, 35.0, 43.0, 69.0, 69.0, 91.0, 98.0, 96.0, 92.0, 89.0, 74.0, 63.0, 41.0, 28.0, 31.0, 17.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.114501953125, -3.03759765625, -2.960693359375, -2.8837890625, -2.806884765625, -2.72998046875, -2.653076171875, -2.576171875, -2.499267578125, -2.42236328125, -2.345458984375, -2.2685546875, -2.191650390625, -2.11474609375, -2.037841796875, -1.9609375, -1.884033203125, -1.80712890625, -1.730224609375, -1.6533203125, -1.576416015625, -1.49951171875, -1.422607421875, -1.345703125, -1.268798828125, -1.19189453125, -1.114990234375, -1.0380859375, -0.961181640625, -0.88427734375, -0.807373046875, -0.73046875, -0.653564453125, -0.57666015625, -0.499755859375, -0.4228515625, -0.345947265625, -0.26904296875, -0.192138671875, -0.115234375, -0.038330078125, 0.03857421875, 0.115478515625, 0.1923828125, 0.269287109375, 0.34619140625, 0.423095703125, 0.5, 0.576904296875, 0.65380859375, 0.730712890625, 0.8076171875, 0.884521484375, 0.96142578125, 1.038330078125, 1.115234375, 1.192138671875, 1.26904296875, 1.345947265625, 1.4228515625, 1.499755859375, 1.57666015625, 1.653564453125, 1.73046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 18.0, 39.0, 52.0, 80.0, 147.0, 734.0, 4190635.0, 2061.0, 217.0, 101.0, 71.0, 45.0, 31.0, 21.0, 18.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.625, -62.671875, -57.71875, -52.765625, -47.8125, -42.859375, -37.90625, -32.953125, -28.0, -23.046875, -18.09375, -13.140625, -8.1875, -3.234375, 1.71875, 6.671875, 11.625, 16.578125, 21.53125, 26.484375, 31.4375, 36.390625, 41.34375, 46.296875, 51.25, 56.203125, 61.15625, 66.109375, 71.0625, 76.015625, 80.96875, 85.921875, 90.875, 95.828125, 100.78125, 105.734375, 110.6875, 115.640625, 120.59375, 125.546875, 130.5, 135.453125, 140.40625, 145.359375, 150.3125, 155.265625, 160.21875, 165.171875, 170.125, 175.078125, 180.03125, 184.984375, 189.9375, 194.890625, 199.84375, 204.796875, 209.75, 214.703125, 219.65625, 224.609375, 229.5625, 234.515625, 239.46875, 244.421875, 249.375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 18.0, 73.0, 768.0, 3013.0, 167.0, 34.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.450927734375, -8.01123046875, -7.571533203125, -7.1318359375, -6.692138671875, -6.25244140625, -5.812744140625, -5.373046875, -4.933349609375, -4.49365234375, -4.053955078125, -3.6142578125, -3.174560546875, -2.73486328125, -2.295166015625, -1.85546875, -1.415771484375, -0.97607421875, -0.536376953125, -0.0966796875, 0.343017578125, 0.78271484375, 1.222412109375, 1.662109375, 2.101806640625, 2.54150390625, 2.981201171875, 3.4208984375, 3.860595703125, 4.30029296875, 4.739990234375, 5.1796875, 5.619384765625, 6.05908203125, 6.498779296875, 6.9384765625, 7.378173828125, 7.81787109375, 8.257568359375, 8.697265625, 9.136962890625, 9.57666015625, 10.016357421875, 10.4560546875, 10.895751953125, 11.33544921875, 11.775146484375, 12.21484375, 12.654541015625, 13.09423828125, 13.533935546875, 13.9736328125, 14.413330078125, 14.85302734375, 15.292724609375, 15.732421875, 16.172119140625, 16.61181640625, 17.051513671875, 17.4912109375, 17.930908203125, 18.37060546875, 18.810302734375, 19.25]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 959.0, 44.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-488.052978515625, -477.8087463378906, -467.5644836425781, -457.32025146484375, -447.07598876953125, -436.8317565917969, -426.5874938964844, -416.34326171875, -406.0989990234375, -395.8547668457031, -385.6105041503906, -375.36627197265625, -365.12200927734375, -354.8777770996094, -344.6335144042969, -334.3892822265625, -324.14501953125, -313.9007873535156, -303.6565246582031, -293.41229248046875, -283.16802978515625, -272.9237976074219, -262.6795349121094, -252.435302734375, -242.19107055664062, -231.9468231201172, -221.70257568359375, -211.4583282470703, -201.21408081054688, -190.96983337402344, -180.7255859375, -170.48135375976562, -160.23709106445312, -149.9928436279297, -139.74859619140625, -129.5043487548828, -119.26010131835938, -109.01585388183594, -98.77161407470703, -88.5273666381836, -78.28311920166016, -68.03887176513672, -57.79462432861328, -47.55038070678711, -37.30613327026367, -27.061885833740234, -16.817642211914062, -6.573394775390625, 3.6708526611328125, 13.915099143981934, 24.159345626831055, 34.40359115600586, 44.6478385925293, 54.892086029052734, 65.1363296508789, 75.38057708740234, 85.62482452392578, 95.86907196044922, 106.11331939697266, 116.35755920410156, 126.601806640625, 136.84605407714844, 147.09030151367188, 157.3345489501953, 167.57879638671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 10.0, 20.0, 23.0, 35.0, 47.0, 85.0, 95.0, 115.0, 102.0, 109.0, 84.0, 75.0, 61.0, 46.0, 32.0, 23.0, 18.0, 11.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.2419490814209, -28.393123626708984, -27.54429817199707, -26.695472717285156, -25.846647262573242, -24.997821807861328, -24.148998260498047, -23.3001708984375, -22.45134735107422, -21.602521896362305, -20.75369644165039, -19.904870986938477, -19.056045532226562, -18.20722007751465, -17.358394622802734, -16.509571075439453, -15.660743713378906, -14.811918258666992, -13.963092803955078, -13.114267349243164, -12.26544189453125, -11.416616439819336, -10.567791938781738, -9.718966484069824, -8.87014102935791, -8.021315574645996, -7.172490119934082, -6.323665142059326, -5.474839687347412, -4.626014232635498, -3.777189254760742, -2.928363800048828, -2.0795364379882812, -1.2307111024856567, -0.3818857669830322, 0.46693944931030273, 1.3157649040222168, 2.164590358734131, 3.0134153366088867, 3.862240791320801, 4.711066246032715, 5.559891700744629, 6.408717155456543, 7.257542133331299, 8.106367111206055, 8.955192565917969, 9.804018020629883, 10.652843475341797, 11.501668930053711, 12.350494384765625, 13.199319839477539, 14.048145294189453, 14.896970748901367, 15.745796203613281, 16.594619750976562, 17.44344711303711, 18.29227066040039, 19.141096115112305, 19.98992156982422, 20.838747024536133, 21.687572479248047, 22.53639793395996, 23.385223388671875, 24.234046936035156, 25.082874298095703]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 13.0, 20.0, 22.0, 29.0, 64.0, 94.0, 164.0, 356.0, 840.0, 2731.0, 13571.0, 113843.0, 682129.0, 206818.0, 21994.0, 3892.0, 1107.0, 398.0, 203.0, 107.0, 58.0, 33.0, 24.0, 14.0, 17.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-21.484375, -21.0029296875, -20.521484375, -20.0400390625, -19.55859375, -19.0771484375, -18.595703125, -18.1142578125, -17.6328125, -17.1513671875, -16.669921875, -16.1884765625, -15.70703125, -15.2255859375, -14.744140625, -14.2626953125, -13.78125, -13.2998046875, -12.818359375, -12.3369140625, -11.85546875, -11.3740234375, -10.892578125, -10.4111328125, -9.9296875, -9.4482421875, -8.966796875, -8.4853515625, -8.00390625, -7.5224609375, -7.041015625, -6.5595703125, -6.078125, -5.5966796875, -5.115234375, -4.6337890625, -4.15234375, -3.6708984375, -3.189453125, -2.7080078125, -2.2265625, -1.7451171875, -1.263671875, -0.7822265625, -0.30078125, 0.1806640625, 0.662109375, 1.1435546875, 1.625, 2.1064453125, 2.587890625, 3.0693359375, 3.55078125, 4.0322265625, 4.513671875, 4.9951171875, 5.4765625, 5.9580078125, 6.439453125, 6.9208984375, 7.40234375, 7.8837890625, 8.365234375, 8.8466796875, 9.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 9.0, 11.0, 16.0, 26.0, 31.0, 54.0, 49.0, 55.0, 78.0, 79.0, 79.0, 76.0, 68.0, 71.0, 66.0, 54.0, 40.0, 28.0, 32.0, 29.0, 13.0, 12.0, 4.0, 11.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.1927642822265625, -2.133575439453125, -2.0743865966796875, -2.01519775390625, -1.9560089111328125, -1.896820068359375, -1.8376312255859375, -1.7784423828125, -1.7192535400390625, -1.660064697265625, -1.6008758544921875, -1.54168701171875, -1.4824981689453125, -1.423309326171875, -1.3641204833984375, -1.304931640625, -1.2457427978515625, -1.186553955078125, -1.1273651123046875, -1.06817626953125, -1.0089874267578125, -0.949798583984375, -0.8906097412109375, -0.8314208984375, -0.7722320556640625, -0.713043212890625, -0.6538543701171875, -0.59466552734375, -0.5354766845703125, -0.476287841796875, -0.4170989990234375, -0.35791015625, -0.2987213134765625, -0.239532470703125, -0.1803436279296875, -0.12115478515625, -0.0619659423828125, -0.002777099609375, 0.0564117431640625, 0.1156005859375, 0.1747894287109375, 0.233978271484375, 0.2931671142578125, 0.35235595703125, 0.4115447998046875, 0.470733642578125, 0.5299224853515625, 0.589111328125, 0.6483001708984375, 0.707489013671875, 0.7666778564453125, 0.82586669921875, 0.8850555419921875, 0.944244384765625, 1.0034332275390625, 1.0626220703125, 1.1218109130859375, 1.180999755859375, 1.2401885986328125, 1.29937744140625, 1.3585662841796875, 1.417755126953125, 1.4769439697265625, 1.5361328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 13.0, 14.0, 22.0, 41.0, 47.0, 91.0, 162.0, 255.0, 568.0, 1387.0, 4325.0, 25960.0, 412898.0, 558567.0, 35972.0, 5254.0, 1500.0, 666.0, 327.0, 190.0, 90.0, 61.0, 46.0, 28.0, 16.0, 13.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0, -18.4874267578125, -17.974853515625, -17.4622802734375, -16.94970703125, -16.4371337890625, -15.924560546875, -15.4119873046875, -14.8994140625, -14.3868408203125, -13.874267578125, -13.3616943359375, -12.84912109375, -12.3365478515625, -11.823974609375, -11.3114013671875, -10.798828125, -10.2862548828125, -9.773681640625, -9.2611083984375, -8.74853515625, -8.2359619140625, -7.723388671875, -7.2108154296875, -6.6982421875, -6.1856689453125, -5.673095703125, -5.1605224609375, -4.64794921875, -4.1353759765625, -3.622802734375, -3.1102294921875, -2.59765625, -2.0850830078125, -1.572509765625, -1.0599365234375, -0.54736328125, -0.0347900390625, 0.477783203125, 0.9903564453125, 1.5029296875, 2.0155029296875, 2.528076171875, 3.0406494140625, 3.55322265625, 4.0657958984375, 4.578369140625, 5.0909423828125, 5.603515625, 6.1160888671875, 6.628662109375, 7.1412353515625, 7.65380859375, 8.1663818359375, 8.678955078125, 9.1915283203125, 9.7041015625, 10.2166748046875, 10.729248046875, 11.2418212890625, 11.75439453125, 12.2669677734375, 12.779541015625, 13.2921142578125, 13.8046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 13.0, 17.0, 11.0, 18.0, 22.0, 17.0, 28.0, 29.0, 60.0, 44.0, 49.0, 56.0, 55.0, 59.0, 46.0, 63.0, 59.0, 52.0, 47.0, 43.0, 37.0, 27.0, 24.0, 22.0, 13.0, 22.0, 15.0, 8.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.44921875, -7.222900390625, -6.99658203125, -6.770263671875, -6.5439453125, -6.317626953125, -6.09130859375, -5.864990234375, -5.638671875, -5.412353515625, -5.18603515625, -4.959716796875, -4.7333984375, -4.507080078125, -4.28076171875, -4.054443359375, -3.828125, -3.601806640625, -3.37548828125, -3.149169921875, -2.9228515625, -2.696533203125, -2.47021484375, -2.243896484375, -2.017578125, -1.791259765625, -1.56494140625, -1.338623046875, -1.1123046875, -0.885986328125, -0.65966796875, -0.433349609375, -0.20703125, 0.019287109375, 0.24560546875, 0.471923828125, 0.6982421875, 0.924560546875, 1.15087890625, 1.377197265625, 1.603515625, 1.829833984375, 2.05615234375, 2.282470703125, 2.5087890625, 2.735107421875, 2.96142578125, 3.187744140625, 3.4140625, 3.640380859375, 3.86669921875, 4.093017578125, 4.3193359375, 4.545654296875, 4.77197265625, 4.998291015625, 5.224609375, 5.450927734375, 5.67724609375, 5.903564453125, 6.1298828125, 6.356201171875, 6.58251953125, 6.808837890625, 7.03515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 12.0, 15.0, 26.0, 54.0, 89.0, 111.0, 200.0, 333.0, 682.0, 1636.0, 4207.0, 12731.0, 52772.0, 346907.0, 520123.0, 81336.0, 17876.0, 5595.0, 2013.0, 837.0, 396.0, 212.0, 122.0, 74.0, 54.0, 35.0, 21.0, 18.0, 9.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.1678466796875, -4.984130859375, -4.8004150390625, -4.61669921875, -4.4329833984375, -4.249267578125, -4.0655517578125, -3.8818359375, -3.6981201171875, -3.514404296875, -3.3306884765625, -3.14697265625, -2.9632568359375, -2.779541015625, -2.5958251953125, -2.412109375, -2.2283935546875, -2.044677734375, -1.8609619140625, -1.67724609375, -1.4935302734375, -1.309814453125, -1.1260986328125, -0.9423828125, -0.7586669921875, -0.574951171875, -0.3912353515625, -0.20751953125, -0.0238037109375, 0.159912109375, 0.3436279296875, 0.52734375, 0.7110595703125, 0.894775390625, 1.0784912109375, 1.26220703125, 1.4459228515625, 1.629638671875, 1.8133544921875, 1.9970703125, 2.1807861328125, 2.364501953125, 2.5482177734375, 2.73193359375, 2.9156494140625, 3.099365234375, 3.2830810546875, 3.466796875, 3.6505126953125, 3.834228515625, 4.0179443359375, 4.20166015625, 4.3853759765625, 4.569091796875, 4.7528076171875, 4.9365234375, 5.1202392578125, 5.303955078125, 5.4876708984375, 5.67138671875, 5.8551025390625, 6.038818359375, 6.2225341796875, 6.40625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 9.0, 6.0, 11.0, 16.0, 21.0, 31.0, 39.0, 52.0, 87.0, 109.0, 128.0, 113.0, 114.0, 72.0, 55.0, 44.0, 29.0, 17.0, 10.0, 8.0, 8.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006842613220214844, -0.0006606057286262512, -0.0006369501352310181, -0.0006132945418357849, -0.0005896389484405518, -0.0005659833550453186, -0.0005423277616500854, -0.0005186721682548523, -0.0004950165748596191, -0.000471360981464386, -0.00044770538806915283, -0.0004240497946739197, -0.0004003942012786865, -0.00037673860788345337, -0.0003530830144882202, -0.00032942742109298706, -0.0003057718276977539, -0.00028211623430252075, -0.0002584606409072876, -0.00023480504751205444, -0.0002111494541168213, -0.00018749386072158813, -0.00016383826732635498, -0.00014018267393112183, -0.00011652708053588867, -9.287148714065552e-05, -6.921589374542236e-05, -4.556030035018921e-05, -2.1904706954956055e-05, 1.7508864402770996e-06, 2.5406479835510254e-05, 4.906207323074341e-05, 7.271766662597656e-05, 9.637326002120972e-05, 0.00012002885341644287, 0.00014368444681167603, 0.00016734004020690918, 0.00019099563360214233, 0.0002146512269973755, 0.00023830682039260864, 0.0002619624137878418, 0.00028561800718307495, 0.0003092736005783081, 0.00033292919397354126, 0.0003565847873687744, 0.00038024038076400757, 0.0004038959741592407, 0.0004275515675544739, 0.00045120716094970703, 0.0004748627543449402, 0.0004985183477401733, 0.0005221739411354065, 0.0005458295345306396, 0.0005694851279258728, 0.000593140721321106, 0.0006167963147163391, 0.0006404519081115723, 0.0006641075015068054, 0.0006877630949020386, 0.0007114186882972717, 0.0007350742816925049, 0.000758729875087738, 0.0007823854684829712, 0.0008060410618782043, 0.0008296966552734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 9.0, 7.0, 9.0, 15.0, 23.0, 47.0, 66.0, 120.0, 246.0, 532.0, 1201.0, 3451.0, 14371.0, 109066.0, 740873.0, 153842.0, 17888.0, 4134.0, 1416.0, 612.0, 305.0, 133.0, 71.0, 42.0, 29.0, 16.0, 17.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.09375, -5.8643798828125, -5.635009765625, -5.4056396484375, -5.17626953125, -4.9468994140625, -4.717529296875, -4.4881591796875, -4.2587890625, -4.0294189453125, -3.800048828125, -3.5706787109375, -3.34130859375, -3.1119384765625, -2.882568359375, -2.6531982421875, -2.423828125, -2.1944580078125, -1.965087890625, -1.7357177734375, -1.50634765625, -1.2769775390625, -1.047607421875, -0.8182373046875, -0.5888671875, -0.3594970703125, -0.130126953125, 0.0992431640625, 0.32861328125, 0.5579833984375, 0.787353515625, 1.0167236328125, 1.24609375, 1.4754638671875, 1.704833984375, 1.9342041015625, 2.16357421875, 2.3929443359375, 2.622314453125, 2.8516845703125, 3.0810546875, 3.3104248046875, 3.539794921875, 3.7691650390625, 3.99853515625, 4.2279052734375, 4.457275390625, 4.6866455078125, 4.916015625, 5.1453857421875, 5.374755859375, 5.6041259765625, 5.83349609375, 6.0628662109375, 6.292236328125, 6.5216064453125, 6.7509765625, 6.9803466796875, 7.209716796875, 7.4390869140625, 7.66845703125, 7.8978271484375, 8.127197265625, 8.3565673828125, 8.5859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 9.0, 5.0, 10.0, 20.0, 16.0, 20.0, 23.0, 31.0, 40.0, 47.0, 71.0, 82.0, 90.0, 78.0, 84.0, 76.0, 49.0, 43.0, 36.0, 34.0, 19.0, 20.0, 19.0, 16.0, 9.0, 5.0, 6.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.333831787109375, -3.22625732421875, -3.118682861328125, -3.0111083984375, -2.903533935546875, -2.79595947265625, -2.688385009765625, -2.580810546875, -2.473236083984375, -2.36566162109375, -2.258087158203125, -2.1505126953125, -2.042938232421875, -1.93536376953125, -1.827789306640625, -1.72021484375, -1.612640380859375, -1.50506591796875, -1.397491455078125, -1.2899169921875, -1.182342529296875, -1.07476806640625, -0.967193603515625, -0.859619140625, -0.752044677734375, -0.64447021484375, -0.536895751953125, -0.4293212890625, -0.321746826171875, -0.21417236328125, -0.106597900390625, 0.0009765625, 0.108551025390625, 0.21612548828125, 0.323699951171875, 0.4312744140625, 0.538848876953125, 0.64642333984375, 0.753997802734375, 0.861572265625, 0.969146728515625, 1.07672119140625, 1.184295654296875, 1.2918701171875, 1.399444580078125, 1.50701904296875, 1.614593505859375, 1.72216796875, 1.829742431640625, 1.93731689453125, 2.044891357421875, 2.1524658203125, 2.260040283203125, 2.36761474609375, 2.475189208984375, 2.582763671875, 2.690338134765625, 2.79791259765625, 2.905487060546875, 3.0130615234375, 3.120635986328125, 3.22821044921875, 3.335784912109375, 3.443359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 30.0, 162.0, 400.0, 295.0, 73.0, 24.0, 12.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-245.78265380859375, -240.52084350585938, -235.259033203125, -229.99722290039062, -224.73541259765625, -219.47360229492188, -214.2117919921875, -208.94998168945312, -203.68817138671875, -198.42636108398438, -193.16455078125, -187.90274047851562, -182.64093017578125, -177.37911987304688, -172.1173095703125, -166.85549926757812, -161.59368896484375, -156.33187866210938, -151.070068359375, -145.80825805664062, -140.54644775390625, -135.28463745117188, -130.0228271484375, -124.76101684570312, -119.49922180175781, -114.23741149902344, -108.97560119628906, -103.71379089355469, -98.45198059082031, -93.19017028808594, -87.92835998535156, -82.66654968261719, -77.40473937988281, -72.14292907714844, -66.88111877441406, -61.61930847167969, -56.35749816894531, -51.09568786621094, -45.83388137817383, -40.57207107543945, -35.31026077270508, -30.048450469970703, -24.786640167236328, -19.524831771850586, -14.263021469116211, -9.001211166381836, -3.7394027709960938, 1.5224075317382812, 6.784217834472656, 12.046028137207031, 17.307838439941406, 22.56964683532715, 27.831457138061523, 33.09326934814453, 38.35507583618164, 43.616886138916016, 48.87869644165039, 54.140506744384766, 59.40231704711914, 64.66412353515625, 69.92593383789062, 75.187744140625, 80.44955444335938, 85.71136474609375, 90.97317504882812]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 15.0, 8.0, 15.0, 9.0, 23.0, 33.0, 33.0, 47.0, 44.0, 43.0, 69.0, 54.0, 65.0, 61.0, 74.0, 65.0, 56.0, 34.0, 49.0, 30.0, 39.0, 34.0, 24.0, 18.0, 7.0, 6.0, 12.0, 9.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.54570007324219, -48.94247055053711, -47.339237213134766, -45.73600769042969, -44.13277816772461, -42.52954864501953, -40.92631530761719, -39.32308578491211, -37.71985626220703, -36.11662673950195, -34.51339340209961, -32.91016387939453, -31.306934356689453, -29.703702926635742, -28.10047149658203, -26.497241973876953, -24.89400863647461, -23.2907772064209, -21.68754768371582, -20.08431625366211, -18.48108673095703, -16.87785530090332, -15.27462387084961, -13.671393394470215, -12.06816291809082, -10.464932441711426, -8.861701965332031, -7.25847053527832, -5.655240058898926, -4.052009582519531, -2.4487781524658203, -0.8455476760864258, 0.7576828002929688, 2.3609135150909424, 3.964144229888916, 5.567375183105469, 7.170605659484863, 8.773836135864258, 10.377067565917969, 11.980298042297363, 13.583528518676758, 15.186758995056152, 16.789989471435547, 18.393220901489258, 19.99645233154297, 21.599681854248047, 23.202913284301758, 24.80614471435547, 26.409374237060547, 28.012605667114258, 29.615835189819336, 31.219066619873047, 32.822296142578125, 34.42552947998047, 36.02875900268555, 37.631988525390625, 39.23522186279297, 40.83845138549805, 42.44168472290039, 44.04491424560547, 45.64814376831055, 47.251373291015625, 48.85460662841797, 50.45783615112305, 52.061065673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 11.0, 6.0, 22.0, 23.0, 32.0, 36.0, 45.0, 69.0, 87.0, 129.0, 190.0, 250.0, 428.0, 789.0, 1502.0, 3547.0, 9270.0, 31486.0, 163520.0, 3494122.0, 412112.0, 53680.0, 13996.0, 4825.0, 1963.0, 952.0, 440.0, 290.0, 170.0, 109.0, 62.0, 25.0, 21.0, 10.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-17.03125, -16.6322021484375, -16.233154296875, -15.8341064453125, -15.43505859375, -15.0360107421875, -14.636962890625, -14.2379150390625, -13.8388671875, -13.4398193359375, -13.040771484375, -12.6417236328125, -12.24267578125, -11.8436279296875, -11.444580078125, -11.0455322265625, -10.646484375, -10.2474365234375, -9.848388671875, -9.4493408203125, -9.05029296875, -8.6512451171875, -8.252197265625, -7.8531494140625, -7.4541015625, -7.0550537109375, -6.656005859375, -6.2569580078125, -5.85791015625, -5.4588623046875, -5.059814453125, -4.6607666015625, -4.26171875, -3.8626708984375, -3.463623046875, -3.0645751953125, -2.66552734375, -2.2664794921875, -1.867431640625, -1.4683837890625, -1.0693359375, -0.6702880859375, -0.271240234375, 0.1278076171875, 0.52685546875, 0.9259033203125, 1.324951171875, 1.7239990234375, 2.123046875, 2.5220947265625, 2.921142578125, 3.3201904296875, 3.71923828125, 4.1182861328125, 4.517333984375, 4.9163818359375, 5.3154296875, 5.7144775390625, 6.113525390625, 6.5125732421875, 6.91162109375, 7.3106689453125, 7.709716796875, 8.1087646484375, 8.5078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 7.0, 14.0, 27.0, 23.0, 24.0, 42.0, 42.0, 53.0, 57.0, 62.0, 64.0, 65.0, 75.0, 75.0, 68.0, 55.0, 51.0, 34.0, 32.0, 27.0, 27.0, 18.0, 14.0, 12.0, 5.0, 6.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.9850921630859375, -1.931121826171875, -1.8771514892578125, -1.82318115234375, -1.7692108154296875, -1.715240478515625, -1.6612701416015625, -1.6072998046875, -1.5533294677734375, -1.499359130859375, -1.4453887939453125, -1.39141845703125, -1.3374481201171875, -1.283477783203125, -1.2295074462890625, -1.175537109375, -1.1215667724609375, -1.067596435546875, -1.0136260986328125, -0.95965576171875, -0.9056854248046875, -0.851715087890625, -0.7977447509765625, -0.7437744140625, -0.6898040771484375, -0.635833740234375, -0.5818634033203125, -0.52789306640625, -0.4739227294921875, -0.419952392578125, -0.3659820556640625, -0.31201171875, -0.2580413818359375, -0.204071044921875, -0.1501007080078125, -0.09613037109375, -0.0421600341796875, 0.011810302734375, 0.0657806396484375, 0.1197509765625, 0.1737213134765625, 0.227691650390625, 0.2816619873046875, 0.33563232421875, 0.3896026611328125, 0.443572998046875, 0.4975433349609375, 0.551513671875, 0.6054840087890625, 0.659454345703125, 0.7134246826171875, 0.76739501953125, 0.8213653564453125, 0.875335693359375, 0.9293060302734375, 0.9832763671875, 1.0372467041015625, 1.091217041015625, 1.1451873779296875, 1.19915771484375, 1.2531280517578125, 1.307098388671875, 1.3610687255859375, 1.4150390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 2.0, 13.0, 14.0, 26.0, 44.0, 70.0, 131.0, 271.0, 697.0, 2265.0, 11418.0, 311102.0, 3833163.0, 28964.0, 4131.0, 1136.0, 380.0, 193.0, 92.0, 60.0, 22.0, 20.0, 16.0, 7.0, 12.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.8125, -23.962890625, -23.11328125, -22.263671875, -21.4140625, -20.564453125, -19.71484375, -18.865234375, -18.015625, -17.166015625, -16.31640625, -15.466796875, -14.6171875, -13.767578125, -12.91796875, -12.068359375, -11.21875, -10.369140625, -9.51953125, -8.669921875, -7.8203125, -6.970703125, -6.12109375, -5.271484375, -4.421875, -3.572265625, -2.72265625, -1.873046875, -1.0234375, -0.173828125, 0.67578125, 1.525390625, 2.375, 3.224609375, 4.07421875, 4.923828125, 5.7734375, 6.623046875, 7.47265625, 8.322265625, 9.171875, 10.021484375, 10.87109375, 11.720703125, 12.5703125, 13.419921875, 14.26953125, 15.119140625, 15.96875, 16.818359375, 17.66796875, 18.517578125, 19.3671875, 20.216796875, 21.06640625, 21.916015625, 22.765625, 23.615234375, 24.46484375, 25.314453125, 26.1640625, 27.013671875, 27.86328125, 28.712890625, 29.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 10.0, 16.0, 15.0, 27.0, 34.0, 66.0, 111.0, 251.0, 496.0, 1332.0, 899.0, 374.0, 177.0, 88.0, 42.0, 29.0, 23.0, 10.0, 11.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.456787109375, -4.31201171875, -4.167236328125, -4.0224609375, -3.877685546875, -3.73291015625, -3.588134765625, -3.443359375, -3.298583984375, -3.15380859375, -3.009033203125, -2.8642578125, -2.719482421875, -2.57470703125, -2.429931640625, -2.28515625, -2.140380859375, -1.99560546875, -1.850830078125, -1.7060546875, -1.561279296875, -1.41650390625, -1.271728515625, -1.126953125, -0.982177734375, -0.83740234375, -0.692626953125, -0.5478515625, -0.403076171875, -0.25830078125, -0.113525390625, 0.03125, 0.176025390625, 0.32080078125, 0.465576171875, 0.6103515625, 0.755126953125, 0.89990234375, 1.044677734375, 1.189453125, 1.334228515625, 1.47900390625, 1.623779296875, 1.7685546875, 1.913330078125, 2.05810546875, 2.202880859375, 2.34765625, 2.492431640625, 2.63720703125, 2.781982421875, 2.9267578125, 3.071533203125, 3.21630859375, 3.361083984375, 3.505859375, 3.650634765625, 3.79541015625, 3.940185546875, 4.0849609375, 4.229736328125, 4.37451171875, 4.519287109375, 4.6640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 70.0, 504.0, 370.0, 47.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.36361694335938, -175.72744750976562, -171.09127807617188, -166.45510864257812, -161.81893920898438, -157.18276977539062, -152.54660034179688, -147.91043090820312, -143.27426147460938, -138.63809204101562, -134.00192260742188, -129.36575317382812, -124.72958374023438, -120.09341430664062, -115.45724487304688, -110.82107543945312, -106.1849136352539, -101.54874420166016, -96.9125747680664, -92.27640533447266, -87.6402359008789, -83.00406646728516, -78.36790466308594, -73.73173522949219, -69.09556579589844, -64.45939636230469, -59.82322692871094, -55.18705749511719, -50.55088806152344, -45.91471862792969, -41.2785530090332, -36.64238357543945, -32.00621032714844, -27.370040893554688, -22.733871459960938, -18.09770393371582, -13.46153450012207, -8.82536506652832, -4.189197540283203, 0.4469718933105469, 5.083141326904297, 9.719310760498047, 14.35547924041748, 18.991647720336914, 23.627817153930664, 28.263986587524414, 32.90015411376953, 37.53632354736328, 42.17249298095703, 46.80866241455078, 51.44483184814453, 56.08100128173828, 60.71717071533203, 65.35334014892578, 69.989501953125, 74.62567138671875, 79.2618408203125, 83.89801025390625, 88.5341796875, 93.17034912109375, 97.8065185546875, 102.44268798828125, 107.078857421875, 111.71502685546875, 116.3511962890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 9.0, 10.0, 13.0, 14.0, 23.0, 25.0, 41.0, 40.0, 47.0, 46.0, 48.0, 41.0, 57.0, 51.0, 73.0, 51.0, 65.0, 64.0, 49.0, 44.0, 43.0, 28.0, 28.0, 19.0, 11.0, 15.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.07938003540039, -17.502084732055664, -16.924789428710938, -16.34749412536621, -15.770197868347168, -15.192902565002441, -14.615606307983398, -14.038311004638672, -13.461015701293945, -12.883720397949219, -12.306425094604492, -11.72912883758545, -11.151833534240723, -10.574538230895996, -9.997241973876953, -9.419946670532227, -8.8426513671875, -8.265356063842773, -7.688060283660889, -7.110764503479004, -6.533469200134277, -5.956173896789551, -5.378878116607666, -4.801582336425781, -4.224287033081055, -3.646991491317749, -3.0696959495544434, -2.4924004077911377, -1.915104866027832, -1.3378093242645264, -0.7605137825012207, -0.18321800231933594, 0.3940773010253906, 0.9713728427886963, 1.548668384552002, 2.1259639263153076, 2.7032594680786133, 3.280555009841919, 3.8578505516052246, 4.435146331787109, 5.012441635131836, 5.5897369384765625, 6.167032718658447, 6.744328498840332, 7.321623802185059, 7.898919105529785, 8.476215362548828, 9.053510665893555, 9.630805969238281, 10.208101272583008, 10.785396575927734, 11.362692832946777, 11.939988136291504, 12.51728343963623, 13.094579696655273, 13.671875, 14.249170303344727, 14.826465606689453, 15.40376091003418, 15.981057167053223, 16.558353424072266, 17.135648727416992, 17.71294403076172, 18.290239334106445, 18.867534637451172]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 14.0, 18.0, 14.0, 25.0, 31.0, 43.0, 63.0, 81.0, 149.0, 201.0, 349.0, 733.0, 1613.0, 3928.0, 11547.0, 40190.0, 168317.0, 525376.0, 222112.0, 50998.0, 14292.0, 4706.0, 1760.0, 799.0, 436.0, 245.0, 137.0, 102.0, 49.0, 39.0, 29.0, 25.0, 23.0, 18.0, 9.0, 10.0, 5.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-11.9296875, -11.594482421875, -11.25927734375, -10.924072265625, -10.5888671875, -10.253662109375, -9.91845703125, -9.583251953125, -9.248046875, -8.912841796875, -8.57763671875, -8.242431640625, -7.9072265625, -7.572021484375, -7.23681640625, -6.901611328125, -6.56640625, -6.231201171875, -5.89599609375, -5.560791015625, -5.2255859375, -4.890380859375, -4.55517578125, -4.219970703125, -3.884765625, -3.549560546875, -3.21435546875, -2.879150390625, -2.5439453125, -2.208740234375, -1.87353515625, -1.538330078125, -1.203125, -0.867919921875, -0.53271484375, -0.197509765625, 0.1376953125, 0.472900390625, 0.80810546875, 1.143310546875, 1.478515625, 1.813720703125, 2.14892578125, 2.484130859375, 2.8193359375, 3.154541015625, 3.48974609375, 3.824951171875, 4.16015625, 4.495361328125, 4.83056640625, 5.165771484375, 5.5009765625, 5.836181640625, 6.17138671875, 6.506591796875, 6.841796875, 7.177001953125, 7.51220703125, 7.847412109375, 8.1826171875, 8.517822265625, 8.85302734375, 9.188232421875, 9.5234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 2.0, 14.0, 11.0, 23.0, 18.0, 30.0, 36.0, 29.0, 47.0, 45.0, 76.0, 67.0, 55.0, 59.0, 59.0, 63.0, 51.0, 44.0, 46.0, 52.0, 41.0, 22.0, 23.0, 16.0, 17.0, 13.0, 11.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.097686767578125, -2.04693603515625, -1.996185302734375, -1.9454345703125, -1.894683837890625, -1.84393310546875, -1.793182373046875, -1.742431640625, -1.691680908203125, -1.64093017578125, -1.590179443359375, -1.5394287109375, -1.488677978515625, -1.43792724609375, -1.387176513671875, -1.33642578125, -1.285675048828125, -1.23492431640625, -1.184173583984375, -1.1334228515625, -1.082672119140625, -1.03192138671875, -0.981170654296875, -0.930419921875, -0.879669189453125, -0.82891845703125, -0.778167724609375, -0.7274169921875, -0.676666259765625, -0.62591552734375, -0.575164794921875, -0.5244140625, -0.473663330078125, -0.42291259765625, -0.372161865234375, -0.3214111328125, -0.270660400390625, -0.21990966796875, -0.169158935546875, -0.118408203125, -0.067657470703125, -0.01690673828125, 0.033843994140625, 0.0845947265625, 0.135345458984375, 0.18609619140625, 0.236846923828125, 0.28759765625, 0.338348388671875, 0.38909912109375, 0.439849853515625, 0.4906005859375, 0.541351318359375, 0.59210205078125, 0.642852783203125, 0.693603515625, 0.744354248046875, 0.79510498046875, 0.845855712890625, 0.8966064453125, 0.947357177734375, 0.99810791015625, 1.048858642578125, 1.099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 8.0, 8.0, 15.0, 18.0, 35.0, 51.0, 57.0, 112.0, 191.0, 422.0, 1039.0, 3414.0, 16971.0, 122106.0, 629063.0, 236352.0, 30614.0, 5328.0, 1522.0, 572.0, 255.0, 137.0, 93.0, 45.0, 23.0, 31.0, 15.0, 5.0, 9.0, 5.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4453125, -12.0963134765625, -11.747314453125, -11.3983154296875, -11.04931640625, -10.7003173828125, -10.351318359375, -10.0023193359375, -9.6533203125, -9.3043212890625, -8.955322265625, -8.6063232421875, -8.25732421875, -7.9083251953125, -7.559326171875, -7.2103271484375, -6.861328125, -6.5123291015625, -6.163330078125, -5.8143310546875, -5.46533203125, -5.1163330078125, -4.767333984375, -4.4183349609375, -4.0693359375, -3.7203369140625, -3.371337890625, -3.0223388671875, -2.67333984375, -2.3243408203125, -1.975341796875, -1.6263427734375, -1.27734375, -0.9283447265625, -0.579345703125, -0.2303466796875, 0.11865234375, 0.4676513671875, 0.816650390625, 1.1656494140625, 1.5146484375, 1.8636474609375, 2.212646484375, 2.5616455078125, 2.91064453125, 3.2596435546875, 3.608642578125, 3.9576416015625, 4.306640625, 4.6556396484375, 5.004638671875, 5.3536376953125, 5.70263671875, 6.0516357421875, 6.400634765625, 6.7496337890625, 7.0986328125, 7.4476318359375, 7.796630859375, 8.1456298828125, 8.49462890625, 8.8436279296875, 9.192626953125, 9.5416259765625, 9.890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 8.0, 10.0, 10.0, 15.0, 12.0, 17.0, 25.0, 20.0, 26.0, 41.0, 31.0, 49.0, 42.0, 40.0, 38.0, 53.0, 49.0, 49.0, 55.0, 47.0, 40.0, 45.0, 35.0, 37.0, 27.0, 44.0, 20.0, 27.0, 15.0, 20.0, 11.0, 11.0, 12.0, 4.0, 3.0, 1.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.2421875, -7.04638671875, -6.8505859375, -6.65478515625, -6.458984375, -6.26318359375, -6.0673828125, -5.87158203125, -5.67578125, -5.47998046875, -5.2841796875, -5.08837890625, -4.892578125, -4.69677734375, -4.5009765625, -4.30517578125, -4.109375, -3.91357421875, -3.7177734375, -3.52197265625, -3.326171875, -3.13037109375, -2.9345703125, -2.73876953125, -2.54296875, -2.34716796875, -2.1513671875, -1.95556640625, -1.759765625, -1.56396484375, -1.3681640625, -1.17236328125, -0.9765625, -0.78076171875, -0.5849609375, -0.38916015625, -0.193359375, 0.00244140625, 0.1982421875, 0.39404296875, 0.58984375, 0.78564453125, 0.9814453125, 1.17724609375, 1.373046875, 1.56884765625, 1.7646484375, 1.96044921875, 2.15625, 2.35205078125, 2.5478515625, 2.74365234375, 2.939453125, 3.13525390625, 3.3310546875, 3.52685546875, 3.72265625, 3.91845703125, 4.1142578125, 4.31005859375, 4.505859375, 4.70166015625, 4.8974609375, 5.09326171875, 5.2890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 13.0, 13.0, 21.0, 35.0, 51.0, 109.0, 189.0, 418.0, 1104.0, 3539.0, 14466.0, 93735.0, 726577.0, 178220.0, 22621.0, 4971.0, 1392.0, 570.0, 227.0, 121.0, 53.0, 44.0, 27.0, 14.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.86199951171875, -6.5716552734375, -6.28131103515625, -5.990966796875, -5.70062255859375, -5.4102783203125, -5.11993408203125, -4.82958984375, -4.53924560546875, -4.2489013671875, -3.95855712890625, -3.668212890625, -3.37786865234375, -3.0875244140625, -2.79718017578125, -2.5068359375, -2.21649169921875, -1.9261474609375, -1.63580322265625, -1.345458984375, -1.05511474609375, -0.7647705078125, -0.47442626953125, -0.18408203125, 0.10626220703125, 0.3966064453125, 0.68695068359375, 0.977294921875, 1.26763916015625, 1.5579833984375, 1.84832763671875, 2.138671875, 2.42901611328125, 2.7193603515625, 3.00970458984375, 3.300048828125, 3.59039306640625, 3.8807373046875, 4.17108154296875, 4.46142578125, 4.75177001953125, 5.0421142578125, 5.33245849609375, 5.622802734375, 5.91314697265625, 6.2034912109375, 6.49383544921875, 6.7841796875, 7.07452392578125, 7.3648681640625, 7.65521240234375, 7.945556640625, 8.23590087890625, 8.5262451171875, 8.81658935546875, 9.10693359375, 9.39727783203125, 9.6876220703125, 9.97796630859375, 10.268310546875, 10.55865478515625, 10.8489990234375, 11.13934326171875, 11.4296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 3.0, 8.0, 10.0, 13.0, 17.0, 15.0, 18.0, 36.0, 33.0, 53.0, 70.0, 79.0, 119.0, 98.0, 90.0, 69.0, 51.0, 41.0, 34.0, 22.0, 18.0, 18.0, 11.0, 9.0, 10.0, 6.0, 9.0, 3.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0005536079406738281, -0.0005383417010307312, -0.0005230754613876343, -0.0005078092217445374, -0.0004925429821014404, -0.0004772767424583435, -0.0004620105028152466, -0.00044674426317214966, -0.00043147802352905273, -0.0004162117838859558, -0.0004009455442428589, -0.00038567930459976196, -0.00037041306495666504, -0.0003551468253135681, -0.0003398805856704712, -0.00032461434602737427, -0.00030934810638427734, -0.0002940818667411804, -0.0002788156270980835, -0.00026354938745498657, -0.00024828314781188965, -0.00023301690816879272, -0.0002177506685256958, -0.00020248442888259888, -0.00018721818923950195, -0.00017195194959640503, -0.0001566857099533081, -0.00014141947031021118, -0.00012615323066711426, -0.00011088699102401733, -9.562075138092041e-05, -8.035451173782349e-05, -6.508827209472656e-05, -4.982203245162964e-05, -3.4555792808532715e-05, -1.928955316543579e-05, -4.023313522338867e-06, 1.1242926120758057e-05, 2.650916576385498e-05, 4.1775405406951904e-05, 5.704164505004883e-05, 7.230788469314575e-05, 8.757412433624268e-05, 0.0001028403639793396, 0.00011810660362243652, 0.00013337284326553345, 0.00014863908290863037, 0.0001639053225517273, 0.00017917156219482422, 0.00019443780183792114, 0.00020970404148101807, 0.000224970281124115, 0.00024023652076721191, 0.00025550276041030884, 0.00027076900005340576, 0.0002860352396965027, 0.0003013014793395996, 0.00031656771898269653, 0.00033183395862579346, 0.0003471001982688904, 0.0003623664379119873, 0.00037763267755508423, 0.00039289891719818115, 0.0004081651568412781, 0.000423431396484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 18.0, 32.0, 42.0, 96.0, 163.0, 303.0, 622.0, 1619.0, 5307.0, 26946.0, 271202.0, 671872.0, 56854.0, 9366.0, 2478.0, 821.0, 356.0, 174.0, 102.0, 60.0, 36.0, 27.0, 20.0, 11.0, 5.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -7.95751953125, -7.6416015625, -7.32568359375, -7.009765625, -6.69384765625, -6.3779296875, -6.06201171875, -5.74609375, -5.43017578125, -5.1142578125, -4.79833984375, -4.482421875, -4.16650390625, -3.8505859375, -3.53466796875, -3.21875, -2.90283203125, -2.5869140625, -2.27099609375, -1.955078125, -1.63916015625, -1.3232421875, -1.00732421875, -0.69140625, -0.37548828125, -0.0595703125, 0.25634765625, 0.572265625, 0.88818359375, 1.2041015625, 1.52001953125, 1.8359375, 2.15185546875, 2.4677734375, 2.78369140625, 3.099609375, 3.41552734375, 3.7314453125, 4.04736328125, 4.36328125, 4.67919921875, 4.9951171875, 5.31103515625, 5.626953125, 5.94287109375, 6.2587890625, 6.57470703125, 6.890625, 7.20654296875, 7.5224609375, 7.83837890625, 8.154296875, 8.47021484375, 8.7861328125, 9.10205078125, 9.41796875, 9.73388671875, 10.0498046875, 10.36572265625, 10.681640625, 10.99755859375, 11.3134765625, 11.62939453125, 11.9453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 12.0, 12.0, 7.0, 22.0, 21.0, 36.0, 49.0, 59.0, 76.0, 110.0, 141.0, 108.0, 94.0, 54.0, 48.0, 28.0, 24.0, 17.0, 18.0, 9.0, 3.0, 5.0, 5.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.16278076171875, -4.9935302734375, -4.82427978515625, -4.655029296875, -4.48577880859375, -4.3165283203125, -4.14727783203125, -3.97802734375, -3.80877685546875, -3.6395263671875, -3.47027587890625, -3.301025390625, -3.13177490234375, -2.9625244140625, -2.79327392578125, -2.6240234375, -2.45477294921875, -2.2855224609375, -2.11627197265625, -1.947021484375, -1.77777099609375, -1.6085205078125, -1.43927001953125, -1.27001953125, -1.10076904296875, -0.9315185546875, -0.76226806640625, -0.593017578125, -0.42376708984375, -0.2545166015625, -0.08526611328125, 0.083984375, 0.25323486328125, 0.4224853515625, 0.59173583984375, 0.760986328125, 0.93023681640625, 1.0994873046875, 1.26873779296875, 1.43798828125, 1.60723876953125, 1.7764892578125, 1.94573974609375, 2.114990234375, 2.28424072265625, 2.4534912109375, 2.62274169921875, 2.7919921875, 2.96124267578125, 3.1304931640625, 3.29974365234375, 3.468994140625, 3.63824462890625, 3.8074951171875, 3.97674560546875, 4.14599609375, 4.31524658203125, 4.4844970703125, 4.65374755859375, 4.822998046875, 4.99224853515625, 5.1614990234375, 5.33074951171875, 5.5]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 21.0, 29.0, 89.0, 202.0, 254.0, 220.0, 104.0, 45.0, 23.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.09078979492188, -127.86033630371094, -124.6298828125, -121.39942932128906, -118.16898345947266, -114.93852996826172, -111.70807647705078, -108.47762298583984, -105.24717712402344, -102.0167236328125, -98.78627014160156, -95.55581665039062, -92.32537078857422, -89.09491729736328, -85.86446380615234, -82.6340103149414, -79.40355682373047, -76.17310333251953, -72.9426498413086, -69.71220397949219, -66.48175048828125, -63.25129699707031, -60.020843505859375, -56.79039001464844, -53.559940338134766, -50.32948684692383, -47.099037170410156, -43.86858367919922, -40.63813018798828, -37.40768051147461, -34.17722702026367, -30.946775436401367, -27.716331481933594, -24.48587989807129, -21.255428314208984, -18.024974822998047, -14.794523239135742, -11.564071655273438, -8.3336181640625, -5.103166580200195, -1.8727149963378906, 1.3577370643615723, 4.588189125061035, 7.818641662597656, 11.049093246459961, 14.279544830322266, 17.509998321533203, 20.740449905395508, 23.970901489257812, 27.201353073120117, 30.431804656982422, 33.66225814819336, 36.89270782470703, 40.12316131591797, 43.353614807128906, 46.584068298339844, 49.814517974853516, 53.04497146606445, 56.275421142578125, 59.50587463378906, 62.736328125, 65.96678161621094, 69.19723510742188, 72.42768096923828, 75.65813446044922]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 10.0, 12.0, 19.0, 18.0, 25.0, 28.0, 34.0, 33.0, 34.0, 35.0, 36.0, 43.0, 47.0, 47.0, 47.0, 39.0, 43.0, 45.0, 42.0, 45.0, 23.0, 36.0, 35.0, 36.0, 23.0, 29.0, 15.0, 14.0, 12.0, 13.0, 10.0, 13.0, 5.0, 8.0, 10.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.629146575927734, -30.551347732543945, -29.473546981811523, -28.395748138427734, -27.317949295043945, -26.240150451660156, -25.162349700927734, -24.084550857543945, -23.006752014160156, -21.928953170776367, -20.851152420043945, -19.773353576660156, -18.695554733276367, -17.617755889892578, -16.539955139160156, -15.462156295776367, -14.384355545043945, -13.30655574798584, -12.22875690460205, -11.150957107543945, -10.073158264160156, -8.99535846710205, -7.917558670043945, -6.839759349822998, -5.761960029602051, -4.6841607093811035, -3.606361150741577, -2.528561592102051, -1.4507622718811035, -0.37296295166015625, 0.7048368453979492, 1.7826361656188965, 2.8604354858398438, 3.938234806060791, 5.016034126281738, 6.093833923339844, 7.171633243560791, 8.249432563781738, 9.327232360839844, 10.405031204223633, 11.482831001281738, 12.560630798339844, 13.638429641723633, 14.716229438781738, 15.794029235839844, 16.871828079223633, 17.949626922607422, 19.027427673339844, 20.105226516723633, 21.183025360107422, 22.260826110839844, 23.338624954223633, 24.416423797607422, 25.494224548339844, 26.572023391723633, 27.649822235107422, 28.727622985839844, 29.805421829223633, 30.883222579956055, 31.961021423339844, 33.038822174072266, 34.11661911010742, 35.194419860839844, 36.272220611572266, 37.35001754760742]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 22.0, 22.0, 37.0, 64.0, 87.0, 125.0, 200.0, 346.0, 750.0, 1586.0, 4077.0, 12594.0, 61910.0, 3211394.0, 839898.0, 44900.0, 10170.0, 3331.0, 1368.0, 590.0, 337.0, 138.0, 105.0, 53.0, 45.0, 25.0, 17.0, 10.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.604248046875, -11.21630859375, -10.828369140625, -10.4404296875, -10.052490234375, -9.66455078125, -9.276611328125, -8.888671875, -8.500732421875, -8.11279296875, -7.724853515625, -7.3369140625, -6.948974609375, -6.56103515625, -6.173095703125, -5.78515625, -5.397216796875, -5.00927734375, -4.621337890625, -4.2333984375, -3.845458984375, -3.45751953125, -3.069580078125, -2.681640625, -2.293701171875, -1.90576171875, -1.517822265625, -1.1298828125, -0.741943359375, -0.35400390625, 0.033935546875, 0.421875, 0.809814453125, 1.19775390625, 1.585693359375, 1.9736328125, 2.361572265625, 2.74951171875, 3.137451171875, 3.525390625, 3.913330078125, 4.30126953125, 4.689208984375, 5.0771484375, 5.465087890625, 5.85302734375, 6.240966796875, 6.62890625, 7.016845703125, 7.40478515625, 7.792724609375, 8.1806640625, 8.568603515625, 8.95654296875, 9.344482421875, 9.732421875, 10.120361328125, 10.50830078125, 10.896240234375, 11.2841796875, 11.672119140625, 12.06005859375, 12.447998046875, 12.8359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 7.0, 9.0, 7.0, 10.0, 18.0, 17.0, 29.0, 31.0, 40.0, 51.0, 72.0, 54.0, 68.0, 54.0, 65.0, 74.0, 55.0, 50.0, 61.0, 40.0, 37.0, 27.0, 34.0, 29.0, 14.0, 9.0, 13.0, 11.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.1935882568359375, -2.139129638671875, -2.0846710205078125, -2.03021240234375, -1.9757537841796875, -1.921295166015625, -1.8668365478515625, -1.8123779296875, -1.7579193115234375, -1.703460693359375, -1.6490020751953125, -1.59454345703125, -1.5400848388671875, -1.485626220703125, -1.4311676025390625, -1.376708984375, -1.3222503662109375, -1.267791748046875, -1.2133331298828125, -1.15887451171875, -1.1044158935546875, -1.049957275390625, -0.9954986572265625, -0.9410400390625, -0.8865814208984375, -0.832122802734375, -0.7776641845703125, -0.72320556640625, -0.6687469482421875, -0.614288330078125, -0.5598297119140625, -0.50537109375, -0.4509124755859375, -0.396453857421875, -0.3419952392578125, -0.28753662109375, -0.2330780029296875, -0.178619384765625, -0.1241607666015625, -0.0697021484375, -0.0152435302734375, 0.039215087890625, 0.0936737060546875, 0.14813232421875, 0.2025909423828125, 0.257049560546875, 0.3115081787109375, 0.365966796875, 0.4204254150390625, 0.474884033203125, 0.5293426513671875, 0.58380126953125, 0.6382598876953125, 0.692718505859375, 0.7471771240234375, 0.8016357421875, 0.8560943603515625, 0.910552978515625, 0.9650115966796875, 1.01947021484375, 1.0739288330078125, 1.128387451171875, 1.1828460693359375, 1.2373046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 1.0, 10.0, 17.0, 20.0, 36.0, 64.0, 60.0, 118.0, 193.0, 348.0, 849.0, 3010.0, 21997.0, 1870014.0, 2269190.0, 23390.0, 3070.0, 935.0, 371.0, 206.0, 142.0, 74.0, 48.0, 28.0, 24.0, 20.0, 12.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.306640625, -19.69140625, -19.076171875, -18.4609375, -17.845703125, -17.23046875, -16.615234375, -16.0, -15.384765625, -14.76953125, -14.154296875, -13.5390625, -12.923828125, -12.30859375, -11.693359375, -11.078125, -10.462890625, -9.84765625, -9.232421875, -8.6171875, -8.001953125, -7.38671875, -6.771484375, -6.15625, -5.541015625, -4.92578125, -4.310546875, -3.6953125, -3.080078125, -2.46484375, -1.849609375, -1.234375, -0.619140625, -0.00390625, 0.611328125, 1.2265625, 1.841796875, 2.45703125, 3.072265625, 3.6875, 4.302734375, 4.91796875, 5.533203125, 6.1484375, 6.763671875, 7.37890625, 7.994140625, 8.609375, 9.224609375, 9.83984375, 10.455078125, 11.0703125, 11.685546875, 12.30078125, 12.916015625, 13.53125, 14.146484375, 14.76171875, 15.376953125, 15.9921875, 16.607421875, 17.22265625, 17.837890625, 18.453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 11.0, 17.0, 32.0, 55.0, 88.0, 183.0, 498.0, 1886.0, 762.0, 218.0, 108.0, 79.0, 36.0, 27.0, 15.0, 11.0, 11.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.67315673828125, -4.5299072265625, -4.38665771484375, -4.243408203125, -4.10015869140625, -3.9569091796875, -3.81365966796875, -3.67041015625, -3.52716064453125, -3.3839111328125, -3.24066162109375, -3.097412109375, -2.95416259765625, -2.8109130859375, -2.66766357421875, -2.5244140625, -2.38116455078125, -2.2379150390625, -2.09466552734375, -1.951416015625, -1.80816650390625, -1.6649169921875, -1.52166748046875, -1.37841796875, -1.23516845703125, -1.0919189453125, -0.94866943359375, -0.805419921875, -0.66217041015625, -0.5189208984375, -0.37567138671875, -0.232421875, -0.08917236328125, 0.0540771484375, 0.19732666015625, 0.340576171875, 0.48382568359375, 0.6270751953125, 0.77032470703125, 0.91357421875, 1.05682373046875, 1.2000732421875, 1.34332275390625, 1.486572265625, 1.62982177734375, 1.7730712890625, 1.91632080078125, 2.0595703125, 2.20281982421875, 2.3460693359375, 2.48931884765625, 2.632568359375, 2.77581787109375, 2.9190673828125, 3.06231689453125, 3.20556640625, 3.34881591796875, 3.4920654296875, 3.63531494140625, 3.778564453125, 3.92181396484375, 4.0650634765625, 4.20831298828125, 4.3515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 61.0, 271.0, 406.0, 196.0, 49.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.64601135253906, -46.456756591796875, -44.26750183105469, -42.0782470703125, -39.88899230957031, -37.699737548828125, -35.51047897338867, -33.321224212646484, -31.131969451904297, -28.94271469116211, -26.753459930419922, -24.5642032623291, -22.374948501586914, -20.185693740844727, -17.996437072753906, -15.807182312011719, -13.617927551269531, -11.428672790527344, -9.23941707611084, -7.050161838531494, -4.860906600952148, -2.671651840209961, -0.48239612579345703, 1.7068595886230469, 3.8961143493652344, 6.08536958694458, 8.274624824523926, 10.46388053894043, 12.653135299682617, 14.842390060424805, 17.031646728515625, 19.220901489257812, 21.41014862060547, 23.599403381347656, 25.788658142089844, 27.977914810180664, 30.16716957092285, 32.356422424316406, 34.54568099975586, 36.73493576049805, 38.924190521240234, 41.11344528198242, 43.30270004272461, 45.4919548034668, 47.68121337890625, 49.87046813964844, 52.059722900390625, 54.24897766113281, 56.438232421875, 58.62748718261719, 60.816741943359375, 63.00599670410156, 65.19525146484375, 67.38450622558594, 69.57376098632812, 71.76301574707031, 73.9522705078125, 76.14152526855469, 78.33078002929688, 80.52003479003906, 82.70928955078125, 84.89854431152344, 87.08779907226562, 89.27705383300781, 91.46631622314453]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 15.0, 16.0, 23.0, 26.0, 25.0, 33.0, 43.0, 50.0, 58.0, 63.0, 52.0, 46.0, 59.0, 52.0, 51.0, 54.0, 32.0, 49.0, 45.0, 34.0, 37.0, 33.0, 11.0, 21.0, 19.0, 11.0, 4.0, 5.0, 6.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.039474487304688, -13.590597152709961, -13.14172077178955, -12.692843437194824, -12.243967056274414, -11.795089721679688, -11.346212387084961, -10.897335052490234, -10.448458671569824, -9.999581336975098, -9.550704956054688, -9.101827621459961, -8.652950286865234, -8.204073905944824, -7.755196571350098, -7.306319713592529, -6.857442855834961, -6.408565998077393, -5.959689140319824, -5.510811805725098, -5.061934947967529, -4.613058090209961, -4.164180755615234, -3.715303897857666, -3.2664270401000977, -2.8175501823425293, -2.368673086166382, -1.919796109199524, -1.470919132232666, -1.0220422744750977, -0.5731651782989502, -0.12428808212280273, 0.3245878219604492, 0.7734647989273071, 1.222341775894165, 1.671218752861023, 2.120095729827881, 2.568972587585449, 3.0178496837615967, 3.466726779937744, 3.9156036376953125, 4.364480495452881, 4.813357353210449, 5.262234687805176, 5.711111545562744, 6.1599884033203125, 6.608865737915039, 7.057742595672607, 7.506619453430176, 7.955496311187744, 8.404373168945312, 8.853250503540039, 9.302127838134766, 9.751004219055176, 10.199881553649902, 10.648757934570312, 11.097635269165039, 11.546512603759766, 11.995388984680176, 12.444266319274902, 12.893142700195312, 13.342020034790039, 13.790897369384766, 14.239774703979492, 14.688651084899902]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 13.0, 8.0, 22.0, 47.0, 66.0, 156.0, 245.0, 509.0, 1378.0, 4553.0, 19249.0, 114021.0, 554924.0, 292892.0, 47237.0, 9036.0, 2443.0, 902.0, 402.0, 197.0, 102.0, 59.0, 28.0, 19.0, 10.0, 9.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.6260986328125, -14.205322265625, -13.7845458984375, -13.36376953125, -12.9429931640625, -12.522216796875, -12.1014404296875, -11.6806640625, -11.2598876953125, -10.839111328125, -10.4183349609375, -9.99755859375, -9.5767822265625, -9.156005859375, -8.7352294921875, -8.314453125, -7.8936767578125, -7.472900390625, -7.0521240234375, -6.63134765625, -6.2105712890625, -5.789794921875, -5.3690185546875, -4.9482421875, -4.5274658203125, -4.106689453125, -3.6859130859375, -3.26513671875, -2.8443603515625, -2.423583984375, -2.0028076171875, -1.58203125, -1.1612548828125, -0.740478515625, -0.3197021484375, 0.10107421875, 0.5218505859375, 0.942626953125, 1.3634033203125, 1.7841796875, 2.2049560546875, 2.625732421875, 3.0465087890625, 3.46728515625, 3.8880615234375, 4.308837890625, 4.7296142578125, 5.150390625, 5.5711669921875, 5.991943359375, 6.4127197265625, 6.83349609375, 7.2542724609375, 7.675048828125, 8.0958251953125, 8.5166015625, 8.9373779296875, 9.358154296875, 9.7789306640625, 10.19970703125, 10.6204833984375, 11.041259765625, 11.4620361328125, 11.8828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 16.0, 17.0, 22.0, 22.0, 31.0, 31.0, 41.0, 61.0, 70.0, 68.0, 63.0, 68.0, 61.0, 53.0, 55.0, 49.0, 60.0, 35.0, 37.0, 30.0, 30.0, 17.0, 18.0, 8.0, 8.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.218017578125, -2.16064453125, -2.103271484375, -2.0458984375, -1.988525390625, -1.93115234375, -1.873779296875, -1.81640625, -1.759033203125, -1.70166015625, -1.644287109375, -1.5869140625, -1.529541015625, -1.47216796875, -1.414794921875, -1.357421875, -1.300048828125, -1.24267578125, -1.185302734375, -1.1279296875, -1.070556640625, -1.01318359375, -0.955810546875, -0.8984375, -0.841064453125, -0.78369140625, -0.726318359375, -0.6689453125, -0.611572265625, -0.55419921875, -0.496826171875, -0.439453125, -0.382080078125, -0.32470703125, -0.267333984375, -0.2099609375, -0.152587890625, -0.09521484375, -0.037841796875, 0.01953125, 0.076904296875, 0.13427734375, 0.191650390625, 0.2490234375, 0.306396484375, 0.36376953125, 0.421142578125, 0.478515625, 0.535888671875, 0.59326171875, 0.650634765625, 0.7080078125, 0.765380859375, 0.82275390625, 0.880126953125, 0.9375, 0.994873046875, 1.05224609375, 1.109619140625, 1.1669921875, 1.224365234375, 1.28173828125, 1.339111328125, 1.396484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 12.0, 14.0, 13.0, 45.0, 41.0, 59.0, 84.0, 109.0, 176.0, 258.0, 355.0, 659.0, 1482.0, 4197.0, 16923.0, 90841.0, 458455.0, 384076.0, 70120.0, 13763.0, 3736.0, 1376.0, 660.0, 383.0, 224.0, 142.0, 109.0, 56.0, 47.0, 33.0, 22.0, 16.0, 18.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.09375, -10.7933349609375, -10.492919921875, -10.1925048828125, -9.89208984375, -9.5916748046875, -9.291259765625, -8.9908447265625, -8.6904296875, -8.3900146484375, -8.089599609375, -7.7891845703125, -7.48876953125, -7.1883544921875, -6.887939453125, -6.5875244140625, -6.287109375, -5.9866943359375, -5.686279296875, -5.3858642578125, -5.08544921875, -4.7850341796875, -4.484619140625, -4.1842041015625, -3.8837890625, -3.5833740234375, -3.282958984375, -2.9825439453125, -2.68212890625, -2.3817138671875, -2.081298828125, -1.7808837890625, -1.48046875, -1.1800537109375, -0.879638671875, -0.5792236328125, -0.27880859375, 0.0216064453125, 0.322021484375, 0.6224365234375, 0.9228515625, 1.2232666015625, 1.523681640625, 1.8240966796875, 2.12451171875, 2.4249267578125, 2.725341796875, 3.0257568359375, 3.326171875, 3.6265869140625, 3.927001953125, 4.2274169921875, 4.52783203125, 4.8282470703125, 5.128662109375, 5.4290771484375, 5.7294921875, 6.0299072265625, 6.330322265625, 6.6307373046875, 6.93115234375, 7.2315673828125, 7.531982421875, 7.8323974609375, 8.1328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 7.0, 7.0, 18.0, 11.0, 7.0, 16.0, 18.0, 27.0, 16.0, 18.0, 30.0, 32.0, 26.0, 34.0, 52.0, 43.0, 40.0, 26.0, 38.0, 38.0, 33.0, 31.0, 43.0, 28.0, 47.0, 54.0, 42.0, 32.0, 37.0, 25.0, 23.0, 25.0, 14.0, 11.0, 14.0, 6.0, 2.0, 7.0, 2.0, 6.0, 9.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.671875, -6.48712158203125, -6.3023681640625, -6.11761474609375, -5.932861328125, -5.74810791015625, -5.5633544921875, -5.37860107421875, -5.19384765625, -5.00909423828125, -4.8243408203125, -4.63958740234375, -4.454833984375, -4.27008056640625, -4.0853271484375, -3.90057373046875, -3.7158203125, -3.53106689453125, -3.3463134765625, -3.16156005859375, -2.976806640625, -2.79205322265625, -2.6072998046875, -2.42254638671875, -2.23779296875, -2.05303955078125, -1.8682861328125, -1.68353271484375, -1.498779296875, -1.31402587890625, -1.1292724609375, -0.94451904296875, -0.759765625, -0.57501220703125, -0.3902587890625, -0.20550537109375, -0.020751953125, 0.16400146484375, 0.3487548828125, 0.53350830078125, 0.71826171875, 0.90301513671875, 1.0877685546875, 1.27252197265625, 1.457275390625, 1.64202880859375, 1.8267822265625, 2.01153564453125, 2.1962890625, 2.38104248046875, 2.5657958984375, 2.75054931640625, 2.935302734375, 3.12005615234375, 3.3048095703125, 3.48956298828125, 3.67431640625, 3.85906982421875, 4.0438232421875, 4.22857666015625, 4.413330078125, 4.59808349609375, 4.7828369140625, 4.96759033203125, 5.15234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 11.0, 15.0, 15.0, 32.0, 54.0, 73.0, 159.0, 263.0, 477.0, 962.0, 1839.0, 4304.0, 10925.0, 32352.0, 133201.0, 565686.0, 226006.0, 46868.0, 14843.0, 5589.0, 2468.0, 1147.0, 571.0, 276.0, 170.0, 100.0, 54.0, 29.0, 18.0, 14.0, 11.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.35455322265625, -5.1739501953125, -4.99334716796875, -4.812744140625, -4.63214111328125, -4.4515380859375, -4.27093505859375, -4.09033203125, -3.90972900390625, -3.7291259765625, -3.54852294921875, -3.367919921875, -3.18731689453125, -3.0067138671875, -2.82611083984375, -2.6455078125, -2.46490478515625, -2.2843017578125, -2.10369873046875, -1.923095703125, -1.74249267578125, -1.5618896484375, -1.38128662109375, -1.20068359375, -1.02008056640625, -0.8394775390625, -0.65887451171875, -0.478271484375, -0.29766845703125, -0.1170654296875, 0.06353759765625, 0.244140625, 0.42474365234375, 0.6053466796875, 0.78594970703125, 0.966552734375, 1.14715576171875, 1.3277587890625, 1.50836181640625, 1.68896484375, 1.86956787109375, 2.0501708984375, 2.23077392578125, 2.411376953125, 2.59197998046875, 2.7725830078125, 2.95318603515625, 3.1337890625, 3.31439208984375, 3.4949951171875, 3.67559814453125, 3.856201171875, 4.03680419921875, 4.2174072265625, 4.39801025390625, 4.57861328125, 4.75921630859375, 4.9398193359375, 5.12042236328125, 5.301025390625, 5.48162841796875, 5.6622314453125, 5.84283447265625, 6.0234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 8.0, 7.0, 18.0, 11.0, 12.0, 11.0, 26.0, 22.0, 26.0, 33.0, 36.0, 59.0, 64.0, 76.0, 88.0, 82.0, 77.0, 65.0, 53.0, 43.0, 24.0, 34.0, 23.0, 20.0, 10.0, 14.0, 7.0, 9.0, 4.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004901885986328125, -0.00047479569911956787, -0.00045940279960632324, -0.0004440099000930786, -0.000428617000579834, -0.00041322410106658936, -0.0003978312015533447, -0.0003824383020401001, -0.00036704540252685547, -0.00035165250301361084, -0.0003362596035003662, -0.0003208667039871216, -0.00030547380447387695, -0.0002900809049606323, -0.0002746880054473877, -0.00025929510593414307, -0.00024390220642089844, -0.0002285093069076538, -0.00021311640739440918, -0.00019772350788116455, -0.00018233060836791992, -0.0001669377088546753, -0.00015154480934143066, -0.00013615190982818604, -0.0001207590103149414, -0.00010536611080169678, -8.997321128845215e-05, -7.458031177520752e-05, -5.918741226196289e-05, -4.379451274871826e-05, -2.8401613235473633e-05, -1.3008713722229004e-05, 2.384185791015625e-06, 1.7777085304260254e-05, 3.316998481750488e-05, 4.856288433074951e-05, 6.395578384399414e-05, 7.934868335723877e-05, 9.47415828704834e-05, 0.00011013448238372803, 0.00012552738189697266, 0.00014092028141021729, 0.00015631318092346191, 0.00017170608043670654, 0.00018709897994995117, 0.0002024918794631958, 0.00021788477897644043, 0.00023327767848968506, 0.0002486705780029297, 0.0002640634775161743, 0.00027945637702941895, 0.0002948492765426636, 0.0003102421760559082, 0.00032563507556915283, 0.00034102797508239746, 0.0003564208745956421, 0.0003718137741088867, 0.00038720667362213135, 0.000402599573135376, 0.0004179924726486206, 0.00043338537216186523, 0.00044877827167510986, 0.0004641711711883545, 0.0004795640707015991, 0.0004949569702148438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 19.0, 39.0, 44.0, 45.0, 92.0, 154.0, 234.0, 360.0, 689.0, 1372.0, 3019.0, 7981.0, 25107.0, 117344.0, 644790.0, 194136.0, 35089.0, 10373.0, 3946.0, 1657.0, 802.0, 448.0, 268.0, 182.0, 112.0, 66.0, 40.0, 29.0, 13.0, 21.0, 14.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.609375, -6.400390625, -6.19140625, -5.982421875, -5.7734375, -5.564453125, -5.35546875, -5.146484375, -4.9375, -4.728515625, -4.51953125, -4.310546875, -4.1015625, -3.892578125, -3.68359375, -3.474609375, -3.265625, -3.056640625, -2.84765625, -2.638671875, -2.4296875, -2.220703125, -2.01171875, -1.802734375, -1.59375, -1.384765625, -1.17578125, -0.966796875, -0.7578125, -0.548828125, -0.33984375, -0.130859375, 0.078125, 0.287109375, 0.49609375, 0.705078125, 0.9140625, 1.123046875, 1.33203125, 1.541015625, 1.75, 1.958984375, 2.16796875, 2.376953125, 2.5859375, 2.794921875, 3.00390625, 3.212890625, 3.421875, 3.630859375, 3.83984375, 4.048828125, 4.2578125, 4.466796875, 4.67578125, 4.884765625, 5.09375, 5.302734375, 5.51171875, 5.720703125, 5.9296875, 6.138671875, 6.34765625, 6.556640625, 6.765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 7.0, 7.0, 8.0, 8.0, 10.0, 16.0, 24.0, 35.0, 51.0, 63.0, 78.0, 139.0, 140.0, 115.0, 79.0, 69.0, 35.0, 31.0, 21.0, 23.0, 10.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.968017578125, -4.79150390625, -4.614990234375, -4.4384765625, -4.261962890625, -4.08544921875, -3.908935546875, -3.732421875, -3.555908203125, -3.37939453125, -3.202880859375, -3.0263671875, -2.849853515625, -2.67333984375, -2.496826171875, -2.3203125, -2.143798828125, -1.96728515625, -1.790771484375, -1.6142578125, -1.437744140625, -1.26123046875, -1.084716796875, -0.908203125, -0.731689453125, -0.55517578125, -0.378662109375, -0.2021484375, -0.025634765625, 0.15087890625, 0.327392578125, 0.50390625, 0.680419921875, 0.85693359375, 1.033447265625, 1.2099609375, 1.386474609375, 1.56298828125, 1.739501953125, 1.916015625, 2.092529296875, 2.26904296875, 2.445556640625, 2.6220703125, 2.798583984375, 2.97509765625, 3.151611328125, 3.328125, 3.504638671875, 3.68115234375, 3.857666015625, 4.0341796875, 4.210693359375, 4.38720703125, 4.563720703125, 4.740234375, 4.916748046875, 5.09326171875, 5.269775390625, 5.4462890625, 5.622802734375, 5.79931640625, 5.975830078125, 6.15234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 27.0, 100.0, 307.0, 342.0, 153.0, 53.0, 11.0, 11.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.28428649902344, -240.19454956054688, -235.1048126220703, -230.01507568359375, -224.92532348632812, -219.83558654785156, -214.745849609375, -209.65611267089844, -204.56637573242188, -199.4766387939453, -194.38690185546875, -189.2971649169922, -184.20742797851562, -179.11767578125, -174.02793884277344, -168.93820190429688, -163.8484649658203, -158.75872802734375, -153.6689910888672, -148.57925415039062, -143.489501953125, -138.39976501464844, -133.31002807617188, -128.2202911376953, -123.13055419921875, -118.04081726074219, -112.95108032226562, -107.86133575439453, -102.77159881591797, -97.6818618774414, -92.59211730957031, -87.50238037109375, -82.41265869140625, -77.32292175292969, -72.23318481445312, -67.14344024658203, -62.05370330810547, -56.963966369628906, -51.87422561645508, -46.78448486328125, -41.69474792480469, -36.605010986328125, -31.515270233154297, -26.4255313873291, -21.335792541503906, -16.24605369567871, -11.156314849853516, -6.0665740966796875, -0.976837158203125, 4.11290168762207, 9.202640533447266, 14.292379379272461, 19.382118225097656, 24.47185707092285, 29.561595916748047, 34.651336669921875, 39.74107360839844, 44.830810546875, 49.92055130004883, 55.010292053222656, 60.10002899169922, 65.18976593017578, 70.27951049804688, 75.36924743652344, 80.458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 3.0, 2.0, 6.0, 13.0, 20.0, 22.0, 26.0, 22.0, 31.0, 36.0, 46.0, 52.0, 50.0, 61.0, 67.0, 60.0, 71.0, 69.0, 52.0, 59.0, 45.0, 38.0, 35.0, 26.0, 16.0, 19.0, 13.0, 10.0, 5.0, 5.0, 7.0, 7.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.400238037109375, -60.77083969116211, -59.14144515991211, -57.512046813964844, -55.882652282714844, -54.25325393676758, -52.62385559082031, -50.99446105957031, -49.36506271362305, -47.73566436767578, -46.10626983642578, -44.476871490478516, -42.847476959228516, -41.21807861328125, -39.58868408203125, -37.959285736083984, -36.32988739013672, -34.70048904418945, -33.07109451293945, -31.441696166992188, -29.812299728393555, -28.182903289794922, -26.55350685119629, -24.924110412597656, -23.294715881347656, -21.665319442749023, -20.03592300415039, -18.406524658203125, -16.777128219604492, -15.14773178100586, -13.518335342407227, -11.888937950134277, -10.259540557861328, -8.630144119262695, -7.000746726989746, -5.371350288391113, -3.7419533729553223, -2.1125564575195312, -0.48316001892089844, 1.1462373733520508, 2.7756338119506836, 4.405030727386475, 6.034427642822266, 7.663824081420898, 9.293220520019531, 10.92261791229248, 12.552014350891113, 14.181411743164062, 15.810808181762695, 17.440204620361328, 19.06960105895996, 20.698997497558594, 22.32839584350586, 23.957792282104492, 25.587188720703125, 27.21658706665039, 28.84598159790039, 30.475378036499023, 32.104774475097656, 33.73417282104492, 35.36356735229492, 36.99296569824219, 38.62236022949219, 40.25175857543945, 41.88115692138672]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 10.0, 10.0, 10.0, 19.0, 20.0, 22.0, 41.0, 58.0, 79.0, 141.0, 163.0, 287.0, 477.0, 855.0, 1724.0, 3735.0, 9135.0, 28906.0, 135605.0, 3319166.0, 599520.0, 65754.0, 17112.0, 6019.0, 2560.0, 1257.0, 657.0, 360.0, 203.0, 137.0, 88.0, 48.0, 34.0, 22.0, 14.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.77099609375, -11.4326171875, -11.09423828125, -10.755859375, -10.41748046875, -10.0791015625, -9.74072265625, -9.40234375, -9.06396484375, -8.7255859375, -8.38720703125, -8.048828125, -7.71044921875, -7.3720703125, -7.03369140625, -6.6953125, -6.35693359375, -6.0185546875, -5.68017578125, -5.341796875, -5.00341796875, -4.6650390625, -4.32666015625, -3.98828125, -3.64990234375, -3.3115234375, -2.97314453125, -2.634765625, -2.29638671875, -1.9580078125, -1.61962890625, -1.28125, -0.94287109375, -0.6044921875, -0.26611328125, 0.072265625, 0.41064453125, 0.7490234375, 1.08740234375, 1.42578125, 1.76416015625, 2.1025390625, 2.44091796875, 2.779296875, 3.11767578125, 3.4560546875, 3.79443359375, 4.1328125, 4.47119140625, 4.8095703125, 5.14794921875, 5.486328125, 5.82470703125, 6.1630859375, 6.50146484375, 6.83984375, 7.17822265625, 7.5166015625, 7.85498046875, 8.193359375, 8.53173828125, 8.8701171875, 9.20849609375, 9.546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 6.0, 21.0, 28.0, 29.0, 46.0, 57.0, 68.0, 80.0, 98.0, 93.0, 91.0, 103.0, 73.0, 56.0, 55.0, 35.0, 28.0, 15.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.112457275390625, -4.01788330078125, -3.923309326171875, -3.8287353515625, -3.734161376953125, -3.63958740234375, -3.545013427734375, -3.450439453125, -3.355865478515625, -3.26129150390625, -3.166717529296875, -3.0721435546875, -2.977569580078125, -2.88299560546875, -2.788421630859375, -2.69384765625, -2.599273681640625, -2.50469970703125, -2.410125732421875, -2.3155517578125, -2.220977783203125, -2.12640380859375, -2.031829833984375, -1.937255859375, -1.842681884765625, -1.74810791015625, -1.653533935546875, -1.5589599609375, -1.464385986328125, -1.36981201171875, -1.275238037109375, -1.1806640625, -1.086090087890625, -0.99151611328125, -0.896942138671875, -0.8023681640625, -0.707794189453125, -0.61322021484375, -0.518646240234375, -0.424072265625, -0.329498291015625, -0.23492431640625, -0.140350341796875, -0.0457763671875, 0.048797607421875, 0.14337158203125, 0.237945556640625, 0.33251953125, 0.427093505859375, 0.52166748046875, 0.616241455078125, 0.7108154296875, 0.805389404296875, 0.89996337890625, 0.994537353515625, 1.089111328125, 1.183685302734375, 1.27825927734375, 1.372833251953125, 1.4674072265625, 1.561981201171875, 1.65655517578125, 1.751129150390625, 1.845703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 11.0, 8.0, 13.0, 53.0, 94.0, 257.0, 831.0, 3137.0, 19763.0, 401153.0, 3694950.0, 64773.0, 7028.0, 1468.0, 447.0, 141.0, 62.0, 36.0, 14.0, 16.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -22.0474853515625, -21.485595703125, -20.9237060546875, -20.36181640625, -19.7999267578125, -19.238037109375, -18.6761474609375, -18.1142578125, -17.5523681640625, -16.990478515625, -16.4285888671875, -15.86669921875, -15.3048095703125, -14.742919921875, -14.1810302734375, -13.619140625, -13.0572509765625, -12.495361328125, -11.9334716796875, -11.37158203125, -10.8096923828125, -10.247802734375, -9.6859130859375, -9.1240234375, -8.5621337890625, -8.000244140625, -7.4383544921875, -6.87646484375, -6.3145751953125, -5.752685546875, -5.1907958984375, -4.62890625, -4.0670166015625, -3.505126953125, -2.9432373046875, -2.38134765625, -1.8194580078125, -1.257568359375, -0.6956787109375, -0.1337890625, 0.4281005859375, 0.989990234375, 1.5518798828125, 2.11376953125, 2.6756591796875, 3.237548828125, 3.7994384765625, 4.361328125, 4.9232177734375, 5.485107421875, 6.0469970703125, 6.60888671875, 7.1707763671875, 7.732666015625, 8.2945556640625, 8.8564453125, 9.4183349609375, 9.980224609375, 10.5421142578125, 11.10400390625, 11.6658935546875, 12.227783203125, 12.7896728515625, 13.3515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 12.0, 15.0, 32.0, 47.0, 62.0, 113.0, 236.0, 527.0, 1606.0, 739.0, 283.0, 153.0, 70.0, 39.0, 42.0, 25.0, 23.0, 15.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.45880126953125, -5.2965087890625, -5.13421630859375, -4.971923828125, -4.80963134765625, -4.6473388671875, -4.48504638671875, -4.32275390625, -4.16046142578125, -3.9981689453125, -3.83587646484375, -3.673583984375, -3.51129150390625, -3.3489990234375, -3.18670654296875, -3.0244140625, -2.86212158203125, -2.6998291015625, -2.53753662109375, -2.375244140625, -2.21295166015625, -2.0506591796875, -1.88836669921875, -1.72607421875, -1.56378173828125, -1.4014892578125, -1.23919677734375, -1.076904296875, -0.91461181640625, -0.7523193359375, -0.59002685546875, -0.427734375, -0.26544189453125, -0.1031494140625, 0.05914306640625, 0.221435546875, 0.38372802734375, 0.5460205078125, 0.70831298828125, 0.87060546875, 1.03289794921875, 1.1951904296875, 1.35748291015625, 1.519775390625, 1.68206787109375, 1.8443603515625, 2.00665283203125, 2.1689453125, 2.33123779296875, 2.4935302734375, 2.65582275390625, 2.818115234375, 2.98040771484375, 3.1427001953125, 3.30499267578125, 3.46728515625, 3.62957763671875, 3.7918701171875, 3.95416259765625, 4.116455078125, 4.27874755859375, 4.4410400390625, 4.60333251953125, 4.765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 13.0, 16.0, 29.0, 49.0, 95.0, 117.0, 139.0, 133.0, 128.0, 97.0, 50.0, 41.0, 39.0, 19.0, 9.0, 12.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.46781539916992, -32.674476623535156, -31.881141662597656, -31.08780288696289, -30.294466018676758, -29.501129150390625, -28.70779037475586, -27.914453506469727, -27.121116638183594, -26.32777976989746, -25.534442901611328, -24.741104125976562, -23.94776725769043, -23.154430389404297, -22.36109161376953, -21.5677547454834, -20.774417877197266, -19.981081008911133, -19.187744140625, -18.394405364990234, -17.6010684967041, -16.80773162841797, -16.014392852783203, -15.22105598449707, -14.427719116210938, -13.634382247924805, -12.841044425964355, -12.047706604003906, -11.254369735717773, -10.46103286743164, -9.667695045471191, -8.874357223510742, -8.081018447875977, -7.2876811027526855, -6.4943437576293945, -5.7010064125061035, -4.9076690673828125, -4.1143317222595215, -3.3209943771362305, -2.5276570320129395, -1.7343196868896484, -0.9409823417663574, -0.1476449966430664, 0.6456923484802246, 1.4390296936035156, 2.2323670387268066, 3.0257043838500977, 3.8190417289733887, 4.61237907409668, 5.405716419219971, 6.199053764343262, 6.992391109466553, 7.785728454589844, 8.579065322875977, 9.372403144836426, 10.165740966796875, 10.959077835083008, 11.75241470336914, 12.54575252532959, 13.339090347290039, 14.132427215576172, 14.925764083862305, 15.719101905822754, 16.512439727783203, 17.305776596069336]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 10.0, 20.0, 14.0, 35.0, 36.0, 49.0, 48.0, 49.0, 54.0, 58.0, 65.0, 76.0, 73.0, 67.0, 60.0, 49.0, 52.0, 45.0, 23.0, 29.0, 26.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.450559616088867, -13.835054397583008, -13.219550132751465, -12.604044914245605, -11.988539695739746, -11.373035430908203, -10.757530212402344, -10.142024993896484, -9.526519775390625, -8.911014556884766, -8.295510292053223, -7.680005073547363, -7.064499855041504, -6.448995113372803, -5.833490371704102, -5.217985153198242, -4.602480888366699, -3.986975908279419, -3.3714709281921387, -2.7559661865234375, -2.1404612064361572, -1.524956226348877, -0.9094514846801758, -0.2939462661743164, 0.32155847549438477, 0.9370633959770203, 1.5525683164596558, 2.1680731773376465, 2.7835781574249268, 3.399083137512207, 4.014587879180908, 4.630093097686768, 5.245597839355469, 5.86110258102417, 6.476607799530029, 7.0921125411987305, 7.70761775970459, 8.323122024536133, 8.938627243041992, 9.554132461547852, 10.169637680053711, 10.78514289855957, 11.400647163391113, 12.016152381896973, 12.631657600402832, 13.247161865234375, 13.862667083740234, 14.478172302246094, 15.093676567077637, 15.709181785583496, 16.32468605041504, 16.9401912689209, 17.555696487426758, 18.171201705932617, 18.786705017089844, 19.402210235595703, 20.017715454101562, 20.633220672607422, 21.24872589111328, 21.86423110961914, 22.479734420776367, 23.095239639282227, 23.710744857788086, 24.326250076293945, 24.941755294799805]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 23.0, 25.0, 44.0, 62.0, 81.0, 121.0, 195.0, 297.0, 558.0, 1009.0, 1789.0, 3472.0, 7355.0, 17490.0, 48526.0, 167371.0, 531102.0, 183203.0, 51307.0, 18565.0, 7817.0, 3638.0, 1908.0, 976.0, 581.0, 339.0, 217.0, 141.0, 85.0, 72.0, 37.0, 36.0, 23.0, 19.0, 14.0, 6.0, 3.0, 7.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.203125, -7.9344482421875, -7.665771484375, -7.3970947265625, -7.12841796875, -6.8597412109375, -6.591064453125, -6.3223876953125, -6.0537109375, -5.7850341796875, -5.516357421875, -5.2476806640625, -4.97900390625, -4.7103271484375, -4.441650390625, -4.1729736328125, -3.904296875, -3.6356201171875, -3.366943359375, -3.0982666015625, -2.82958984375, -2.5609130859375, -2.292236328125, -2.0235595703125, -1.7548828125, -1.4862060546875, -1.217529296875, -0.9488525390625, -0.68017578125, -0.4114990234375, -0.142822265625, 0.1258544921875, 0.39453125, 0.6632080078125, 0.931884765625, 1.2005615234375, 1.46923828125, 1.7379150390625, 2.006591796875, 2.2752685546875, 2.5439453125, 2.8126220703125, 3.081298828125, 3.3499755859375, 3.61865234375, 3.8873291015625, 4.156005859375, 4.4246826171875, 4.693359375, 4.9620361328125, 5.230712890625, 5.4993896484375, 5.76806640625, 6.0367431640625, 6.305419921875, 6.5740966796875, 6.8427734375, 7.1114501953125, 7.380126953125, 7.6488037109375, 7.91748046875, 8.1861572265625, 8.454833984375, 8.7235107421875, 8.9921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 2.0, 3.0, 12.0, 17.0, 17.0, 28.0, 22.0, 32.0, 28.0, 40.0, 32.0, 48.0, 45.0, 47.0, 65.0, 54.0, 50.0, 58.0, 57.0, 50.0, 33.0, 48.0, 34.0, 41.0, 31.0, 29.0, 13.0, 17.0, 6.0, 12.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9599609375, -1.902008056640625, -1.84405517578125, -1.786102294921875, -1.7281494140625, -1.670196533203125, -1.61224365234375, -1.554290771484375, -1.496337890625, -1.438385009765625, -1.38043212890625, -1.322479248046875, -1.2645263671875, -1.206573486328125, -1.14862060546875, -1.090667724609375, -1.03271484375, -0.974761962890625, -0.91680908203125, -0.858856201171875, -0.8009033203125, -0.742950439453125, -0.68499755859375, -0.627044677734375, -0.569091796875, -0.511138916015625, -0.45318603515625, -0.395233154296875, -0.3372802734375, -0.279327392578125, -0.22137451171875, -0.163421630859375, -0.10546875, -0.047515869140625, 0.01043701171875, 0.068389892578125, 0.1263427734375, 0.184295654296875, 0.24224853515625, 0.300201416015625, 0.358154296875, 0.416107177734375, 0.47406005859375, 0.532012939453125, 0.5899658203125, 0.647918701171875, 0.70587158203125, 0.763824462890625, 0.82177734375, 0.879730224609375, 0.93768310546875, 0.995635986328125, 1.0535888671875, 1.111541748046875, 1.16949462890625, 1.227447509765625, 1.285400390625, 1.343353271484375, 1.40130615234375, 1.459259033203125, 1.5172119140625, 1.575164794921875, 1.63311767578125, 1.691070556640625, 1.7490234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 6.0, 10.0, 19.0, 30.0, 39.0, 64.0, 68.0, 133.0, 221.0, 372.0, 863.0, 2235.0, 7945.0, 47062.0, 549871.0, 393254.0, 36182.0, 6602.0, 1882.0, 761.0, 385.0, 190.0, 104.0, 91.0, 41.0, 34.0, 19.0, 18.0, 17.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.4296875, -13.9915771484375, -13.553466796875, -13.1153564453125, -12.67724609375, -12.2391357421875, -11.801025390625, -11.3629150390625, -10.9248046875, -10.4866943359375, -10.048583984375, -9.6104736328125, -9.17236328125, -8.7342529296875, -8.296142578125, -7.8580322265625, -7.419921875, -6.9818115234375, -6.543701171875, -6.1055908203125, -5.66748046875, -5.2293701171875, -4.791259765625, -4.3531494140625, -3.9150390625, -3.4769287109375, -3.038818359375, -2.6007080078125, -2.16259765625, -1.7244873046875, -1.286376953125, -0.8482666015625, -0.41015625, 0.0279541015625, 0.466064453125, 0.9041748046875, 1.34228515625, 1.7803955078125, 2.218505859375, 2.6566162109375, 3.0947265625, 3.5328369140625, 3.970947265625, 4.4090576171875, 4.84716796875, 5.2852783203125, 5.723388671875, 6.1614990234375, 6.599609375, 7.0377197265625, 7.475830078125, 7.9139404296875, 8.35205078125, 8.7901611328125, 9.228271484375, 9.6663818359375, 10.1044921875, 10.5426025390625, 10.980712890625, 11.4188232421875, 11.85693359375, 12.2950439453125, 12.733154296875, 13.1712646484375, 13.609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 7.0, 7.0, 10.0, 21.0, 17.0, 19.0, 23.0, 25.0, 32.0, 26.0, 38.0, 45.0, 42.0, 41.0, 48.0, 56.0, 40.0, 43.0, 52.0, 53.0, 41.0, 45.0, 38.0, 29.0, 28.0, 32.0, 33.0, 14.0, 24.0, 11.0, 8.0, 12.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.4921875, -7.26239013671875, -7.0325927734375, -6.80279541015625, -6.572998046875, -6.34320068359375, -6.1134033203125, -5.88360595703125, -5.65380859375, -5.42401123046875, -5.1942138671875, -4.96441650390625, -4.734619140625, -4.50482177734375, -4.2750244140625, -4.04522705078125, -3.8154296875, -3.58563232421875, -3.3558349609375, -3.12603759765625, -2.896240234375, -2.66644287109375, -2.4366455078125, -2.20684814453125, -1.97705078125, -1.74725341796875, -1.5174560546875, -1.28765869140625, -1.057861328125, -0.82806396484375, -0.5982666015625, -0.36846923828125, -0.138671875, 0.09112548828125, 0.3209228515625, 0.55072021484375, 0.780517578125, 1.01031494140625, 1.2401123046875, 1.46990966796875, 1.69970703125, 1.92950439453125, 2.1593017578125, 2.38909912109375, 2.618896484375, 2.84869384765625, 3.0784912109375, 3.30828857421875, 3.5380859375, 3.76788330078125, 3.9976806640625, 4.22747802734375, 4.457275390625, 4.68707275390625, 4.9168701171875, 5.14666748046875, 5.37646484375, 5.60626220703125, 5.8360595703125, 6.06585693359375, 6.295654296875, 6.52545166015625, 6.7552490234375, 6.98504638671875, 7.21484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 18.0, 22.0, 42.0, 86.0, 131.0, 298.0, 868.0, 4088.0, 50217.0, 954923.0, 33287.0, 3262.0, 765.0, 273.0, 106.0, 66.0, 36.0, 17.0, 15.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.894775390625, -20.30517578125, -19.715576171875, -19.1259765625, -18.536376953125, -17.94677734375, -17.357177734375, -16.767578125, -16.177978515625, -15.58837890625, -14.998779296875, -14.4091796875, -13.819580078125, -13.22998046875, -12.640380859375, -12.05078125, -11.461181640625, -10.87158203125, -10.281982421875, -9.6923828125, -9.102783203125, -8.51318359375, -7.923583984375, -7.333984375, -6.744384765625, -6.15478515625, -5.565185546875, -4.9755859375, -4.385986328125, -3.79638671875, -3.206787109375, -2.6171875, -2.027587890625, -1.43798828125, -0.848388671875, -0.2587890625, 0.330810546875, 0.92041015625, 1.510009765625, 2.099609375, 2.689208984375, 3.27880859375, 3.868408203125, 4.4580078125, 5.047607421875, 5.63720703125, 6.226806640625, 6.81640625, 7.406005859375, 7.99560546875, 8.585205078125, 9.1748046875, 9.764404296875, 10.35400390625, 10.943603515625, 11.533203125, 12.122802734375, 12.71240234375, 13.302001953125, 13.8916015625, 14.481201171875, 15.07080078125, 15.660400390625, 16.25]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 6.0, 11.0, 29.0, 43.0, 75.0, 189.0, 314.0, 163.0, 56.0, 33.0, 23.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00205230712890625, -0.0020060762763023376, -0.0019598454236984253, -0.001913614571094513, -0.0018673837184906006, -0.0018211528658866882, -0.0017749220132827759, -0.0017286911606788635, -0.0016824603080749512, -0.0016362294554710388, -0.0015899986028671265, -0.0015437677502632141, -0.0014975368976593018, -0.0014513060450553894, -0.001405075192451477, -0.0013588443398475647, -0.0013126134872436523, -0.00126638263463974, -0.0012201517820358276, -0.0011739209294319153, -0.001127690076828003, -0.0010814592242240906, -0.0010352283716201782, -0.0009889975190162659, -0.0009427666664123535, -0.0008965358138084412, -0.0008503049612045288, -0.0008040741086006165, -0.0007578432559967041, -0.0007116124033927917, -0.0006653815507888794, -0.000619150698184967, -0.0005729198455810547, -0.0005266889929771423, -0.00048045814037323, -0.0004342272877693176, -0.0003879964351654053, -0.0003417655825614929, -0.00029553472995758057, -0.0002493038773536682, -0.00020307302474975586, -0.0001568421721458435, -0.00011061131954193115, -6.43804669380188e-05, -1.8149614334106445e-05, 2.8081238269805908e-05, 7.431209087371826e-05, 0.00012054294347763062, 0.00016677379608154297, 0.00021300464868545532, 0.0002592355012893677, 0.00030546635389328003, 0.0003516972064971924, 0.00039792805910110474, 0.0004441589117050171, 0.0004903897643089294, 0.0005366206169128418, 0.0005828514695167542, 0.0006290823221206665, 0.0006753131747245789, 0.0007215440273284912, 0.0007677748799324036, 0.0008140057325363159, 0.0008602365851402283, 0.0009064674377441406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 9.0, 7.0, 11.0, 27.0, 57.0, 64.0, 163.0, 312.0, 960.0, 5350.0, 188220.0, 842025.0, 9263.0, 1300.0, 411.0, 172.0, 70.0, 54.0, 31.0, 17.0, 10.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.6083984375, -20.935546875, -20.2626953125, -19.58984375, -18.9169921875, -18.244140625, -17.5712890625, -16.8984375, -16.2255859375, -15.552734375, -14.8798828125, -14.20703125, -13.5341796875, -12.861328125, -12.1884765625, -11.515625, -10.8427734375, -10.169921875, -9.4970703125, -8.82421875, -8.1513671875, -7.478515625, -6.8056640625, -6.1328125, -5.4599609375, -4.787109375, -4.1142578125, -3.44140625, -2.7685546875, -2.095703125, -1.4228515625, -0.75, -0.0771484375, 0.595703125, 1.2685546875, 1.94140625, 2.6142578125, 3.287109375, 3.9599609375, 4.6328125, 5.3056640625, 5.978515625, 6.6513671875, 7.32421875, 7.9970703125, 8.669921875, 9.3427734375, 10.015625, 10.6884765625, 11.361328125, 12.0341796875, 12.70703125, 13.3798828125, 14.052734375, 14.7255859375, 15.3984375, 16.0712890625, 16.744140625, 17.4169921875, 18.08984375, 18.7626953125, 19.435546875, 20.1083984375, 20.78125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 4.0, 4.0, 5.0, 13.0, 16.0, 21.0, 22.0, 36.0, 63.0, 111.0, 171.0, 174.0, 129.0, 76.0, 43.0, 31.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.11126708984375, -6.9022216796875, -6.69317626953125, -6.484130859375, -6.27508544921875, -6.0660400390625, -5.85699462890625, -5.64794921875, -5.43890380859375, -5.2298583984375, -5.02081298828125, -4.811767578125, -4.60272216796875, -4.3936767578125, -4.18463134765625, -3.9755859375, -3.76654052734375, -3.5574951171875, -3.34844970703125, -3.139404296875, -2.93035888671875, -2.7213134765625, -2.51226806640625, -2.30322265625, -2.09417724609375, -1.8851318359375, -1.67608642578125, -1.467041015625, -1.25799560546875, -1.0489501953125, -0.83990478515625, -0.630859375, -0.42181396484375, -0.2127685546875, -0.00372314453125, 0.205322265625, 0.41436767578125, 0.6234130859375, 0.83245849609375, 1.04150390625, 1.25054931640625, 1.4595947265625, 1.66864013671875, 1.877685546875, 2.08673095703125, 2.2957763671875, 2.50482177734375, 2.7138671875, 2.92291259765625, 3.1319580078125, 3.34100341796875, 3.550048828125, 3.75909423828125, 3.9681396484375, 4.17718505859375, 4.38623046875, 4.59527587890625, 4.8043212890625, 5.01336669921875, 5.222412109375, 5.43145751953125, 5.6405029296875, 5.84954833984375, 6.05859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 19.0, 49.0, 176.0, 292.0, 269.0, 127.0, 41.0, 16.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-226.10894775390625, -221.2001953125, -216.29144287109375, -211.38270568847656, -206.4739532470703, -201.56520080566406, -196.6564483642578, -191.74769592285156, -186.83895874023438, -181.93020629882812, -177.02145385742188, -172.1127166748047, -167.20396423339844, -162.2952117919922, -157.38645935058594, -152.4777069091797, -147.56895446777344, -142.6602020263672, -137.75144958496094, -132.84271240234375, -127.9339599609375, -123.02520751953125, -118.116455078125, -113.20770263671875, -108.29895782470703, -103.39020538330078, -98.48146057128906, -93.57270812988281, -88.66395568847656, -83.75521087646484, -78.8464584350586, -73.93771362304688, -69.02894592285156, -64.12019348144531, -59.211448669433594, -54.302696228027344, -49.39394760131836, -44.485198974609375, -39.576446533203125, -34.66769790649414, -29.758949279785156, -24.850200653076172, -19.941450119018555, -15.032700538635254, -10.123950958251953, -5.215202331542969, -0.30645179748535156, 4.602298736572266, 9.51104736328125, 14.41979694366455, 19.32854652404785, 24.23729705810547, 29.146045684814453, 34.05479431152344, 38.96354675292969, 43.87229537963867, 48.781044006347656, 53.68979263305664, 58.598541259765625, 63.507293701171875, 68.41604614257812, 73.32479095458984, 78.2335433959961, 83.14228820800781, 88.05104064941406]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 10.0, 6.0, 11.0, 15.0, 15.0, 14.0, 13.0, 20.0, 23.0, 22.0, 22.0, 24.0, 34.0, 35.0, 34.0, 40.0, 37.0, 36.0, 31.0, 37.0, 41.0, 40.0, 35.0, 38.0, 46.0, 34.0, 26.0, 42.0, 31.0, 26.0, 22.0, 15.0, 23.0, 16.0, 16.0, 13.0, 10.0, 12.0, 9.0, 3.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-33.73252487182617, -32.62526321411133, -31.518001556396484, -30.41073989868164, -29.303478240966797, -28.196216583251953, -27.088956832885742, -25.9816951751709, -24.874433517456055, -23.76717185974121, -22.659910202026367, -21.552648544311523, -20.445388793945312, -19.33812713623047, -18.230865478515625, -17.12360382080078, -16.016342163085938, -14.909080505371094, -13.80181884765625, -12.694558143615723, -11.587296485900879, -10.480034828186035, -9.372774124145508, -8.265512466430664, -7.15825080871582, -6.050989151000977, -4.943727970123291, -3.8364665508270264, -2.7292051315307617, -1.621943473815918, -0.5146822929382324, 0.5925788879394531, 1.6998367309570312, 2.807098150253296, 3.9143595695495605, 5.021620750427246, 6.12888240814209, 7.236144065856934, 8.343404769897461, 9.450666427612305, 10.557928085327148, 11.665189743041992, 12.772451400756836, 13.879712104797363, 14.986973762512207, 16.094234466552734, 17.201496124267578, 18.308757781982422, 19.416019439697266, 20.52328109741211, 21.630542755126953, 22.737804412841797, 23.84506607055664, 24.952327728271484, 26.059587478637695, 27.16684913635254, 28.274110794067383, 29.381372451782227, 30.48863410949707, 31.595895767211914, 32.703155517578125, 33.81041717529297, 34.91767883300781, 36.024940490722656, 37.1322021484375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 16.0, 11.0, 29.0, 40.0, 55.0, 107.0, 173.0, 392.0, 988.0, 3032.0, 11344.0, 73698.0, 3872231.0, 205713.0, 19341.0, 4534.0, 1428.0, 544.0, 258.0, 140.0, 76.0, 43.0, 27.0, 13.0, 13.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.609375, -22.947509765625, -22.28564453125, -21.623779296875, -20.9619140625, -20.300048828125, -19.63818359375, -18.976318359375, -18.314453125, -17.652587890625, -16.99072265625, -16.328857421875, -15.6669921875, -15.005126953125, -14.34326171875, -13.681396484375, -13.01953125, -12.357666015625, -11.69580078125, -11.033935546875, -10.3720703125, -9.710205078125, -9.04833984375, -8.386474609375, -7.724609375, -7.062744140625, -6.40087890625, -5.739013671875, -5.0771484375, -4.415283203125, -3.75341796875, -3.091552734375, -2.4296875, -1.767822265625, -1.10595703125, -0.444091796875, 0.2177734375, 0.879638671875, 1.54150390625, 2.203369140625, 2.865234375, 3.527099609375, 4.18896484375, 4.850830078125, 5.5126953125, 6.174560546875, 6.83642578125, 7.498291015625, 8.16015625, 8.822021484375, 9.48388671875, 10.145751953125, 10.8076171875, 11.469482421875, 12.13134765625, 12.793212890625, 13.455078125, 14.116943359375, 14.77880859375, 15.440673828125, 16.1025390625, 16.764404296875, 17.42626953125, 18.088134765625, 18.75]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 11.0, 8.0, 14.0, 12.0, 23.0, 22.0, 27.0, 24.0, 36.0, 41.0, 32.0, 54.0, 54.0, 61.0, 53.0, 54.0, 46.0, 29.0, 53.0, 49.0, 37.0, 39.0, 33.0, 38.0, 34.0, 23.0, 15.0, 11.0, 14.0, 6.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7024078369140625, -1.642120361328125, -1.5818328857421875, -1.52154541015625, -1.4612579345703125, -1.400970458984375, -1.3406829833984375, -1.2803955078125, -1.2201080322265625, -1.159820556640625, -1.0995330810546875, -1.03924560546875, -0.9789581298828125, -0.918670654296875, -0.8583831787109375, -0.798095703125, -0.7378082275390625, -0.677520751953125, -0.6172332763671875, -0.55694580078125, -0.4966583251953125, -0.436370849609375, -0.3760833740234375, -0.3157958984375, -0.2555084228515625, -0.195220947265625, -0.1349334716796875, -0.07464599609375, -0.0143585205078125, 0.045928955078125, 0.1062164306640625, 0.16650390625, 0.2267913818359375, 0.287078857421875, 0.3473663330078125, 0.40765380859375, 0.4679412841796875, 0.528228759765625, 0.5885162353515625, 0.6488037109375, 0.7090911865234375, 0.769378662109375, 0.8296661376953125, 0.88995361328125, 0.9502410888671875, 1.010528564453125, 1.0708160400390625, 1.131103515625, 1.1913909912109375, 1.251678466796875, 1.3119659423828125, 1.37225341796875, 1.4325408935546875, 1.492828369140625, 1.5531158447265625, 1.6134033203125, 1.6736907958984375, 1.733978271484375, 1.7942657470703125, 1.85455322265625, 1.9148406982421875, 1.975128173828125, 2.0354156494140625, 2.095703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 9.0, 1.0, 12.0, 21.0, 32.0, 68.0, 133.0, 291.0, 748.0, 2316.0, 10074.0, 86451.0, 3914732.0, 160592.0, 14461.0, 2825.0, 871.0, 357.0, 128.0, 80.0, 44.0, 10.0, 9.0, 6.0, 9.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -23.195556640625, -22.57861328125, -21.961669921875, -21.3447265625, -20.727783203125, -20.11083984375, -19.493896484375, -18.876953125, -18.260009765625, -17.64306640625, -17.026123046875, -16.4091796875, -15.792236328125, -15.17529296875, -14.558349609375, -13.94140625, -13.324462890625, -12.70751953125, -12.090576171875, -11.4736328125, -10.856689453125, -10.23974609375, -9.622802734375, -9.005859375, -8.388916015625, -7.77197265625, -7.155029296875, -6.5380859375, -5.921142578125, -5.30419921875, -4.687255859375, -4.0703125, -3.453369140625, -2.83642578125, -2.219482421875, -1.6025390625, -0.985595703125, -0.36865234375, 0.248291015625, 0.865234375, 1.482177734375, 2.09912109375, 2.716064453125, 3.3330078125, 3.949951171875, 4.56689453125, 5.183837890625, 5.80078125, 6.417724609375, 7.03466796875, 7.651611328125, 8.2685546875, 8.885498046875, 9.50244140625, 10.119384765625, 10.736328125, 11.353271484375, 11.97021484375, 12.587158203125, 13.2041015625, 13.821044921875, 14.43798828125, 15.054931640625, 15.671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 10.0, 9.0, 9.0, 27.0, 37.0, 55.0, 64.0, 140.0, 362.0, 1256.0, 1355.0, 348.0, 137.0, 77.0, 50.0, 29.0, 15.0, 21.0, 16.0, 11.0, 10.0, 9.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.10418701171875, -4.9583740234375, -4.81256103515625, -4.666748046875, -4.52093505859375, -4.3751220703125, -4.22930908203125, -4.08349609375, -3.93768310546875, -3.7918701171875, -3.64605712890625, -3.500244140625, -3.35443115234375, -3.2086181640625, -3.06280517578125, -2.9169921875, -2.77117919921875, -2.6253662109375, -2.47955322265625, -2.333740234375, -2.18792724609375, -2.0421142578125, -1.89630126953125, -1.75048828125, -1.60467529296875, -1.4588623046875, -1.31304931640625, -1.167236328125, -1.02142333984375, -0.8756103515625, -0.72979736328125, -0.583984375, -0.43817138671875, -0.2923583984375, -0.14654541015625, -0.000732421875, 0.14508056640625, 0.2908935546875, 0.43670654296875, 0.58251953125, 0.72833251953125, 0.8741455078125, 1.01995849609375, 1.165771484375, 1.31158447265625, 1.4573974609375, 1.60321044921875, 1.7490234375, 1.89483642578125, 2.0406494140625, 2.18646240234375, 2.332275390625, 2.47808837890625, 2.6239013671875, 2.76971435546875, 2.91552734375, 3.06134033203125, 3.2071533203125, 3.35296630859375, 3.498779296875, 3.64459228515625, 3.7904052734375, 3.93621826171875, 4.08203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 36.0, 111.0, 233.0, 317.0, 198.0, 71.0, 18.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.51558303833008, -43.651119232177734, -41.78665542602539, -39.92218780517578, -38.05772399902344, -36.193260192871094, -34.32879638671875, -32.464332580566406, -30.59986686706543, -28.735403060913086, -26.87093734741211, -25.006473541259766, -23.142009735107422, -21.277544021606445, -19.4130802154541, -17.548614501953125, -15.684150695800781, -13.819685935974121, -11.955221176147461, -10.090757369995117, -8.226292610168457, -6.361827850341797, -4.497364044189453, -2.632899284362793, -0.7684345245361328, 1.0960299968719482, 2.9604945182800293, 4.824958801269531, 6.689423561096191, 8.553888320922852, 10.418352127075195, 12.282816886901855, 14.14727783203125, 16.011741638183594, 17.87620735168457, 19.740671157836914, 21.60513687133789, 23.469600677490234, 25.334064483642578, 27.198528289794922, 29.0629940032959, 30.927457809448242, 32.79192352294922, 34.65638732910156, 36.520851135253906, 38.38531494140625, 40.249778747558594, 42.1142463684082, 43.97871017456055, 45.84317398071289, 47.707637786865234, 49.572105407714844, 51.43656921386719, 53.30103302001953, 55.165496826171875, 57.02996063232422, 58.89442443847656, 60.758888244628906, 62.62335205078125, 64.4878158569336, 66.35227966308594, 68.21675109863281, 70.08120727539062, 71.9456787109375, 73.81014251708984]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 7.0, 11.0, 10.0, 18.0, 12.0, 14.0, 19.0, 21.0, 24.0, 28.0, 30.0, 28.0, 32.0, 33.0, 31.0, 45.0, 38.0, 41.0, 49.0, 49.0, 30.0, 43.0, 43.0, 39.0, 38.0, 33.0, 36.0, 20.0, 30.0, 19.0, 12.0, 20.0, 12.0, 8.0, 9.0, 12.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-12.501359939575195, -12.115266799926758, -11.729172706604004, -11.343079566955566, -10.956985473632812, -10.570892333984375, -10.184799194335938, -9.7987060546875, -9.412611961364746, -9.026518821716309, -8.640424728393555, -8.254331588745117, -7.8682379722595215, -7.482144355773926, -7.096051216125488, -6.709957599639893, -6.323863983154297, -5.937770366668701, -5.5516767501831055, -5.165583610534668, -4.779489994049072, -4.393396377563477, -4.007303237915039, -3.6212096214294434, -3.2351160049438477, -2.849022388458252, -2.4629290103912354, -2.0768356323242188, -1.690742015838623, -1.304648518562317, -0.9185550212860107, -0.5324616432189941, -0.14636802673339844, 0.23972547054290771, 0.6258189678192139, 1.01191246509552, 1.3980059623718262, 1.7840994596481323, 2.1701929569244385, 2.556286334991455, 2.942379951477051, 3.3284735679626465, 3.714566946029663, 4.10066032409668, 4.486753940582275, 4.872847557067871, 5.258940696716309, 5.645034313201904, 6.0311279296875, 6.417221546173096, 6.803315162658691, 7.189408302307129, 7.575501918792725, 7.96159553527832, 8.347688674926758, 8.733781814575195, 9.11987590789795, 9.505969047546387, 9.89206314086914, 10.278156280517578, 10.664249420166016, 11.05034351348877, 11.436436653137207, 11.822530746459961, 12.208623886108398]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 12.0, 20.0, 27.0, 28.0, 39.0, 66.0, 82.0, 125.0, 207.0, 320.0, 585.0, 1001.0, 1862.0, 3505.0, 7923.0, 17030.0, 41560.0, 110471.0, 394825.0, 315453.0, 90364.0, 34547.0, 14657.0, 6666.0, 3204.0, 1629.0, 910.0, 507.0, 297.0, 213.0, 125.0, 78.0, 50.0, 49.0, 26.0, 26.0, 4.0, 12.0, 11.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.96875, -6.7276611328125, -6.486572265625, -6.2454833984375, -6.00439453125, -5.7633056640625, -5.522216796875, -5.2811279296875, -5.0400390625, -4.7989501953125, -4.557861328125, -4.3167724609375, -4.07568359375, -3.8345947265625, -3.593505859375, -3.3524169921875, -3.111328125, -2.8702392578125, -2.629150390625, -2.3880615234375, -2.14697265625, -1.9058837890625, -1.664794921875, -1.4237060546875, -1.1826171875, -0.9415283203125, -0.700439453125, -0.4593505859375, -0.21826171875, 0.0228271484375, 0.263916015625, 0.5050048828125, 0.74609375, 0.9871826171875, 1.228271484375, 1.4693603515625, 1.71044921875, 1.9515380859375, 2.192626953125, 2.4337158203125, 2.6748046875, 2.9158935546875, 3.156982421875, 3.3980712890625, 3.63916015625, 3.8802490234375, 4.121337890625, 4.3624267578125, 4.603515625, 4.8446044921875, 5.085693359375, 5.3267822265625, 5.56787109375, 5.8089599609375, 6.050048828125, 6.2911376953125, 6.5322265625, 6.7733154296875, 7.014404296875, 7.2554931640625, 7.49658203125, 7.7376708984375, 7.978759765625, 8.2198486328125, 8.4609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 9.0, 17.0, 12.0, 17.0, 26.0, 32.0, 29.0, 26.0, 34.0, 35.0, 53.0, 47.0, 46.0, 56.0, 40.0, 52.0, 50.0, 44.0, 46.0, 35.0, 39.0, 41.0, 39.0, 31.0, 25.0, 24.0, 16.0, 13.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.758544921875, -1.69677734375, -1.635009765625, -1.5732421875, -1.511474609375, -1.44970703125, -1.387939453125, -1.326171875, -1.264404296875, -1.20263671875, -1.140869140625, -1.0791015625, -1.017333984375, -0.95556640625, -0.893798828125, -0.83203125, -0.770263671875, -0.70849609375, -0.646728515625, -0.5849609375, -0.523193359375, -0.46142578125, -0.399658203125, -0.337890625, -0.276123046875, -0.21435546875, -0.152587890625, -0.0908203125, -0.029052734375, 0.03271484375, 0.094482421875, 0.15625, 0.218017578125, 0.27978515625, 0.341552734375, 0.4033203125, 0.465087890625, 0.52685546875, 0.588623046875, 0.650390625, 0.712158203125, 0.77392578125, 0.835693359375, 0.8974609375, 0.959228515625, 1.02099609375, 1.082763671875, 1.14453125, 1.206298828125, 1.26806640625, 1.329833984375, 1.3916015625, 1.453369140625, 1.51513671875, 1.576904296875, 1.638671875, 1.700439453125, 1.76220703125, 1.823974609375, 1.8857421875, 1.947509765625, 2.00927734375, 2.071044921875, 2.1328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 15.0, 19.0, 20.0, 29.0, 32.0, 39.0, 76.0, 92.0, 157.0, 243.0, 517.0, 1289.0, 3825.0, 14521.0, 68243.0, 563580.0, 333604.0, 46730.0, 10374.0, 2894.0, 1054.0, 441.0, 229.0, 138.0, 96.0, 86.0, 44.0, 32.0, 24.0, 18.0, 18.0, 13.0, 8.0, 8.0, 6.0, 1.0, 0.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.1328125, -12.75634765625, -12.3798828125, -12.00341796875, -11.626953125, -11.25048828125, -10.8740234375, -10.49755859375, -10.12109375, -9.74462890625, -9.3681640625, -8.99169921875, -8.615234375, -8.23876953125, -7.8623046875, -7.48583984375, -7.109375, -6.73291015625, -6.3564453125, -5.97998046875, -5.603515625, -5.22705078125, -4.8505859375, -4.47412109375, -4.09765625, -3.72119140625, -3.3447265625, -2.96826171875, -2.591796875, -2.21533203125, -1.8388671875, -1.46240234375, -1.0859375, -0.70947265625, -0.3330078125, 0.04345703125, 0.419921875, 0.79638671875, 1.1728515625, 1.54931640625, 1.92578125, 2.30224609375, 2.6787109375, 3.05517578125, 3.431640625, 3.80810546875, 4.1845703125, 4.56103515625, 4.9375, 5.31396484375, 5.6904296875, 6.06689453125, 6.443359375, 6.81982421875, 7.1962890625, 7.57275390625, 7.94921875, 8.32568359375, 8.7021484375, 9.07861328125, 9.455078125, 9.83154296875, 10.2080078125, 10.58447265625, 10.9609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 10.0, 8.0, 15.0, 15.0, 28.0, 31.0, 27.0, 31.0, 36.0, 47.0, 49.0, 59.0, 68.0, 55.0, 66.0, 56.0, 48.0, 53.0, 39.0, 47.0, 32.0, 33.0, 25.0, 24.0, 21.0, 13.0, 18.0, 5.0, 11.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0308837890625, -7.718017578125, -7.4051513671875, -7.09228515625, -6.7794189453125, -6.466552734375, -6.1536865234375, -5.8408203125, -5.5279541015625, -5.215087890625, -4.9022216796875, -4.58935546875, -4.2764892578125, -3.963623046875, -3.6507568359375, -3.337890625, -3.0250244140625, -2.712158203125, -2.3992919921875, -2.08642578125, -1.7735595703125, -1.460693359375, -1.1478271484375, -0.8349609375, -0.5220947265625, -0.209228515625, 0.1036376953125, 0.41650390625, 0.7293701171875, 1.042236328125, 1.3551025390625, 1.66796875, 1.9808349609375, 2.293701171875, 2.6065673828125, 2.91943359375, 3.2322998046875, 3.545166015625, 3.8580322265625, 4.1708984375, 4.4837646484375, 4.796630859375, 5.1094970703125, 5.42236328125, 5.7352294921875, 6.048095703125, 6.3609619140625, 6.673828125, 6.9866943359375, 7.299560546875, 7.6124267578125, 7.92529296875, 8.2381591796875, 8.551025390625, 8.8638916015625, 9.1767578125, 9.4896240234375, 9.802490234375, 10.1153564453125, 10.42822265625, 10.7410888671875, 11.053955078125, 11.3668212890625, 11.6796875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 18.0, 22.0, 30.0, 56.0, 94.0, 177.0, 287.0, 516.0, 956.0, 2268.0, 7643.0, 67354.0, 911614.0, 46916.0, 6546.0, 1966.0, 896.0, 482.0, 281.0, 158.0, 107.0, 49.0, 44.0, 24.0, 21.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.967041015625, -11.59814453125, -11.229248046875, -10.8603515625, -10.491455078125, -10.12255859375, -9.753662109375, -9.384765625, -9.015869140625, -8.64697265625, -8.278076171875, -7.9091796875, -7.540283203125, -7.17138671875, -6.802490234375, -6.43359375, -6.064697265625, -5.69580078125, -5.326904296875, -4.9580078125, -4.589111328125, -4.22021484375, -3.851318359375, -3.482421875, -3.113525390625, -2.74462890625, -2.375732421875, -2.0068359375, -1.637939453125, -1.26904296875, -0.900146484375, -0.53125, -0.162353515625, 0.20654296875, 0.575439453125, 0.9443359375, 1.313232421875, 1.68212890625, 2.051025390625, 2.419921875, 2.788818359375, 3.15771484375, 3.526611328125, 3.8955078125, 4.264404296875, 4.63330078125, 5.002197265625, 5.37109375, 5.739990234375, 6.10888671875, 6.477783203125, 6.8466796875, 7.215576171875, 7.58447265625, 7.953369140625, 8.322265625, 8.691162109375, 9.06005859375, 9.428955078125, 9.7978515625, 10.166748046875, 10.53564453125, 10.904541015625, 11.2734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 21.0, 26.0, 40.0, 92.0, 299.0, 312.0, 106.0, 35.0, 23.0, 12.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.002425655722618103, -0.002367943525314331, -0.002310231328010559, -0.002252519130706787, -0.002194806933403015, -0.002137094736099243, -0.002079382538795471, -0.0020216703414916992, -0.0019639581441879272, -0.0019062459468841553, -0.0018485337495803833, -0.0017908215522766113, -0.0017331093549728394, -0.0016753971576690674, -0.0016176849603652954, -0.0015599727630615234, -0.0015022605657577515, -0.0014445483684539795, -0.0013868361711502075, -0.0013291239738464355, -0.0012714117765426636, -0.0012136995792388916, -0.0011559873819351196, -0.0010982751846313477, -0.0010405629873275757, -0.0009828507900238037, -0.0009251385927200317, -0.0008674263954162598, -0.0008097141981124878, -0.0007520020008087158, -0.0006942898035049438, -0.0006365776062011719, -0.0005788654088973999, -0.0005211532115936279, -0.00046344101428985596, -0.000405728816986084, -0.000348016619682312, -0.00029030442237854004, -0.00023259222507476807, -0.0001748800277709961, -0.00011716783046722412, -5.945563316345215e-05, -1.7434358596801758e-06, 5.59687614440918e-05, 0.00011368095874786377, 0.00017139315605163574, 0.00022910535335540771, 0.0002868175506591797, 0.00034452974796295166, 0.00040224194526672363, 0.0004599541425704956, 0.0005176663398742676, 0.0005753785371780396, 0.0006330907344818115, 0.0006908029317855835, 0.0007485151290893555, 0.0008062273263931274, 0.0008639395236968994, 0.0009216517210006714, 0.0009793639183044434, 0.0010370761156082153, 0.0010947883129119873, 0.0011525005102157593, 0.0012102127075195312]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 8.0, 10.0, 14.0, 33.0, 56.0, 107.0, 229.0, 634.0, 2433.0, 20362.0, 985848.0, 34340.0, 3171.0, 773.0, 258.0, 131.0, 59.0, 39.0, 16.0, 8.0, 13.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.63232421875, -19.9990234375, -19.36572265625, -18.732421875, -18.09912109375, -17.4658203125, -16.83251953125, -16.19921875, -15.56591796875, -14.9326171875, -14.29931640625, -13.666015625, -13.03271484375, -12.3994140625, -11.76611328125, -11.1328125, -10.49951171875, -9.8662109375, -9.23291015625, -8.599609375, -7.96630859375, -7.3330078125, -6.69970703125, -6.06640625, -5.43310546875, -4.7998046875, -4.16650390625, -3.533203125, -2.89990234375, -2.2666015625, -1.63330078125, -1.0, -0.36669921875, 0.2666015625, 0.89990234375, 1.533203125, 2.16650390625, 2.7998046875, 3.43310546875, 4.06640625, 4.69970703125, 5.3330078125, 5.96630859375, 6.599609375, 7.23291015625, 7.8662109375, 8.49951171875, 9.1328125, 9.76611328125, 10.3994140625, 11.03271484375, 11.666015625, 12.29931640625, 12.9326171875, 13.56591796875, 14.19921875, 14.83251953125, 15.4658203125, 16.09912109375, 16.732421875, 17.36572265625, 17.9990234375, 18.63232421875, 19.265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 7.0, 12.0, 16.0, 38.0, 73.0, 160.0, 314.0, 200.0, 83.0, 35.0, 21.0, 12.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.2613525390625, -4.944580078125, -4.6278076171875, -4.31103515625, -3.9942626953125, -3.677490234375, -3.3607177734375, -3.0439453125, -2.7271728515625, -2.410400390625, -2.0936279296875, -1.77685546875, -1.4600830078125, -1.143310546875, -0.8265380859375, -0.509765625, -0.1929931640625, 0.123779296875, 0.4405517578125, 0.75732421875, 1.0740966796875, 1.390869140625, 1.7076416015625, 2.0244140625, 2.3411865234375, 2.657958984375, 2.9747314453125, 3.29150390625, 3.6082763671875, 3.925048828125, 4.2418212890625, 4.55859375, 4.8753662109375, 5.192138671875, 5.5089111328125, 5.82568359375, 6.1424560546875, 6.459228515625, 6.7760009765625, 7.0927734375, 7.4095458984375, 7.726318359375, 8.0430908203125, 8.35986328125, 8.6766357421875, 8.993408203125, 9.3101806640625, 9.626953125, 9.9437255859375, 10.260498046875, 10.5772705078125, 10.89404296875, 11.2108154296875, 11.527587890625, 11.8443603515625, 12.1611328125, 12.4779052734375, 12.794677734375, 13.1114501953125, 13.42822265625, 13.7449951171875, 14.061767578125, 14.3785400390625, 14.6953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 15.0, 31.0, 97.0, 196.0, 343.0, 206.0, 75.0, 22.0, 15.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.20159912109375, -161.77169799804688, -157.341796875, -152.91189575195312, -148.4819793701172, -144.0520782470703, -139.62217712402344, -135.19227600097656, -130.7623748779297, -126.33247375488281, -121.9025650024414, -117.47266387939453, -113.04276275634766, -108.61285400390625, -104.18295288085938, -99.7530517578125, -95.3231430053711, -90.89324188232422, -86.46333312988281, -82.03343200683594, -77.60353088378906, -73.17362976074219, -68.74372100830078, -64.3138198852539, -59.883914947509766, -55.454010009765625, -51.02410888671875, -46.59420394897461, -42.16429901123047, -37.734397888183594, -33.30449295043945, -28.874589920043945, -24.44469451904297, -20.01479148864746, -15.584887504577637, -11.154983520507812, -6.725080490112305, -2.295177459716797, 2.1347274780273438, 6.564630508422852, 10.99453353881836, 15.424436569213867, 19.854339599609375, 24.284244537353516, 28.714147567749023, 33.14405059814453, 37.57395553588867, 42.00386047363281, 46.43376159667969, 50.86366653442383, 55.2935676574707, 59.723472595214844, 64.15337371826172, 68.58328247070312, 73.01318359375, 77.44308471679688, 81.87298583984375, 86.30288696289062, 90.73279571533203, 95.1626968383789, 99.59259796142578, 104.02250671386719, 108.45240783691406, 112.88230895996094, 117.31221771240234]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 10.0, 5.0, 9.0, 15.0, 12.0, 20.0, 10.0, 13.0, 12.0, 28.0, 18.0, 19.0, 26.0, 32.0, 30.0, 36.0, 35.0, 43.0, 41.0, 45.0, 44.0, 34.0, 54.0, 33.0, 36.0, 42.0, 30.0, 25.0, 42.0, 34.0, 22.0, 20.0, 17.0, 15.0, 17.0, 17.0, 9.0, 4.0, 13.0, 8.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.29570388793945, -38.12223434448242, -36.948760986328125, -35.775291442871094, -34.60182189941406, -33.428348541259766, -32.254878997802734, -31.08140754699707, -29.907936096191406, -28.734464645385742, -27.560993194580078, -26.387523651123047, -25.214052200317383, -24.04058074951172, -22.867111206054688, -21.693639755249023, -20.52016830444336, -19.346696853637695, -18.17322540283203, -16.999755859375, -15.826284408569336, -14.652812957763672, -13.479342460632324, -12.305871963500977, -11.132400512695312, -9.958929061889648, -8.7854585647583, -7.611987590789795, -6.438516616821289, -5.265045642852783, -4.091574668884277, -2.9181041717529297, -1.7446327209472656, -0.5711617469787598, 0.6023092269897461, 1.775780200958252, 2.949251174926758, 4.122722148895264, 5.2961931228637695, 6.469663619995117, 7.643135070800781, 8.816606521606445, 9.990077018737793, 11.16354751586914, 12.337018966674805, 13.510490417480469, 14.683960914611816, 15.857431411743164, 17.030902862548828, 18.204374313354492, 19.377845764160156, 20.551315307617188, 21.72478675842285, 22.898258209228516, 24.071727752685547, 25.24519920349121, 26.418670654296875, 27.59214210510254, 28.765613555908203, 29.939083099365234, 31.1125545501709, 32.28602600097656, 33.459495544433594, 34.632965087890625, 35.80643844604492]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 7.0, 11.0, 19.0, 13.0, 19.0, 34.0, 48.0, 75.0, 145.0, 209.0, 395.0, 632.0, 1136.0, 2225.0, 4397.0, 10196.0, 27639.0, 108289.0, 3578000.0, 379329.0, 51419.0, 16507.0, 6713.0, 2970.0, 1640.0, 923.0, 528.0, 270.0, 159.0, 115.0, 69.0, 45.0, 30.0, 26.0, 10.0, 10.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.53125, -14.1131591796875, -13.695068359375, -13.2769775390625, -12.85888671875, -12.4407958984375, -12.022705078125, -11.6046142578125, -11.1865234375, -10.7684326171875, -10.350341796875, -9.9322509765625, -9.51416015625, -9.0960693359375, -8.677978515625, -8.2598876953125, -7.841796875, -7.4237060546875, -7.005615234375, -6.5875244140625, -6.16943359375, -5.7513427734375, -5.333251953125, -4.9151611328125, -4.4970703125, -4.0789794921875, -3.660888671875, -3.2427978515625, -2.82470703125, -2.4066162109375, -1.988525390625, -1.5704345703125, -1.15234375, -0.7342529296875, -0.316162109375, 0.1019287109375, 0.52001953125, 0.9381103515625, 1.356201171875, 1.7742919921875, 2.1923828125, 2.6104736328125, 3.028564453125, 3.4466552734375, 3.86474609375, 4.2828369140625, 4.700927734375, 5.1190185546875, 5.537109375, 5.9552001953125, 6.373291015625, 6.7913818359375, 7.20947265625, 7.6275634765625, 8.045654296875, 8.4637451171875, 8.8818359375, 9.2999267578125, 9.718017578125, 10.1361083984375, 10.55419921875, 10.9722900390625, 11.390380859375, 11.8084716796875, 12.2265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 7.0, 15.0, 7.0, 10.0, 14.0, 20.0, 18.0, 18.0, 29.0, 35.0, 20.0, 43.0, 40.0, 42.0, 45.0, 43.0, 44.0, 55.0, 50.0, 36.0, 68.0, 31.0, 38.0, 35.0, 26.0, 35.0, 39.0, 26.0, 25.0, 17.0, 10.0, 17.0, 4.0, 9.0, 3.0, 8.0, 8.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.822265625, -1.759185791015625, -1.69610595703125, -1.633026123046875, -1.5699462890625, -1.506866455078125, -1.44378662109375, -1.380706787109375, -1.317626953125, -1.254547119140625, -1.19146728515625, -1.128387451171875, -1.0653076171875, -1.002227783203125, -0.93914794921875, -0.876068115234375, -0.81298828125, -0.749908447265625, -0.68682861328125, -0.623748779296875, -0.5606689453125, -0.497589111328125, -0.43450927734375, -0.371429443359375, -0.308349609375, -0.245269775390625, -0.18218994140625, -0.119110107421875, -0.0560302734375, 0.007049560546875, 0.07012939453125, 0.133209228515625, 0.1962890625, 0.259368896484375, 0.32244873046875, 0.385528564453125, 0.4486083984375, 0.511688232421875, 0.57476806640625, 0.637847900390625, 0.700927734375, 0.764007568359375, 0.82708740234375, 0.890167236328125, 0.9532470703125, 1.016326904296875, 1.07940673828125, 1.142486572265625, 1.20556640625, 1.268646240234375, 1.33172607421875, 1.394805908203125, 1.4578857421875, 1.520965576171875, 1.58404541015625, 1.647125244140625, 1.710205078125, 1.773284912109375, 1.83636474609375, 1.899444580078125, 1.9625244140625, 2.025604248046875, 2.08868408203125, 2.151763916015625, 2.21484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 10.0, 19.0, 39.0, 83.0, 168.0, 470.0, 1775.0, 12152.0, 200816.0, 3931388.0, 41349.0, 4648.0, 862.0, 267.0, 103.0, 51.0, 38.0, 17.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -31.8515625, -30.921875, -29.9921875, -29.0625, -28.1328125, -27.203125, -26.2734375, -25.34375, -24.4140625, -23.484375, -22.5546875, -21.625, -20.6953125, -19.765625, -18.8359375, -17.90625, -16.9765625, -16.046875, -15.1171875, -14.1875, -13.2578125, -12.328125, -11.3984375, -10.46875, -9.5390625, -8.609375, -7.6796875, -6.75, -5.8203125, -4.890625, -3.9609375, -3.03125, -2.1015625, -1.171875, -0.2421875, 0.6875, 1.6171875, 2.546875, 3.4765625, 4.40625, 5.3359375, 6.265625, 7.1953125, 8.125, 9.0546875, 9.984375, 10.9140625, 11.84375, 12.7734375, 13.703125, 14.6328125, 15.5625, 16.4921875, 17.421875, 18.3515625, 19.28125, 20.2109375, 21.140625, 22.0703125, 23.0, 23.9296875, 24.859375, 25.7890625, 26.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 6.0, 7.0, 12.0, 27.0, 40.0, 43.0, 69.0, 156.0, 622.0, 2530.0, 293.0, 119.0, 46.0, 24.0, 20.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.419189453125, -9.16650390625, -8.913818359375, -8.6611328125, -8.408447265625, -8.15576171875, -7.903076171875, -7.650390625, -7.397705078125, -7.14501953125, -6.892333984375, -6.6396484375, -6.386962890625, -6.13427734375, -5.881591796875, -5.62890625, -5.376220703125, -5.12353515625, -4.870849609375, -4.6181640625, -4.365478515625, -4.11279296875, -3.860107421875, -3.607421875, -3.354736328125, -3.10205078125, -2.849365234375, -2.5966796875, -2.343994140625, -2.09130859375, -1.838623046875, -1.5859375, -1.333251953125, -1.08056640625, -0.827880859375, -0.5751953125, -0.322509765625, -0.06982421875, 0.182861328125, 0.435546875, 0.688232421875, 0.94091796875, 1.193603515625, 1.4462890625, 1.698974609375, 1.95166015625, 2.204345703125, 2.45703125, 2.709716796875, 2.96240234375, 3.215087890625, 3.4677734375, 3.720458984375, 3.97314453125, 4.225830078125, 4.478515625, 4.731201171875, 4.98388671875, 5.236572265625, 5.4892578125, 5.741943359375, 5.99462890625, 6.247314453125, 6.5]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 18.0, 35.0, 73.0, 103.0, 195.0, 206.0, 150.0, 99.0, 46.0, 29.0, 16.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.949222564697266, -39.78824234008789, -38.62725830078125, -37.466278076171875, -36.305294036865234, -35.14431381225586, -33.98332977294922, -32.822349548339844, -31.661365509033203, -30.500383377075195, -29.339401245117188, -28.17841911315918, -27.017436981201172, -25.856454849243164, -24.695472717285156, -23.53449249267578, -22.373510360717773, -21.212528228759766, -20.051546096801758, -18.89056396484375, -17.729581832885742, -16.568599700927734, -15.407618522644043, -14.246636390686035, -13.085654258728027, -11.92467212677002, -10.763689994812012, -9.60270881652832, -8.441726684570312, -7.2807440757751465, -6.119762420654297, -4.958780288696289, -3.7977981567382812, -2.6368160247802734, -1.4758341312408447, -0.314852237701416, 0.8461298942565918, 2.0071120262145996, 3.168093681335449, 4.329075813293457, 5.490057945251465, 6.651040077209473, 7.8120222091674805, 8.973003387451172, 10.13398551940918, 11.294967651367188, 12.455949783325195, 13.616931915283203, 14.777914047241211, 15.938896179199219, 17.099878311157227, 18.260860443115234, 19.421842575073242, 20.58282470703125, 21.743804931640625, 22.904788970947266, 24.06576919555664, 25.22675132751465, 26.387733459472656, 27.548715591430664, 28.709697723388672, 29.87067985534668, 31.031661987304688, 32.19264221191406, 33.3536262512207]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 10.0, 7.0, 11.0, 19.0, 9.0, 12.0, 14.0, 25.0, 27.0, 31.0, 26.0, 25.0, 46.0, 36.0, 41.0, 38.0, 36.0, 38.0, 32.0, 46.0, 51.0, 56.0, 43.0, 37.0, 35.0, 35.0, 27.0, 31.0, 22.0, 16.0, 22.0, 18.0, 19.0, 11.0, 11.0, 4.0, 5.0, 9.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.395833969116211, -14.941278457641602, -14.486722946166992, -14.0321683883667, -13.57761287689209, -13.12305736541748, -12.668502807617188, -12.213947296142578, -11.759391784667969, -11.30483627319336, -10.85028076171875, -10.395726203918457, -9.941170692443848, -9.486615180969238, -9.032060623168945, -8.577505111694336, -8.122949600219727, -7.668394088745117, -7.213839054107666, -6.759284019470215, -6.3047285079956055, -5.850172996520996, -5.395617961883545, -4.941062927246094, -4.486507415771484, -4.031951904296875, -3.577396869659424, -3.1228415966033936, -2.6682863235473633, -2.213731050491333, -1.7591757774353027, -1.3046205043792725, -0.8500652313232422, -0.3955099582672119, 0.05904531478881836, 0.5136005878448486, 0.9681558609008789, 1.4227111339569092, 1.8772664070129395, 2.3318216800689697, 2.786376953125, 3.2409322261810303, 3.6954874992370605, 4.150042533874512, 4.604598045349121, 5.0591535568237305, 5.513708591461182, 5.968263626098633, 6.422819137573242, 6.877374649047852, 7.331929683685303, 7.786484718322754, 8.241040229797363, 8.695595741271973, 9.150150299072266, 9.604705810546875, 10.059261322021484, 10.513816833496094, 10.968372344970703, 11.422926902770996, 11.877482414245605, 12.332037925720215, 12.786592483520508, 13.241147994995117, 13.695703506469727]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 10.0, 14.0, 17.0, 30.0, 34.0, 42.0, 68.0, 89.0, 147.0, 222.0, 333.0, 610.0, 980.0, 1924.0, 3650.0, 7139.0, 14848.0, 32579.0, 73963.0, 167821.0, 341786.0, 223030.0, 97282.0, 43136.0, 19584.0, 9104.0, 4522.0, 2337.0, 1319.0, 694.0, 413.0, 290.0, 159.0, 101.0, 91.0, 54.0, 39.0, 33.0, 20.0, 11.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3359375, -7.10430908203125, -6.8726806640625, -6.64105224609375, -6.409423828125, -6.17779541015625, -5.9461669921875, -5.71453857421875, -5.48291015625, -5.25128173828125, -5.0196533203125, -4.78802490234375, -4.556396484375, -4.32476806640625, -4.0931396484375, -3.86151123046875, -3.6298828125, -3.39825439453125, -3.1666259765625, -2.93499755859375, -2.703369140625, -2.47174072265625, -2.2401123046875, -2.00848388671875, -1.77685546875, -1.54522705078125, -1.3135986328125, -1.08197021484375, -0.850341796875, -0.61871337890625, -0.3870849609375, -0.15545654296875, 0.076171875, 0.30780029296875, 0.5394287109375, 0.77105712890625, 1.002685546875, 1.23431396484375, 1.4659423828125, 1.69757080078125, 1.92919921875, 2.16082763671875, 2.3924560546875, 2.62408447265625, 2.855712890625, 3.08734130859375, 3.3189697265625, 3.55059814453125, 3.7822265625, 4.01385498046875, 4.2454833984375, 4.47711181640625, 4.708740234375, 4.94036865234375, 5.1719970703125, 5.40362548828125, 5.63525390625, 5.86688232421875, 6.0985107421875, 6.33013916015625, 6.561767578125, 6.79339599609375, 7.0250244140625, 7.25665283203125, 7.48828125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 9.0, 11.0, 7.0, 15.0, 12.0, 14.0, 20.0, 28.0, 20.0, 23.0, 33.0, 37.0, 35.0, 41.0, 39.0, 42.0, 54.0, 50.0, 46.0, 40.0, 44.0, 42.0, 32.0, 38.0, 41.0, 32.0, 29.0, 18.0, 29.0, 25.0, 12.0, 17.0, 15.0, 8.0, 8.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6727447509765625, -1.606231689453125, -1.5397186279296875, -1.47320556640625, -1.4066925048828125, -1.340179443359375, -1.2736663818359375, -1.2071533203125, -1.1406402587890625, -1.074127197265625, -1.0076141357421875, -0.94110107421875, -0.8745880126953125, -0.808074951171875, -0.7415618896484375, -0.675048828125, -0.6085357666015625, -0.542022705078125, -0.4755096435546875, -0.40899658203125, -0.3424835205078125, -0.275970458984375, -0.2094573974609375, -0.1429443359375, -0.0764312744140625, -0.009918212890625, 0.0565948486328125, 0.12310791015625, 0.1896209716796875, 0.256134033203125, 0.3226470947265625, 0.38916015625, 0.4556732177734375, 0.522186279296875, 0.5886993408203125, 0.65521240234375, 0.7217254638671875, 0.788238525390625, 0.8547515869140625, 0.9212646484375, 0.9877777099609375, 1.054290771484375, 1.1208038330078125, 1.18731689453125, 1.2538299560546875, 1.320343017578125, 1.3868560791015625, 1.453369140625, 1.5198822021484375, 1.586395263671875, 1.6529083251953125, 1.71942138671875, 1.7859344482421875, 1.852447509765625, 1.9189605712890625, 1.9854736328125, 2.0519866943359375, 2.118499755859375, 2.1850128173828125, 2.25152587890625, 2.3180389404296875, 2.384552001953125, 2.4510650634765625, 2.517578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 11.0, 18.0, 18.0, 22.0, 35.0, 46.0, 57.0, 91.0, 110.0, 144.0, 204.0, 310.0, 458.0, 804.0, 1903.0, 5277.0, 21444.0, 117915.0, 588033.0, 252464.0, 44054.0, 9215.0, 2762.0, 1101.0, 626.0, 405.0, 238.0, 166.0, 137.0, 90.0, 85.0, 67.0, 61.0, 33.0, 35.0, 25.0, 20.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.21875, -12.814697265625, -12.41064453125, -12.006591796875, -11.6025390625, -11.198486328125, -10.79443359375, -10.390380859375, -9.986328125, -9.582275390625, -9.17822265625, -8.774169921875, -8.3701171875, -7.966064453125, -7.56201171875, -7.157958984375, -6.75390625, -6.349853515625, -5.94580078125, -5.541748046875, -5.1376953125, -4.733642578125, -4.32958984375, -3.925537109375, -3.521484375, -3.117431640625, -2.71337890625, -2.309326171875, -1.9052734375, -1.501220703125, -1.09716796875, -0.693115234375, -0.2890625, 0.114990234375, 0.51904296875, 0.923095703125, 1.3271484375, 1.731201171875, 2.13525390625, 2.539306640625, 2.943359375, 3.347412109375, 3.75146484375, 4.155517578125, 4.5595703125, 4.963623046875, 5.36767578125, 5.771728515625, 6.17578125, 6.579833984375, 6.98388671875, 7.387939453125, 7.7919921875, 8.196044921875, 8.60009765625, 9.004150390625, 9.408203125, 9.812255859375, 10.21630859375, 10.620361328125, 11.0244140625, 11.428466796875, 11.83251953125, 12.236572265625, 12.640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 8.0, 12.0, 17.0, 26.0, 32.0, 28.0, 44.0, 42.0, 67.0, 64.0, 72.0, 74.0, 73.0, 67.0, 70.0, 48.0, 51.0, 43.0, 28.0, 33.0, 18.0, 22.0, 14.0, 8.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.323974609375, -15.78857421875, -15.253173828125, -14.7177734375, -14.182373046875, -13.64697265625, -13.111572265625, -12.576171875, -12.040771484375, -11.50537109375, -10.969970703125, -10.4345703125, -9.899169921875, -9.36376953125, -8.828369140625, -8.29296875, -7.757568359375, -7.22216796875, -6.686767578125, -6.1513671875, -5.615966796875, -5.08056640625, -4.545166015625, -4.009765625, -3.474365234375, -2.93896484375, -2.403564453125, -1.8681640625, -1.332763671875, -0.79736328125, -0.261962890625, 0.2734375, 0.808837890625, 1.34423828125, 1.879638671875, 2.4150390625, 2.950439453125, 3.48583984375, 4.021240234375, 4.556640625, 5.092041015625, 5.62744140625, 6.162841796875, 6.6982421875, 7.233642578125, 7.76904296875, 8.304443359375, 8.83984375, 9.375244140625, 9.91064453125, 10.446044921875, 10.9814453125, 11.516845703125, 12.05224609375, 12.587646484375, 13.123046875, 13.658447265625, 14.19384765625, 14.729248046875, 15.2646484375, 15.800048828125, 16.33544921875, 16.870849609375, 17.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 11.0, 16.0, 13.0, 12.0, 41.0, 47.0, 119.0, 188.0, 339.0, 747.0, 1746.0, 5455.0, 35083.0, 707034.0, 272345.0, 18900.0, 3867.0, 1326.0, 587.0, 296.0, 137.0, 82.0, 65.0, 29.0, 28.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-15.3125, -14.9283447265625, -14.544189453125, -14.1600341796875, -13.77587890625, -13.3917236328125, -13.007568359375, -12.6234130859375, -12.2392578125, -11.8551025390625, -11.470947265625, -11.0867919921875, -10.70263671875, -10.3184814453125, -9.934326171875, -9.5501708984375, -9.166015625, -8.7818603515625, -8.397705078125, -8.0135498046875, -7.62939453125, -7.2452392578125, -6.861083984375, -6.4769287109375, -6.0927734375, -5.7086181640625, -5.324462890625, -4.9403076171875, -4.55615234375, -4.1719970703125, -3.787841796875, -3.4036865234375, -3.01953125, -2.6353759765625, -2.251220703125, -1.8670654296875, -1.48291015625, -1.0987548828125, -0.714599609375, -0.3304443359375, 0.0537109375, 0.4378662109375, 0.822021484375, 1.2061767578125, 1.59033203125, 1.9744873046875, 2.358642578125, 2.7427978515625, 3.126953125, 3.5111083984375, 3.895263671875, 4.2794189453125, 4.66357421875, 5.0477294921875, 5.431884765625, 5.8160400390625, 6.2001953125, 6.5843505859375, 6.968505859375, 7.3526611328125, 7.73681640625, 8.1209716796875, 8.505126953125, 8.8892822265625, 9.2734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 3.0, 7.0, 13.0, 21.0, 20.0, 27.0, 55.0, 72.0, 93.0, 239.0, 162.0, 76.0, 54.0, 37.0, 39.0, 22.0, 13.0, 11.0, 4.0, 3.0, 6.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016632080078125, -0.0016224756836891174, -0.0015817433595657349, -0.0015410110354423523, -0.0015002787113189697, -0.0014595463871955872, -0.0014188140630722046, -0.001378081738948822, -0.0013373494148254395, -0.0012966170907020569, -0.0012558847665786743, -0.0012151524424552917, -0.0011744201183319092, -0.0011336877942085266, -0.001092955470085144, -0.0010522231459617615, -0.001011490821838379, -0.0009707584977149963, -0.0009300261735916138, -0.0008892938494682312, -0.0008485615253448486, -0.0008078292012214661, -0.0007670968770980835, -0.0007263645529747009, -0.0006856322288513184, -0.0006448999047279358, -0.0006041675806045532, -0.0005634352564811707, -0.0005227029323577881, -0.0004819706082344055, -0.00044123828411102295, -0.0004005059599876404, -0.0003597736358642578, -0.00031904131174087524, -0.0002783089876174927, -0.0002375766634941101, -0.00019684433937072754, -0.00015611201524734497, -0.0001153796911239624, -7.464736700057983e-05, -3.3915042877197266e-05, 6.817281246185303e-06, 4.754960536956787e-05, 8.828192949295044e-05, 0.000129014253616333, 0.00016974657773971558, 0.00021047890186309814, 0.0002512112259864807, 0.0002919435501098633, 0.00033267587423324585, 0.0003734081983566284, 0.000414140522480011, 0.00045487284660339355, 0.0004956051707267761, 0.0005363374948501587, 0.0005770698189735413, 0.0006178021430969238, 0.0006585344672203064, 0.000699266791343689, 0.0007399991154670715, 0.0007807314395904541, 0.0008214637637138367, 0.0008621960878372192, 0.0009029284119606018, 0.0009436607360839844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 4.0, 7.0, 10.0, 24.0, 59.0, 161.0, 452.0, 1335.0, 11963.0, 893069.0, 136478.0, 3772.0, 748.0, 248.0, 114.0, 51.0, 24.0, 8.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.171875, -28.4737548828125, -27.775634765625, -27.0775146484375, -26.37939453125, -25.6812744140625, -24.983154296875, -24.2850341796875, -23.5869140625, -22.8887939453125, -22.190673828125, -21.4925537109375, -20.79443359375, -20.0963134765625, -19.398193359375, -18.7000732421875, -18.001953125, -17.3038330078125, -16.605712890625, -15.9075927734375, -15.20947265625, -14.5113525390625, -13.813232421875, -13.1151123046875, -12.4169921875, -11.7188720703125, -11.020751953125, -10.3226318359375, -9.62451171875, -8.9263916015625, -8.228271484375, -7.5301513671875, -6.83203125, -6.1339111328125, -5.435791015625, -4.7376708984375, -4.03955078125, -3.3414306640625, -2.643310546875, -1.9451904296875, -1.2470703125, -0.5489501953125, 0.149169921875, 0.8472900390625, 1.54541015625, 2.2435302734375, 2.941650390625, 3.6397705078125, 4.337890625, 5.0360107421875, 5.734130859375, 6.4322509765625, 7.13037109375, 7.8284912109375, 8.526611328125, 9.2247314453125, 9.9228515625, 10.6209716796875, 11.319091796875, 12.0172119140625, 12.71533203125, 13.4134521484375, 14.111572265625, 14.8096923828125, 15.5078125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 14.0, 18.0, 32.0, 40.0, 65.0, 108.0, 159.0, 193.0, 146.0, 71.0, 54.0, 36.0, 21.0, 7.0, 4.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1484375, -13.821044921875, -13.49365234375, -13.166259765625, -12.8388671875, -12.511474609375, -12.18408203125, -11.856689453125, -11.529296875, -11.201904296875, -10.87451171875, -10.547119140625, -10.2197265625, -9.892333984375, -9.56494140625, -9.237548828125, -8.91015625, -8.582763671875, -8.25537109375, -7.927978515625, -7.6005859375, -7.273193359375, -6.94580078125, -6.618408203125, -6.291015625, -5.963623046875, -5.63623046875, -5.308837890625, -4.9814453125, -4.654052734375, -4.32666015625, -3.999267578125, -3.671875, -3.344482421875, -3.01708984375, -2.689697265625, -2.3623046875, -2.034912109375, -1.70751953125, -1.380126953125, -1.052734375, -0.725341796875, -0.39794921875, -0.070556640625, 0.2568359375, 0.584228515625, 0.91162109375, 1.239013671875, 1.56640625, 1.893798828125, 2.22119140625, 2.548583984375, 2.8759765625, 3.203369140625, 3.53076171875, 3.858154296875, 4.185546875, 4.512939453125, 4.84033203125, 5.167724609375, 5.4951171875, 5.822509765625, 6.14990234375, 6.477294921875, 6.8046875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 24.0, 35.0, 77.0, 122.0, 189.0, 199.0, 141.0, 101.0, 52.0, 17.0, 14.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-132.65936279296875, -128.76719665527344, -124.87501525878906, -120.98284912109375, -117.0906753540039, -113.19850158691406, -109.30633544921875, -105.4141616821289, -101.52198791503906, -97.62981414794922, -93.73764038085938, -89.84547424316406, -85.95330047607422, -82.06112670898438, -78.16896057128906, -74.27678680419922, -70.38461303710938, -66.49243927001953, -62.60026931762695, -58.708099365234375, -54.81592559814453, -50.92375183105469, -47.03158187866211, -43.13941192626953, -39.24723815917969, -35.355064392089844, -31.462894439697266, -27.570722579956055, -23.678550720214844, -19.786378860473633, -15.894207000732422, -12.002035140991211, -8.109870910644531, -4.21769905090332, -0.3255271911621094, 3.5666446685791016, 7.4588165283203125, 11.350988388061523, 15.243160247802734, 19.135332107543945, 23.027503967285156, 26.919675827026367, 30.811847686767578, 34.704017639160156, 38.59619140625, 42.488365173339844, 46.38053512573242, 50.272705078125, 54.164878845214844, 58.05705261230469, 61.949222564697266, 65.84139251708984, 69.73356628417969, 73.62574005126953, 77.51791381835938, 81.41007995605469, 85.30225372314453, 89.19442749023438, 93.08659362792969, 96.97876739501953, 100.87094116210938, 104.76311492919922, 108.65528869628906, 112.54745483398438, 116.43962860107422]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 3.0, 8.0, 9.0, 14.0, 7.0, 14.0, 19.0, 21.0, 17.0, 25.0, 38.0, 34.0, 58.0, 43.0, 69.0, 51.0, 67.0, 61.0, 60.0, 50.0, 49.0, 54.0, 31.0, 35.0, 32.0, 18.0, 17.0, 14.0, 20.0, 13.0, 8.0, 5.0, 9.0, 2.0, 3.0, 7.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.0032958984375, -85.32564544677734, -82.64800262451172, -79.97035217285156, -77.29270935058594, -74.61505889892578, -71.93740844726562, -69.259765625, -66.58211517333984, -63.90446853637695, -61.22682189941406, -58.549171447753906, -55.871524810791016, -53.193878173828125, -50.51622772216797, -47.83858108520508, -45.16093444824219, -42.4832878112793, -39.805641174316406, -37.12799072265625, -34.45034408569336, -31.77269744873047, -29.095048904418945, -26.417400360107422, -23.73975372314453, -21.06210708618164, -18.384458541870117, -15.70681095123291, -13.029163360595703, -10.351515769958496, -7.673868179321289, -4.996219635009766, -2.318572998046875, 0.35907459259033203, 3.036722183227539, 5.714369773864746, 8.392017364501953, 11.06966495513916, 13.747312545776367, 16.42496109008789, 19.10260772705078, 21.780254364013672, 24.457902908325195, 27.13555145263672, 29.81319808959961, 32.4908447265625, 35.168495178222656, 37.84614181518555, 40.52378845214844, 43.20143508911133, 45.87908172607422, 48.556732177734375, 51.234378814697266, 53.912025451660156, 56.58967590332031, 59.2673225402832, 61.944969177246094, 64.62261962890625, 67.30026245117188, 69.97791290283203, 72.65556335449219, 75.33320617675781, 78.01085662841797, 80.68850708007812, 83.36614990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 13.0, 6.0, 13.0, 26.0, 37.0, 55.0, 95.0, 160.0, 310.0, 586.0, 1177.0, 2403.0, 5789.0, 16126.0, 60312.0, 753648.0, 3232670.0, 86800.0, 21304.0, 7070.0, 2895.0, 1322.0, 648.0, 355.0, 180.0, 114.0, 69.0, 41.0, 15.0, 10.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.8828125, -12.4549560546875, -12.027099609375, -11.5992431640625, -11.17138671875, -10.7435302734375, -10.315673828125, -9.8878173828125, -9.4599609375, -9.0321044921875, -8.604248046875, -8.1763916015625, -7.74853515625, -7.3206787109375, -6.892822265625, -6.4649658203125, -6.037109375, -5.6092529296875, -5.181396484375, -4.7535400390625, -4.32568359375, -3.8978271484375, -3.469970703125, -3.0421142578125, -2.6142578125, -2.1864013671875, -1.758544921875, -1.3306884765625, -0.90283203125, -0.4749755859375, -0.047119140625, 0.3807373046875, 0.80859375, 1.2364501953125, 1.664306640625, 2.0921630859375, 2.52001953125, 2.9478759765625, 3.375732421875, 3.8035888671875, 4.2314453125, 4.6593017578125, 5.087158203125, 5.5150146484375, 5.94287109375, 6.3707275390625, 6.798583984375, 7.2264404296875, 7.654296875, 8.0821533203125, 8.510009765625, 8.9378662109375, 9.36572265625, 9.7935791015625, 10.221435546875, 10.6492919921875, 11.0771484375, 11.5050048828125, 11.932861328125, 12.3607177734375, 12.78857421875, 13.2164306640625, 13.644287109375, 14.0721435546875, 14.5]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 4.0, 12.0, 12.0, 11.0, 14.0, 27.0, 33.0, 39.0, 34.0, 33.0, 55.0, 56.0, 60.0, 63.0, 59.0, 71.0, 61.0, 45.0, 43.0, 33.0, 38.0, 44.0, 34.0, 19.0, 21.0, 18.0, 17.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.8441162109375, -3.739013671875, -3.6339111328125, -3.52880859375, -3.4237060546875, -3.318603515625, -3.2135009765625, -3.1083984375, -3.0032958984375, -2.898193359375, -2.7930908203125, -2.68798828125, -2.5828857421875, -2.477783203125, -2.3726806640625, -2.267578125, -2.1624755859375, -2.057373046875, -1.9522705078125, -1.84716796875, -1.7420654296875, -1.636962890625, -1.5318603515625, -1.4267578125, -1.3216552734375, -1.216552734375, -1.1114501953125, -1.00634765625, -0.9012451171875, -0.796142578125, -0.6910400390625, -0.5859375, -0.4808349609375, -0.375732421875, -0.2706298828125, -0.16552734375, -0.0604248046875, 0.044677734375, 0.1497802734375, 0.2548828125, 0.3599853515625, 0.465087890625, 0.5701904296875, 0.67529296875, 0.7803955078125, 0.885498046875, 0.9906005859375, 1.095703125, 1.2008056640625, 1.305908203125, 1.4110107421875, 1.51611328125, 1.6212158203125, 1.726318359375, 1.8314208984375, 1.9365234375, 2.0416259765625, 2.146728515625, 2.2518310546875, 2.35693359375, 2.4620361328125, 2.567138671875, 2.6722412109375, 2.77734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 7.0, 5.0, 21.0, 26.0, 48.0, 96.0, 159.0, 294.0, 612.0, 2105.0, 14807.0, 335602.0, 3794554.0, 39955.0, 4151.0, 996.0, 393.0, 213.0, 109.0, 56.0, 28.0, 26.0, 16.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.5703125, -22.734375, -21.8984375, -21.0625, -20.2265625, -19.390625, -18.5546875, -17.71875, -16.8828125, -16.046875, -15.2109375, -14.375, -13.5390625, -12.703125, -11.8671875, -11.03125, -10.1953125, -9.359375, -8.5234375, -7.6875, -6.8515625, -6.015625, -5.1796875, -4.34375, -3.5078125, -2.671875, -1.8359375, -1.0, -0.1640625, 0.671875, 1.5078125, 2.34375, 3.1796875, 4.015625, 4.8515625, 5.6875, 6.5234375, 7.359375, 8.1953125, 9.03125, 9.8671875, 10.703125, 11.5390625, 12.375, 13.2109375, 14.046875, 14.8828125, 15.71875, 16.5546875, 17.390625, 18.2265625, 19.0625, 19.8984375, 20.734375, 21.5703125, 22.40625, 23.2421875, 24.078125, 24.9140625, 25.75, 26.5859375, 27.421875, 28.2578125, 29.09375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 10.0, 5.0, 26.0, 44.0, 78.0, 229.0, 2280.0, 1095.0, 167.0, 65.0, 49.0, 14.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.79931640625, -15.3330078125, -14.86669921875, -14.400390625, -13.93408203125, -13.4677734375, -13.00146484375, -12.53515625, -12.06884765625, -11.6025390625, -11.13623046875, -10.669921875, -10.20361328125, -9.7373046875, -9.27099609375, -8.8046875, -8.33837890625, -7.8720703125, -7.40576171875, -6.939453125, -6.47314453125, -6.0068359375, -5.54052734375, -5.07421875, -4.60791015625, -4.1416015625, -3.67529296875, -3.208984375, -2.74267578125, -2.2763671875, -1.81005859375, -1.34375, -0.87744140625, -0.4111328125, 0.05517578125, 0.521484375, 0.98779296875, 1.4541015625, 1.92041015625, 2.38671875, 2.85302734375, 3.3193359375, 3.78564453125, 4.251953125, 4.71826171875, 5.1845703125, 5.65087890625, 6.1171875, 6.58349609375, 7.0498046875, 7.51611328125, 7.982421875, 8.44873046875, 8.9150390625, 9.38134765625, 9.84765625, 10.31396484375, 10.7802734375, 11.24658203125, 11.712890625, 12.17919921875, 12.6455078125, 13.11181640625, 13.578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 20.0, 44.0, 193.0, 347.0, 284.0, 88.0, 21.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.44204711914062, -89.44474029541016, -86.44744110107422, -83.45013427734375, -80.45282745361328, -77.45552062988281, -74.45822143554688, -71.4609146118164, -68.46360778808594, -65.46630096435547, -62.468997955322266, -59.47169494628906, -56.474388122558594, -53.47708511352539, -50.47978210449219, -47.48247528076172, -44.48517608642578, -41.48787307739258, -38.49056625366211, -35.493263244628906, -32.49595642089844, -29.498653411865234, -26.50135040283203, -23.504045486450195, -20.50674057006836, -17.509435653686523, -14.512131690979004, -11.514827728271484, -8.517522811889648, -5.5202178955078125, -2.5229148864746094, 0.47439002990722656, 3.4716873168945312, 6.468991756439209, 9.466296195983887, 12.463600158691406, 15.460905075073242, 18.458209991455078, 21.45551300048828, 24.452817916870117, 27.450122833251953, 30.44742774963379, 33.444732666015625, 36.44203567504883, 39.43933868408203, 42.4366455078125, 45.4339485168457, 48.431251525878906, 51.428558349609375, 54.42586135864258, 57.42316818237305, 60.42047119140625, 63.41777801513672, 66.41508483886719, 69.41238403320312, 72.4096908569336, 75.40699768066406, 78.40430450439453, 81.40160369873047, 84.39891052246094, 87.3962173461914, 90.39352416992188, 93.39082336425781, 96.38813018798828, 99.38542938232422]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 12.0, 14.0, 9.0, 13.0, 20.0, 25.0, 26.0, 25.0, 39.0, 36.0, 39.0, 42.0, 44.0, 50.0, 70.0, 50.0, 63.0, 68.0, 41.0, 44.0, 40.0, 38.0, 24.0, 28.0, 25.0, 30.0, 20.0, 16.0, 13.0, 9.0, 7.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.645124435424805, -27.810861587524414, -26.976598739624023, -26.142335891723633, -25.308074951171875, -24.473812103271484, -23.639549255371094, -22.805286407470703, -21.971023559570312, -21.136760711669922, -20.30249786376953, -19.46823501586914, -18.63397216796875, -17.79970932006836, -16.9654483795166, -16.13118553161621, -15.29692268371582, -14.46265983581543, -13.628396987915039, -12.794135093688965, -11.959872245788574, -11.125609397888184, -10.29134750366211, -9.457084655761719, -8.622821807861328, -7.7885589599609375, -6.954296588897705, -6.120034217834473, -5.285771369934082, -4.451508522033691, -3.617246150970459, -2.7829837799072266, -1.9487190246582031, -1.1144564151763916, -0.2801938056945801, 0.5540688037872314, 1.388331413269043, 2.2225942611694336, 3.056856632232666, 3.8911190032958984, 4.725381851196289, 5.55964469909668, 6.393907070159912, 7.2281694412231445, 8.062432289123535, 8.896695137023926, 9.73095703125, 10.56521987915039, 11.399482727050781, 12.233745574951172, 13.068008422851562, 13.902270317077637, 14.736533164978027, 15.570796012878418, 16.405057907104492, 17.239320755004883, 18.073583602905273, 18.907846450805664, 19.742109298706055, 20.576372146606445, 21.410633087158203, 22.244895935058594, 23.079158782958984, 23.913421630859375, 24.747684478759766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 15.0, 17.0, 16.0, 25.0, 34.0, 56.0, 80.0, 113.0, 164.0, 232.0, 380.0, 573.0, 895.0, 1455.0, 2496.0, 4446.0, 8009.0, 15663.0, 30735.0, 64640.0, 134068.0, 237374.0, 251021.0, 149826.0, 72756.0, 35194.0, 17196.0, 9179.0, 4843.0, 2696.0, 1601.0, 948.0, 627.0, 366.0, 264.0, 190.0, 114.0, 73.0, 46.0, 29.0, 24.0, 19.0, 19.0, 12.0, 10.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.01953125, -5.82586669921875, -5.6322021484375, -5.43853759765625, -5.244873046875, -5.05120849609375, -4.8575439453125, -4.66387939453125, -4.47021484375, -4.27655029296875, -4.0828857421875, -3.88922119140625, -3.695556640625, -3.50189208984375, -3.3082275390625, -3.11456298828125, -2.9208984375, -2.72723388671875, -2.5335693359375, -2.33990478515625, -2.146240234375, -1.95257568359375, -1.7589111328125, -1.56524658203125, -1.37158203125, -1.17791748046875, -0.9842529296875, -0.79058837890625, -0.596923828125, -0.40325927734375, -0.2095947265625, -0.01593017578125, 0.177734375, 0.37139892578125, 0.5650634765625, 0.75872802734375, 0.952392578125, 1.14605712890625, 1.3397216796875, 1.53338623046875, 1.72705078125, 1.92071533203125, 2.1143798828125, 2.30804443359375, 2.501708984375, 2.69537353515625, 2.8890380859375, 3.08270263671875, 3.2763671875, 3.47003173828125, 3.6636962890625, 3.85736083984375, 4.051025390625, 4.24468994140625, 4.4383544921875, 4.63201904296875, 4.82568359375, 5.01934814453125, 5.2130126953125, 5.40667724609375, 5.600341796875, 5.79400634765625, 5.9876708984375, 6.18133544921875, 6.375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 5.0, 9.0, 6.0, 12.0, 16.0, 20.0, 20.0, 25.0, 26.0, 31.0, 18.0, 43.0, 39.0, 53.0, 54.0, 68.0, 43.0, 54.0, 52.0, 43.0, 44.0, 39.0, 40.0, 29.0, 39.0, 30.0, 25.0, 16.0, 22.0, 17.0, 14.0, 8.0, 7.0, 7.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.939666748046875, -2.84808349609375, -2.756500244140625, -2.6649169921875, -2.573333740234375, -2.48175048828125, -2.390167236328125, -2.298583984375, -2.207000732421875, -2.11541748046875, -2.023834228515625, -1.9322509765625, -1.840667724609375, -1.74908447265625, -1.657501220703125, -1.56591796875, -1.474334716796875, -1.38275146484375, -1.291168212890625, -1.1995849609375, -1.108001708984375, -1.01641845703125, -0.924835205078125, -0.833251953125, -0.741668701171875, -0.65008544921875, -0.558502197265625, -0.4669189453125, -0.375335693359375, -0.28375244140625, -0.192169189453125, -0.1005859375, -0.009002685546875, 0.08258056640625, 0.174163818359375, 0.2657470703125, 0.357330322265625, 0.44891357421875, 0.540496826171875, 0.632080078125, 0.723663330078125, 0.81524658203125, 0.906829833984375, 0.9984130859375, 1.089996337890625, 1.18157958984375, 1.273162841796875, 1.36474609375, 1.456329345703125, 1.54791259765625, 1.639495849609375, 1.7310791015625, 1.822662353515625, 1.91424560546875, 2.005828857421875, 2.097412109375, 2.188995361328125, 2.28057861328125, 2.372161865234375, 2.4637451171875, 2.555328369140625, 2.64691162109375, 2.738494873046875, 2.830078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 10.0, 16.0, 15.0, 20.0, 35.0, 42.0, 70.0, 83.0, 115.0, 170.0, 244.0, 385.0, 630.0, 1211.0, 3057.0, 10374.0, 50702.0, 312763.0, 529581.0, 110466.0, 19570.0, 4958.0, 1785.0, 807.0, 451.0, 285.0, 203.0, 139.0, 93.0, 74.0, 56.0, 29.0, 29.0, 17.0, 17.0, 13.0, 4.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.446533203125, -11.02587890625, -10.605224609375, -10.1845703125, -9.763916015625, -9.34326171875, -8.922607421875, -8.501953125, -8.081298828125, -7.66064453125, -7.239990234375, -6.8193359375, -6.398681640625, -5.97802734375, -5.557373046875, -5.13671875, -4.716064453125, -4.29541015625, -3.874755859375, -3.4541015625, -3.033447265625, -2.61279296875, -2.192138671875, -1.771484375, -1.350830078125, -0.93017578125, -0.509521484375, -0.0888671875, 0.331787109375, 0.75244140625, 1.173095703125, 1.59375, 2.014404296875, 2.43505859375, 2.855712890625, 3.2763671875, 3.697021484375, 4.11767578125, 4.538330078125, 4.958984375, 5.379638671875, 5.80029296875, 6.220947265625, 6.6416015625, 7.062255859375, 7.48291015625, 7.903564453125, 8.32421875, 8.744873046875, 9.16552734375, 9.586181640625, 10.0068359375, 10.427490234375, 10.84814453125, 11.268798828125, 11.689453125, 12.110107421875, 12.53076171875, 12.951416015625, 13.3720703125, 13.792724609375, 14.21337890625, 14.634033203125, 15.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 4.0, 6.0, 3.0, 11.0, 13.0, 11.0, 17.0, 17.0, 27.0, 22.0, 30.0, 25.0, 38.0, 43.0, 32.0, 50.0, 43.0, 43.0, 44.0, 46.0, 56.0, 41.0, 58.0, 38.0, 34.0, 33.0, 39.0, 33.0, 21.0, 26.0, 11.0, 18.0, 6.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0078125, -14.5040283203125, -14.000244140625, -13.4964599609375, -12.99267578125, -12.4888916015625, -11.985107421875, -11.4813232421875, -10.9775390625, -10.4737548828125, -9.969970703125, -9.4661865234375, -8.96240234375, -8.4586181640625, -7.954833984375, -7.4510498046875, -6.947265625, -6.4434814453125, -5.939697265625, -5.4359130859375, -4.93212890625, -4.4283447265625, -3.924560546875, -3.4207763671875, -2.9169921875, -2.4132080078125, -1.909423828125, -1.4056396484375, -0.90185546875, -0.3980712890625, 0.105712890625, 0.6094970703125, 1.11328125, 1.6170654296875, 2.120849609375, 2.6246337890625, 3.12841796875, 3.6322021484375, 4.135986328125, 4.6397705078125, 5.1435546875, 5.6473388671875, 6.151123046875, 6.6549072265625, 7.15869140625, 7.6624755859375, 8.166259765625, 8.6700439453125, 9.173828125, 9.6776123046875, 10.181396484375, 10.6851806640625, 11.18896484375, 11.6927490234375, 12.196533203125, 12.7003173828125, 13.2041015625, 13.7078857421875, 14.211669921875, 14.7154541015625, 15.21923828125, 15.7230224609375, 16.226806640625, 16.7305908203125, 17.234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 6.0, 3.0, 2.0, 7.0, 14.0, 22.0, 24.0, 55.0, 113.0, 168.0, 368.0, 961.0, 2359.0, 7394.0, 33033.0, 239687.0, 619509.0, 117705.0, 19219.0, 4954.0, 1664.0, 618.0, 326.0, 137.0, 87.0, 42.0, 27.0, 14.0, 13.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.799072265625, -6.55908203125, -6.319091796875, -6.0791015625, -5.839111328125, -5.59912109375, -5.359130859375, -5.119140625, -4.879150390625, -4.63916015625, -4.399169921875, -4.1591796875, -3.919189453125, -3.67919921875, -3.439208984375, -3.19921875, -2.959228515625, -2.71923828125, -2.479248046875, -2.2392578125, -1.999267578125, -1.75927734375, -1.519287109375, -1.279296875, -1.039306640625, -0.79931640625, -0.559326171875, -0.3193359375, -0.079345703125, 0.16064453125, 0.400634765625, 0.640625, 0.880615234375, 1.12060546875, 1.360595703125, 1.6005859375, 1.840576171875, 2.08056640625, 2.320556640625, 2.560546875, 2.800537109375, 3.04052734375, 3.280517578125, 3.5205078125, 3.760498046875, 4.00048828125, 4.240478515625, 4.48046875, 4.720458984375, 4.96044921875, 5.200439453125, 5.4404296875, 5.680419921875, 5.92041015625, 6.160400390625, 6.400390625, 6.640380859375, 6.88037109375, 7.120361328125, 7.3603515625, 7.600341796875, 7.84033203125, 8.080322265625, 8.3203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 28.0, 37.0, 56.0, 79.0, 123.0, 143.0, 154.0, 115.0, 78.0, 54.0, 39.0, 19.0, 17.0, 10.0, 9.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00157928466796875, -0.001536548137664795, -0.0014938116073608398, -0.0014510750770568848, -0.0014083385467529297, -0.0013656020164489746, -0.0013228654861450195, -0.0012801289558410645, -0.0012373924255371094, -0.0011946558952331543, -0.0011519193649291992, -0.0011091828346252441, -0.001066446304321289, -0.001023709774017334, -0.000980973243713379, -0.0009382367134094238, -0.0008955001831054688, -0.0008527636528015137, -0.0008100271224975586, -0.0007672905921936035, -0.0007245540618896484, -0.0006818175315856934, -0.0006390810012817383, -0.0005963444709777832, -0.0005536079406738281, -0.000510871410369873, -0.00046813488006591797, -0.0004253983497619629, -0.0003826618194580078, -0.00033992528915405273, -0.00029718875885009766, -0.0002544522285461426, -0.0002117156982421875, -0.00016897916793823242, -0.00012624263763427734, -8.350610733032227e-05, -4.076957702636719e-05, 1.9669532775878906e-06, 4.470348358154297e-05, 8.744001388549805e-05, 0.00013017654418945312, 0.0001729130744934082, 0.00021564960479736328, 0.00025838613510131836, 0.00030112266540527344, 0.0003438591957092285, 0.0003865957260131836, 0.00042933225631713867, 0.00047206878662109375, 0.0005148053169250488, 0.0005575418472290039, 0.000600278377532959, 0.0006430149078369141, 0.0006857514381408691, 0.0007284879684448242, 0.0007712244987487793, 0.0008139610290527344, 0.0008566975593566895, 0.0008994340896606445, 0.0009421706199645996, 0.0009849071502685547, 0.0010276436805725098, 0.0010703802108764648, 0.00111311674118042, 0.001155853271484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 9.0, 14.0, 14.0, 21.0, 28.0, 37.0, 84.0, 130.0, 203.0, 312.0, 630.0, 1363.0, 3939.0, 15190.0, 95454.0, 609255.0, 275135.0, 35191.0, 7139.0, 2253.0, 937.0, 488.0, 283.0, 154.0, 88.0, 55.0, 36.0, 28.0, 20.0, 11.0, 14.0, 6.0, 6.0, 7.0, 0.0, 2.0, 0.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.7734375, -8.52093505859375, -8.2684326171875, -8.01593017578125, -7.763427734375, -7.51092529296875, -7.2584228515625, -7.00592041015625, -6.75341796875, -6.50091552734375, -6.2484130859375, -5.99591064453125, -5.743408203125, -5.49090576171875, -5.2384033203125, -4.98590087890625, -4.7333984375, -4.48089599609375, -4.2283935546875, -3.97589111328125, -3.723388671875, -3.47088623046875, -3.2183837890625, -2.96588134765625, -2.71337890625, -2.46087646484375, -2.2083740234375, -1.95587158203125, -1.703369140625, -1.45086669921875, -1.1983642578125, -0.94586181640625, -0.693359375, -0.44085693359375, -0.1883544921875, 0.06414794921875, 0.316650390625, 0.56915283203125, 0.8216552734375, 1.07415771484375, 1.32666015625, 1.57916259765625, 1.8316650390625, 2.08416748046875, 2.336669921875, 2.58917236328125, 2.8416748046875, 3.09417724609375, 3.3466796875, 3.59918212890625, 3.8516845703125, 4.10418701171875, 4.356689453125, 4.60919189453125, 4.8616943359375, 5.11419677734375, 5.36669921875, 5.61920166015625, 5.8717041015625, 6.12420654296875, 6.376708984375, 6.62921142578125, 6.8817138671875, 7.13421630859375, 7.38671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 10.0, 11.0, 15.0, 25.0, 29.0, 32.0, 48.0, 70.0, 93.0, 110.0, 101.0, 103.0, 89.0, 63.0, 54.0, 38.0, 36.0, 16.0, 13.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7109375, -9.4505615234375, -9.190185546875, -8.9298095703125, -8.66943359375, -8.4090576171875, -8.148681640625, -7.8883056640625, -7.6279296875, -7.3675537109375, -7.107177734375, -6.8468017578125, -6.58642578125, -6.3260498046875, -6.065673828125, -5.8052978515625, -5.544921875, -5.2845458984375, -5.024169921875, -4.7637939453125, -4.50341796875, -4.2430419921875, -3.982666015625, -3.7222900390625, -3.4619140625, -3.2015380859375, -2.941162109375, -2.6807861328125, -2.42041015625, -2.1600341796875, -1.899658203125, -1.6392822265625, -1.37890625, -1.1185302734375, -0.858154296875, -0.5977783203125, -0.33740234375, -0.0770263671875, 0.183349609375, 0.4437255859375, 0.7041015625, 0.9644775390625, 1.224853515625, 1.4852294921875, 1.74560546875, 2.0059814453125, 2.266357421875, 2.5267333984375, 2.787109375, 3.0474853515625, 3.307861328125, 3.5682373046875, 3.82861328125, 4.0889892578125, 4.349365234375, 4.6097412109375, 4.8701171875, 5.1304931640625, 5.390869140625, 5.6512451171875, 5.91162109375, 6.1719970703125, 6.432373046875, 6.6927490234375, 6.953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 17.0, 58.0, 261.0, 450.0, 178.0, 25.0, 7.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-230.19296264648438, -221.15652465820312, -212.12010192871094, -203.08367919921875, -194.0472412109375, -185.01080322265625, -175.97438049316406, -166.93795776367188, -157.90151977539062, -148.86508178710938, -139.8286590576172, -130.792236328125, -121.75579833984375, -112.71936798095703, -103.68293762207031, -94.6465072631836, -85.61007690429688, -76.57364654541016, -67.53721618652344, -58.50078582763672, -49.46435546875, -40.42792510986328, -31.391494750976562, -22.355064392089844, -13.318634033203125, -4.282203674316406, 4.7542266845703125, 13.790657043457031, 22.82708740234375, 31.86351776123047, 40.89994812011719, 49.936378479003906, 58.9727783203125, 68.00920867919922, 77.04563903808594, 86.08206939697266, 95.11849975585938, 104.1549301147461, 113.19136047363281, 122.22779083251953, 131.26422119140625, 140.3006591796875, 149.3370819091797, 158.37350463867188, 167.40994262695312, 176.44638061523438, 185.48280334472656, 194.51922607421875, 203.5556640625, 212.59210205078125, 221.62852478027344, 230.66494750976562, 239.70138549804688, 248.73782348632812, 257.77423095703125, 266.8106689453125, 275.84710693359375, 284.883544921875, 293.91998291015625, 302.9563903808594, 311.9928283691406, 321.0292663574219, 330.065673828125, 339.10211181640625, 348.1385498046875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 1.0, 2.0, 0.0, 8.0, 8.0, 12.0, 3.0, 18.0, 12.0, 17.0, 29.0, 24.0, 21.0, 32.0, 40.0, 33.0, 30.0, 41.0, 46.0, 40.0, 34.0, 47.0, 38.0, 40.0, 44.0, 42.0, 43.0, 37.0, 26.0, 29.0, 32.0, 13.0, 17.0, 25.0, 16.0, 16.0, 14.0, 8.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.11553955078125, -69.69876098632812, -67.281982421875, -64.86519622802734, -62.44841766357422, -60.031639099121094, -57.6148567199707, -55.19807434082031, -52.78129577636719, -50.36451721191406, -47.94773483276367, -45.53095245361328, -43.114173889160156, -40.69739532470703, -38.28061294555664, -35.86383056640625, -33.447052001953125, -31.030271530151367, -28.61349105834961, -26.19671058654785, -23.779930114746094, -21.363149642944336, -18.946369171142578, -16.52958869934082, -14.112808227539062, -11.696027755737305, -9.279247283935547, -6.862466812133789, -4.445686340332031, -2.0289058685302734, 0.3878746032714844, 2.804655075073242, 5.221443176269531, 7.638223648071289, 10.055004119873047, 12.471784591674805, 14.888565063476562, 17.30534553527832, 19.722126007080078, 22.138906478881836, 24.555686950683594, 26.97246742248535, 29.38924789428711, 31.806028366088867, 34.222808837890625, 36.63958740234375, 39.05636978149414, 41.47315216064453, 43.889930725097656, 46.30670928955078, 48.72349166870117, 51.14027404785156, 53.55705261230469, 55.97383117675781, 58.3906135559082, 60.807395935058594, 63.22417449951172, 65.64095306396484, 68.0577392578125, 70.47451782226562, 72.89129638671875, 75.30807495117188, 77.724853515625, 80.14163970947266, 82.55841827392578]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 2.0, 8.0, 14.0, 10.0, 14.0, 15.0, 20.0, 39.0, 44.0, 57.0, 85.0, 95.0, 153.0, 244.0, 358.0, 660.0, 1278.0, 2838.0, 8025.0, 35370.0, 3910807.0, 204106.0, 19816.0, 5554.0, 2151.0, 1033.0, 505.0, 297.0, 168.0, 126.0, 93.0, 65.0, 59.0, 41.0, 36.0, 22.0, 15.0, 18.0, 14.0, 3.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.25, -15.7965087890625, -15.343017578125, -14.8895263671875, -14.43603515625, -13.9825439453125, -13.529052734375, -13.0755615234375, -12.6220703125, -12.1685791015625, -11.715087890625, -11.2615966796875, -10.80810546875, -10.3546142578125, -9.901123046875, -9.4476318359375, -8.994140625, -8.5406494140625, -8.087158203125, -7.6336669921875, -7.18017578125, -6.7266845703125, -6.273193359375, -5.8197021484375, -5.3662109375, -4.9127197265625, -4.459228515625, -4.0057373046875, -3.55224609375, -3.0987548828125, -2.645263671875, -2.1917724609375, -1.73828125, -1.2847900390625, -0.831298828125, -0.3778076171875, 0.07568359375, 0.5291748046875, 0.982666015625, 1.4361572265625, 1.8896484375, 2.3431396484375, 2.796630859375, 3.2501220703125, 3.70361328125, 4.1571044921875, 4.610595703125, 5.0640869140625, 5.517578125, 5.9710693359375, 6.424560546875, 6.8780517578125, 7.33154296875, 7.7850341796875, 8.238525390625, 8.6920166015625, 9.1455078125, 9.5989990234375, 10.052490234375, 10.5059814453125, 10.95947265625, 11.4129638671875, 11.866455078125, 12.3199462890625, 12.7734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 11.0, 16.0, 17.0, 18.0, 33.0, 43.0, 26.0, 37.0, 53.0, 47.0, 60.0, 65.0, 59.0, 57.0, 59.0, 50.0, 45.0, 41.0, 48.0, 40.0, 31.0, 24.0, 24.0, 11.0, 12.0, 7.0, 3.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.78515625, -4.64996337890625, -4.5147705078125, -4.37957763671875, -4.244384765625, -4.10919189453125, -3.9739990234375, -3.83880615234375, -3.70361328125, -3.56842041015625, -3.4332275390625, -3.29803466796875, -3.162841796875, -3.02764892578125, -2.8924560546875, -2.75726318359375, -2.6220703125, -2.48687744140625, -2.3516845703125, -2.21649169921875, -2.081298828125, -1.94610595703125, -1.8109130859375, -1.67572021484375, -1.54052734375, -1.40533447265625, -1.2701416015625, -1.13494873046875, -0.999755859375, -0.86456298828125, -0.7293701171875, -0.59417724609375, -0.458984375, -0.32379150390625, -0.1885986328125, -0.05340576171875, 0.081787109375, 0.21697998046875, 0.3521728515625, 0.48736572265625, 0.62255859375, 0.75775146484375, 0.8929443359375, 1.02813720703125, 1.163330078125, 1.29852294921875, 1.4337158203125, 1.56890869140625, 1.7041015625, 1.83929443359375, 1.9744873046875, 2.10968017578125, 2.244873046875, 2.38006591796875, 2.5152587890625, 2.65045166015625, 2.78564453125, 2.92083740234375, 3.0560302734375, 3.19122314453125, 3.326416015625, 3.46160888671875, 3.5968017578125, 3.73199462890625, 3.8671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 13.0, 12.0, 16.0, 16.0, 30.0, 36.0, 60.0, 68.0, 147.0, 236.0, 378.0, 646.0, 1187.0, 3280.0, 14262.0, 197595.0, 3940452.0, 27256.0, 5040.0, 1619.0, 807.0, 425.0, 228.0, 154.0, 95.0, 59.0, 57.0, 32.0, 27.0, 14.0, 11.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.5, -19.9896240234375, -19.479248046875, -18.9688720703125, -18.45849609375, -17.9481201171875, -17.437744140625, -16.9273681640625, -16.4169921875, -15.9066162109375, -15.396240234375, -14.8858642578125, -14.37548828125, -13.8651123046875, -13.354736328125, -12.8443603515625, -12.333984375, -11.8236083984375, -11.313232421875, -10.8028564453125, -10.29248046875, -9.7821044921875, -9.271728515625, -8.7613525390625, -8.2509765625, -7.7406005859375, -7.230224609375, -6.7198486328125, -6.20947265625, -5.6990966796875, -5.188720703125, -4.6783447265625, -4.16796875, -3.6575927734375, -3.147216796875, -2.6368408203125, -2.12646484375, -1.6160888671875, -1.105712890625, -0.5953369140625, -0.0849609375, 0.4254150390625, 0.935791015625, 1.4461669921875, 1.95654296875, 2.4669189453125, 2.977294921875, 3.4876708984375, 3.998046875, 4.5084228515625, 5.018798828125, 5.5291748046875, 6.03955078125, 6.5499267578125, 7.060302734375, 7.5706787109375, 8.0810546875, 8.5914306640625, 9.101806640625, 9.6121826171875, 10.12255859375, 10.6329345703125, 11.143310546875, 11.6536865234375, 12.1640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 18.0, 36.0, 74.0, 2950.0, 818.0, 91.0, 32.0, 16.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.1549072265625, -4.020751953125, -3.8865966796875, -3.75244140625, -3.6182861328125, -3.484130859375, -3.3499755859375, -3.2158203125, -3.0816650390625, -2.947509765625, -2.8133544921875, -2.67919921875, -2.5450439453125, -2.410888671875, -2.2767333984375, -2.142578125, -2.0084228515625, -1.874267578125, -1.7401123046875, -1.60595703125, -1.4718017578125, -1.337646484375, -1.2034912109375, -1.0693359375, -0.9351806640625, -0.801025390625, -0.6668701171875, -0.53271484375, -0.3985595703125, -0.264404296875, -0.1302490234375, 0.00390625, 0.1380615234375, 0.272216796875, 0.4063720703125, 0.54052734375, 0.6746826171875, 0.808837890625, 0.9429931640625, 1.0771484375, 1.2113037109375, 1.345458984375, 1.4796142578125, 1.61376953125, 1.7479248046875, 1.882080078125, 2.0162353515625, 2.150390625, 2.2845458984375, 2.418701171875, 2.5528564453125, 2.68701171875, 2.8211669921875, 2.955322265625, 3.0894775390625, 3.2236328125, 3.3577880859375, 3.491943359375, 3.6260986328125, 3.76025390625, 3.8944091796875, 4.028564453125, 4.1627197265625, 4.296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 14.0, 17.0, 26.0, 74.0, 161.0, 237.0, 222.0, 147.0, 55.0, 27.0, 10.0, 5.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.77552318572998, -8.255213737487793, -7.734903335571289, -7.214593887329102, -6.694283962249756, -6.17397403717041, -5.653664588928223, -5.133354663848877, -4.613044738769531, -4.0927348136901855, -3.572425127029419, -3.0521154403686523, -2.5318055152893066, -2.011495590209961, -1.4911859035491943, -0.9708762168884277, -0.45056629180908203, 0.06974351406097412, 0.5900533199310303, 1.1103631258010864, 1.6306729316711426, 2.1509828567504883, 2.671292543411255, 3.1916022300720215, 3.711912155151367, 4.232222080230713, 4.752532005310059, 5.272841453552246, 5.793151378631592, 6.3134613037109375, 6.833770751953125, 7.354080677032471, 7.874391555786133, 8.39470100402832, 8.915011405944824, 9.435320854187012, 9.955631256103516, 10.475940704345703, 10.99625015258789, 11.516559600830078, 12.036870002746582, 12.55717945098877, 13.077489852905273, 13.597799301147461, 14.118108749389648, 14.638419151306152, 15.15872859954834, 15.679039001464844, 16.19934844970703, 16.71965789794922, 17.239967346191406, 17.760278701782227, 18.280588150024414, 18.8008975982666, 19.32120704650879, 19.841516494750977, 20.361827850341797, 20.882137298583984, 21.402446746826172, 21.922758102416992, 22.44306755065918, 22.963376998901367, 23.483686447143555, 24.003995895385742, 24.52430534362793]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 13.0, 10.0, 6.0, 11.0, 15.0, 15.0, 22.0, 15.0, 25.0, 19.0, 25.0, 25.0, 23.0, 27.0, 32.0, 31.0, 38.0, 38.0, 47.0, 34.0, 40.0, 41.0, 43.0, 40.0, 46.0, 40.0, 35.0, 24.0, 33.0, 24.0, 23.0, 25.0, 13.0, 20.0, 6.0, 11.0, 13.0, 15.0, 8.0, 1.0, 8.0, 1.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.721169948577881, -4.57758092880249, -4.433992385864258, -4.290403366088867, -4.146814346313477, -4.003225326538086, -3.8596365451812744, -3.716047763824463, -3.5724587440490723, -3.4288697242736816, -3.28528094291687, -3.1416921615600586, -2.998103141784668, -2.8545141220092773, -2.710925340652466, -2.5673365592956543, -2.4237475395202637, -2.280158519744873, -2.1365697383880615, -1.9929808378219604, -1.8493919372558594, -1.7058030366897583, -1.5622141361236572, -1.4186252355575562, -1.275036334991455, -1.131447434425354, -0.9878585338592529, -0.8442696332931519, -0.7006807327270508, -0.5570918321609497, -0.41350293159484863, -0.26991403102874756, -0.12632513046264648, 0.01726377010345459, 0.16085267066955566, 0.30444157123565674, 0.4480304718017578, 0.5916193723678589, 0.73520827293396, 0.878797173500061, 1.022386074066162, 1.1659749746322632, 1.3095638751983643, 1.4531527757644653, 1.5967416763305664, 1.7403305768966675, 1.8839194774627686, 2.02750825881958, 2.1710972785949707, 2.3146862983703613, 2.458275079727173, 2.6018638610839844, 2.745452880859375, 2.8890419006347656, 3.032630681991577, 3.1762194633483887, 3.3198084831237793, 3.46339750289917, 3.6069862842559814, 3.750575065612793, 3.8941640853881836, 4.037753105163574, 4.181342124938965, 4.324930667877197, 4.468519687652588]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 20.0, 13.0, 18.0, 27.0, 45.0, 59.0, 92.0, 160.0, 302.0, 655.0, 1650.0, 4961.0, 16905.0, 68960.0, 284022.0, 458565.0, 159725.0, 37518.0, 9730.0, 2933.0, 1136.0, 443.0, 235.0, 133.0, 66.0, 50.0, 35.0, 29.0, 16.0, 15.0, 5.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.9407958984375, -11.592529296875, -11.2442626953125, -10.89599609375, -10.5477294921875, -10.199462890625, -9.8511962890625, -9.5029296875, -9.1546630859375, -8.806396484375, -8.4581298828125, -8.10986328125, -7.7615966796875, -7.413330078125, -7.0650634765625, -6.716796875, -6.3685302734375, -6.020263671875, -5.6719970703125, -5.32373046875, -4.9754638671875, -4.627197265625, -4.2789306640625, -3.9306640625, -3.5823974609375, -3.234130859375, -2.8858642578125, -2.53759765625, -2.1893310546875, -1.841064453125, -1.4927978515625, -1.14453125, -0.7962646484375, -0.447998046875, -0.0997314453125, 0.24853515625, 0.5968017578125, 0.945068359375, 1.2933349609375, 1.6416015625, 1.9898681640625, 2.338134765625, 2.6864013671875, 3.03466796875, 3.3829345703125, 3.731201171875, 4.0794677734375, 4.427734375, 4.7760009765625, 5.124267578125, 5.4725341796875, 5.82080078125, 6.1690673828125, 6.517333984375, 6.8656005859375, 7.2138671875, 7.5621337890625, 7.910400390625, 8.2586669921875, 8.60693359375, 8.9552001953125, 9.303466796875, 9.6517333984375, 10.0]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 14.0, 20.0, 17.0, 36.0, 26.0, 38.0, 33.0, 45.0, 48.0, 50.0, 66.0, 63.0, 56.0, 61.0, 59.0, 58.0, 41.0, 48.0, 34.0, 34.0, 28.0, 23.0, 16.0, 15.0, 11.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.78485107421875, -4.6439208984375, -4.50299072265625, -4.362060546875, -4.22113037109375, -4.0802001953125, -3.93927001953125, -3.79833984375, -3.65740966796875, -3.5164794921875, -3.37554931640625, -3.234619140625, -3.09368896484375, -2.9527587890625, -2.81182861328125, -2.6708984375, -2.52996826171875, -2.3890380859375, -2.24810791015625, -2.107177734375, -1.96624755859375, -1.8253173828125, -1.68438720703125, -1.54345703125, -1.40252685546875, -1.2615966796875, -1.12066650390625, -0.979736328125, -0.83880615234375, -0.6978759765625, -0.55694580078125, -0.416015625, -0.27508544921875, -0.1341552734375, 0.00677490234375, 0.147705078125, 0.28863525390625, 0.4295654296875, 0.57049560546875, 0.71142578125, 0.85235595703125, 0.9932861328125, 1.13421630859375, 1.275146484375, 1.41607666015625, 1.5570068359375, 1.69793701171875, 1.8388671875, 1.97979736328125, 2.1207275390625, 2.26165771484375, 2.402587890625, 2.54351806640625, 2.6844482421875, 2.82537841796875, 2.96630859375, 3.10723876953125, 3.2481689453125, 3.38909912109375, 3.530029296875, 3.67095947265625, 3.8118896484375, 3.95281982421875, 4.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 9.0, 17.0, 21.0, 26.0, 39.0, 38.0, 67.0, 103.0, 121.0, 171.0, 253.0, 330.0, 499.0, 906.0, 1872.0, 5406.0, 26603.0, 211315.0, 659698.0, 116835.0, 16498.0, 3924.0, 1450.0, 758.0, 461.0, 314.0, 214.0, 174.0, 97.0, 80.0, 63.0, 45.0, 33.0, 19.0, 30.0, 11.0, 10.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.11572265625, -12.6533203125, -12.19091796875, -11.728515625, -11.26611328125, -10.8037109375, -10.34130859375, -9.87890625, -9.41650390625, -8.9541015625, -8.49169921875, -8.029296875, -7.56689453125, -7.1044921875, -6.64208984375, -6.1796875, -5.71728515625, -5.2548828125, -4.79248046875, -4.330078125, -3.86767578125, -3.4052734375, -2.94287109375, -2.48046875, -2.01806640625, -1.5556640625, -1.09326171875, -0.630859375, -0.16845703125, 0.2939453125, 0.75634765625, 1.21875, 1.68115234375, 2.1435546875, 2.60595703125, 3.068359375, 3.53076171875, 3.9931640625, 4.45556640625, 4.91796875, 5.38037109375, 5.8427734375, 6.30517578125, 6.767578125, 7.22998046875, 7.6923828125, 8.15478515625, 8.6171875, 9.07958984375, 9.5419921875, 10.00439453125, 10.466796875, 10.92919921875, 11.3916015625, 11.85400390625, 12.31640625, 12.77880859375, 13.2412109375, 13.70361328125, 14.166015625, 14.62841796875, 15.0908203125, 15.55322265625, 16.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 6.0, 12.0, 12.0, 14.0, 23.0, 22.0, 24.0, 39.0, 38.0, 43.0, 53.0, 50.0, 50.0, 43.0, 55.0, 62.0, 56.0, 50.0, 40.0, 48.0, 36.0, 40.0, 29.0, 26.0, 30.0, 20.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.029541015625, -19.30908203125, -18.588623046875, -17.8681640625, -17.147705078125, -16.42724609375, -15.706787109375, -14.986328125, -14.265869140625, -13.54541015625, -12.824951171875, -12.1044921875, -11.384033203125, -10.66357421875, -9.943115234375, -9.22265625, -8.502197265625, -7.78173828125, -7.061279296875, -6.3408203125, -5.620361328125, -4.89990234375, -4.179443359375, -3.458984375, -2.738525390625, -2.01806640625, -1.297607421875, -0.5771484375, 0.143310546875, 0.86376953125, 1.584228515625, 2.3046875, 3.025146484375, 3.74560546875, 4.466064453125, 5.1865234375, 5.906982421875, 6.62744140625, 7.347900390625, 8.068359375, 8.788818359375, 9.50927734375, 10.229736328125, 10.9501953125, 11.670654296875, 12.39111328125, 13.111572265625, 13.83203125, 14.552490234375, 15.27294921875, 15.993408203125, 16.7138671875, 17.434326171875, 18.15478515625, 18.875244140625, 19.595703125, 20.316162109375, 21.03662109375, 21.757080078125, 22.4775390625, 23.197998046875, 23.91845703125, 24.638916015625, 25.359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 11.0, 22.0, 20.0, 35.0, 49.0, 100.0, 145.0, 249.0, 642.0, 1487.0, 5138.0, 25755.0, 223095.0, 666383.0, 105531.0, 14450.0, 3315.0, 1121.0, 445.0, 222.0, 122.0, 66.0, 43.0, 25.0, 20.0, 16.0, 11.0, 7.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.76617431640625, -7.5635986328125, -7.36102294921875, -7.158447265625, -6.95587158203125, -6.7532958984375, -6.55072021484375, -6.34814453125, -6.14556884765625, -5.9429931640625, -5.74041748046875, -5.537841796875, -5.33526611328125, -5.1326904296875, -4.93011474609375, -4.7275390625, -4.52496337890625, -4.3223876953125, -4.11981201171875, -3.917236328125, -3.71466064453125, -3.5120849609375, -3.30950927734375, -3.10693359375, -2.90435791015625, -2.7017822265625, -2.49920654296875, -2.296630859375, -2.09405517578125, -1.8914794921875, -1.68890380859375, -1.486328125, -1.28375244140625, -1.0811767578125, -0.87860107421875, -0.676025390625, -0.47344970703125, -0.2708740234375, -0.06829833984375, 0.13427734375, 0.33685302734375, 0.5394287109375, 0.74200439453125, 0.944580078125, 1.14715576171875, 1.3497314453125, 1.55230712890625, 1.7548828125, 1.95745849609375, 2.1600341796875, 2.36260986328125, 2.565185546875, 2.76776123046875, 2.9703369140625, 3.17291259765625, 3.37548828125, 3.57806396484375, 3.7806396484375, 3.98321533203125, 4.185791015625, 4.38836669921875, 4.5909423828125, 4.79351806640625, 4.99609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 16.0, 28.0, 20.0, 43.0, 53.0, 68.0, 68.0, 86.0, 107.0, 98.0, 96.0, 67.0, 54.0, 49.0, 32.0, 18.0, 14.0, 14.0, 12.0, 9.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.000655055046081543, -0.0006330013275146484, -0.0006109476089477539, -0.0005888938903808594, -0.0005668401718139648, -0.0005447864532470703, -0.0005227327346801758, -0.0005006790161132812, -0.0004786252975463867, -0.0004565715789794922, -0.00043451786041259766, -0.0004124641418457031, -0.0003904104232788086, -0.00036835670471191406, -0.00034630298614501953, -0.000324249267578125, -0.00030219554901123047, -0.00028014183044433594, -0.0002580881118774414, -0.00023603439331054688, -0.00021398067474365234, -0.0001919269561767578, -0.00016987323760986328, -0.00014781951904296875, -0.00012576580047607422, -0.00010371208190917969, -8.165836334228516e-05, -5.9604644775390625e-05, -3.7550926208496094e-05, -1.5497207641601562e-05, 6.556510925292969e-06, 2.86102294921875e-05, 5.066394805908203e-05, 7.271766662597656e-05, 9.47713851928711e-05, 0.00011682510375976562, 0.00013887882232666016, 0.0001609325408935547, 0.00018298625946044922, 0.00020503997802734375, 0.00022709369659423828, 0.0002491474151611328, 0.00027120113372802734, 0.0002932548522949219, 0.0003153085708618164, 0.00033736228942871094, 0.00035941600799560547, 0.0003814697265625, 0.00040352344512939453, 0.00042557716369628906, 0.0004476308822631836, 0.0004696846008300781, 0.0004917383193969727, 0.0005137920379638672, 0.0005358457565307617, 0.0005578994750976562, 0.0005799531936645508, 0.0006020069122314453, 0.0006240606307983398, 0.0006461143493652344, 0.0006681680679321289, 0.0006902217864990234, 0.000712275505065918, 0.0007343292236328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 11.0, 7.0, 14.0, 16.0, 19.0, 35.0, 56.0, 88.0, 132.0, 228.0, 418.0, 838.0, 2013.0, 6694.0, 42405.0, 460080.0, 479923.0, 44547.0, 7004.0, 2075.0, 891.0, 451.0, 247.0, 123.0, 75.0, 51.0, 30.0, 21.0, 15.0, 9.0, 12.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.9356689453125, -6.718994140625, -6.5023193359375, -6.28564453125, -6.0689697265625, -5.852294921875, -5.6356201171875, -5.4189453125, -5.2022705078125, -4.985595703125, -4.7689208984375, -4.55224609375, -4.3355712890625, -4.118896484375, -3.9022216796875, -3.685546875, -3.4688720703125, -3.252197265625, -3.0355224609375, -2.81884765625, -2.6021728515625, -2.385498046875, -2.1688232421875, -1.9521484375, -1.7354736328125, -1.518798828125, -1.3021240234375, -1.08544921875, -0.8687744140625, -0.652099609375, -0.4354248046875, -0.21875, -0.0020751953125, 0.214599609375, 0.4312744140625, 0.64794921875, 0.8646240234375, 1.081298828125, 1.2979736328125, 1.5146484375, 1.7313232421875, 1.947998046875, 2.1646728515625, 2.38134765625, 2.5980224609375, 2.814697265625, 3.0313720703125, 3.248046875, 3.4647216796875, 3.681396484375, 3.8980712890625, 4.11474609375, 4.3314208984375, 4.548095703125, 4.7647705078125, 4.9814453125, 5.1981201171875, 5.414794921875, 5.6314697265625, 5.84814453125, 6.0648193359375, 6.281494140625, 6.4981689453125, 6.71484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 12.0, 15.0, 20.0, 28.0, 35.0, 63.0, 75.0, 107.0, 121.0, 123.0, 109.0, 86.0, 65.0, 46.0, 37.0, 20.0, 18.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.16302490234375, -5.8846435546875, -5.60626220703125, -5.327880859375, -5.04949951171875, -4.7711181640625, -4.49273681640625, -4.21435546875, -3.93597412109375, -3.6575927734375, -3.37921142578125, -3.100830078125, -2.82244873046875, -2.5440673828125, -2.26568603515625, -1.9873046875, -1.70892333984375, -1.4305419921875, -1.15216064453125, -0.873779296875, -0.59539794921875, -0.3170166015625, -0.03863525390625, 0.23974609375, 0.51812744140625, 0.7965087890625, 1.07489013671875, 1.353271484375, 1.63165283203125, 1.9100341796875, 2.18841552734375, 2.466796875, 2.74517822265625, 3.0235595703125, 3.30194091796875, 3.580322265625, 3.85870361328125, 4.1370849609375, 4.41546630859375, 4.69384765625, 4.97222900390625, 5.2506103515625, 5.52899169921875, 5.807373046875, 6.08575439453125, 6.3641357421875, 6.64251708984375, 6.9208984375, 7.19927978515625, 7.4776611328125, 7.75604248046875, 8.034423828125, 8.31280517578125, 8.5911865234375, 8.86956787109375, 9.14794921875, 9.42633056640625, 9.7047119140625, 9.98309326171875, 10.261474609375, 10.53985595703125, 10.8182373046875, 11.09661865234375, 11.375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 29.0, 55.0, 146.0, 262.0, 282.0, 147.0, 48.0, 22.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.33538055419922, -60.4007568359375, -54.46613311767578, -48.53150939941406, -42.596885681152344, -36.662261962890625, -30.727638244628906, -24.793014526367188, -18.85839080810547, -12.92376708984375, -6.989143371582031, -1.0545196533203125, 4.880104064941406, 10.814727783203125, 16.749351501464844, 22.683975219726562, 28.61859893798828, 34.55322265625, 40.48784637451172, 46.42247009277344, 52.357093811035156, 58.291717529296875, 64.2263412475586, 70.16096496582031, 76.09558868408203, 82.03021240234375, 87.96483612060547, 93.89945983886719, 99.8340835571289, 105.76870727539062, 111.70333099365234, 117.63795471191406, 123.57257080078125, 129.5072021484375, 135.4418182373047, 141.37643432617188, 147.31106567382812, 153.24569702148438, 159.18031311035156, 165.11492919921875, 171.049560546875, 176.98419189453125, 182.91880798339844, 188.85342407226562, 194.78805541992188, 200.72268676757812, 206.6573028564453, 212.5919189453125, 218.52655029296875, 224.461181640625, 230.3957977294922, 236.33041381835938, 242.26504516601562, 248.19967651367188, 254.13429260253906, 260.06890869140625, 266.0035400390625, 271.93817138671875, 277.872802734375, 283.8074035644531, 289.7420349121094, 295.6766662597656, 301.61126708984375, 307.5458984375, 313.48052978515625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 8.0, 5.0, 13.0, 7.0, 12.0, 15.0, 27.0, 17.0, 29.0, 40.0, 24.0, 36.0, 40.0, 40.0, 45.0, 49.0, 60.0, 55.0, 44.0, 53.0, 46.0, 39.0, 45.0, 23.0, 40.0, 28.0, 26.0, 25.0, 15.0, 17.0, 11.0, 12.0, 5.0, 7.0, 5.0, 10.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.71615600585938, -71.97296905517578, -69.22978973388672, -66.48660278320312, -63.74342346191406, -61.00023651123047, -58.25705337524414, -55.51387023925781, -52.770687103271484, -50.027503967285156, -47.28432083129883, -44.5411376953125, -41.797950744628906, -39.054771423339844, -36.31158447265625, -33.56840133666992, -30.825218200683594, -28.082035064697266, -25.338851928710938, -22.595666885375977, -19.85248374938965, -17.10930061340332, -14.36611557006836, -11.622932434082031, -8.879749298095703, -6.136565685272217, -3.3933820724487305, -0.6501979827880859, 2.092985153198242, 4.83616828918457, 7.579353332519531, 10.32253646850586, 13.065719604492188, 15.808902740478516, 18.552085876464844, 21.295270919799805, 24.038454055786133, 26.78163719177246, 29.524822235107422, 32.26800537109375, 35.01118850708008, 37.754371643066406, 40.497554779052734, 43.24073791503906, 45.983924865722656, 48.72710418701172, 51.47029113769531, 54.21347427368164, 56.95665740966797, 59.6998405456543, 62.443023681640625, 65.18621063232422, 67.92938995361328, 70.67257690429688, 73.41575622558594, 76.15894317626953, 78.90213012695312, 81.64531707763672, 84.38849639892578, 87.13168334960938, 89.87486267089844, 92.61804962158203, 95.36123657226562, 98.10441589355469, 100.84759521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 11.0, 7.0, 9.0, 12.0, 19.0, 21.0, 31.0, 45.0, 74.0, 107.0, 169.0, 245.0, 388.0, 653.0, 1217.0, 2262.0, 4828.0, 12191.0, 40856.0, 406813.0, 3646729.0, 51807.0, 14265.0, 5657.0, 2555.0, 1396.0, 773.0, 427.0, 258.0, 142.0, 90.0, 69.0, 39.0, 32.0, 24.0, 15.0, 12.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-7.62109375, -7.39068603515625, -7.1602783203125, -6.92987060546875, -6.699462890625, -6.46905517578125, -6.2386474609375, -6.00823974609375, -5.77783203125, -5.54742431640625, -5.3170166015625, -5.08660888671875, -4.856201171875, -4.62579345703125, -4.3953857421875, -4.16497802734375, -3.9345703125, -3.70416259765625, -3.4737548828125, -3.24334716796875, -3.012939453125, -2.78253173828125, -2.5521240234375, -2.32171630859375, -2.09130859375, -1.86090087890625, -1.6304931640625, -1.40008544921875, -1.169677734375, -0.93927001953125, -0.7088623046875, -0.47845458984375, -0.248046875, -0.01763916015625, 0.2127685546875, 0.44317626953125, 0.673583984375, 0.90399169921875, 1.1343994140625, 1.36480712890625, 1.59521484375, 1.82562255859375, 2.0560302734375, 2.28643798828125, 2.516845703125, 2.74725341796875, 2.9776611328125, 3.20806884765625, 3.4384765625, 3.66888427734375, 3.8992919921875, 4.12969970703125, 4.360107421875, 4.59051513671875, 4.8209228515625, 5.05133056640625, 5.28173828125, 5.51214599609375, 5.7425537109375, 5.97296142578125, 6.203369140625, 6.43377685546875, 6.6641845703125, 6.89459228515625, 7.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 17.0, 17.0, 16.0, 31.0, 44.0, 36.0, 47.0, 57.0, 59.0, 58.0, 78.0, 69.0, 64.0, 56.0, 61.0, 44.0, 40.0, 51.0, 22.0, 24.0, 22.0, 14.0, 9.0, 13.0, 5.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.8143310546875, -4.659912109375, -4.5054931640625, -4.35107421875, -4.1966552734375, -4.042236328125, -3.8878173828125, -3.7333984375, -3.5789794921875, -3.424560546875, -3.2701416015625, -3.11572265625, -2.9613037109375, -2.806884765625, -2.6524658203125, -2.498046875, -2.3436279296875, -2.189208984375, -2.0347900390625, -1.88037109375, -1.7259521484375, -1.571533203125, -1.4171142578125, -1.2626953125, -1.1082763671875, -0.953857421875, -0.7994384765625, -0.64501953125, -0.4906005859375, -0.336181640625, -0.1817626953125, -0.02734375, 0.1270751953125, 0.281494140625, 0.4359130859375, 0.59033203125, 0.7447509765625, 0.899169921875, 1.0535888671875, 1.2080078125, 1.3624267578125, 1.516845703125, 1.6712646484375, 1.82568359375, 1.9801025390625, 2.134521484375, 2.2889404296875, 2.443359375, 2.5977783203125, 2.752197265625, 2.9066162109375, 3.06103515625, 3.2154541015625, 3.369873046875, 3.5242919921875, 3.6787109375, 3.8331298828125, 3.987548828125, 4.1419677734375, 4.29638671875, 4.4508056640625, 4.605224609375, 4.7596435546875, 4.9140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 10.0, 16.0, 18.0, 29.0, 45.0, 53.0, 71.0, 85.0, 123.0, 176.0, 274.0, 430.0, 720.0, 1312.0, 2585.0, 6075.0, 16397.0, 65891.0, 3653314.0, 382646.0, 42057.0, 12224.0, 4662.0, 2126.0, 1099.0, 637.0, 363.0, 233.0, 163.0, 135.0, 72.0, 55.0, 49.0, 32.0, 30.0, 16.0, 13.0, 11.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.87890625, -7.6651611328125, -7.451416015625, -7.2376708984375, -7.02392578125, -6.8101806640625, -6.596435546875, -6.3826904296875, -6.1689453125, -5.9552001953125, -5.741455078125, -5.5277099609375, -5.31396484375, -5.1002197265625, -4.886474609375, -4.6727294921875, -4.458984375, -4.2452392578125, -4.031494140625, -3.8177490234375, -3.60400390625, -3.3902587890625, -3.176513671875, -2.9627685546875, -2.7490234375, -2.5352783203125, -2.321533203125, -2.1077880859375, -1.89404296875, -1.6802978515625, -1.466552734375, -1.2528076171875, -1.0390625, -0.8253173828125, -0.611572265625, -0.3978271484375, -0.18408203125, 0.0296630859375, 0.243408203125, 0.4571533203125, 0.6708984375, 0.8846435546875, 1.098388671875, 1.3121337890625, 1.52587890625, 1.7396240234375, 1.953369140625, 2.1671142578125, 2.380859375, 2.5946044921875, 2.808349609375, 3.0220947265625, 3.23583984375, 3.4495849609375, 3.663330078125, 3.8770751953125, 4.0908203125, 4.3045654296875, 4.518310546875, 4.7320556640625, 4.94580078125, 5.1595458984375, 5.373291015625, 5.5870361328125, 5.80078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 18.0, 24.0, 34.0, 91.0, 309.0, 3224.0, 219.0, 61.0, 29.0, 16.0, 10.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.828826904296875, -3.73382568359375, -3.638824462890625, -3.5438232421875, -3.448822021484375, -3.35382080078125, -3.258819580078125, -3.163818359375, -3.068817138671875, -2.97381591796875, -2.878814697265625, -2.7838134765625, -2.688812255859375, -2.59381103515625, -2.498809814453125, -2.40380859375, -2.308807373046875, -2.21380615234375, -2.118804931640625, -2.0238037109375, -1.928802490234375, -1.83380126953125, -1.738800048828125, -1.643798828125, -1.548797607421875, -1.45379638671875, -1.358795166015625, -1.2637939453125, -1.168792724609375, -1.07379150390625, -0.978790283203125, -0.8837890625, -0.788787841796875, -0.69378662109375, -0.598785400390625, -0.5037841796875, -0.408782958984375, -0.31378173828125, -0.218780517578125, -0.123779296875, -0.028778076171875, 0.06622314453125, 0.161224365234375, 0.2562255859375, 0.351226806640625, 0.44622802734375, 0.541229248046875, 0.63623046875, 0.731231689453125, 0.82623291015625, 0.921234130859375, 1.0162353515625, 1.111236572265625, 1.20623779296875, 1.301239013671875, 1.396240234375, 1.491241455078125, 1.58624267578125, 1.681243896484375, 1.7762451171875, 1.871246337890625, 1.96624755859375, 2.061248779296875, 2.15625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 25.0, 72.0, 307.0, 394.0, 157.0, 33.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.83179473876953, -34.04258346557617, -33.25336837768555, -32.46415710449219, -31.674945831298828, -30.885732650756836, -30.096519470214844, -29.307308197021484, -28.518095016479492, -27.7288818359375, -26.93967056274414, -26.15045738220215, -25.361244201660156, -24.572032928466797, -23.782819747924805, -22.993606567382812, -22.204395294189453, -21.41518211364746, -20.6259708404541, -19.83675765991211, -19.04754638671875, -18.258333206176758, -17.469120025634766, -16.679908752441406, -15.890695571899414, -15.101483345031738, -14.312271118164062, -13.52305793762207, -12.733845710754395, -11.944633483886719, -11.155420303344727, -10.36620807647705, -9.576997756958008, -8.787785530090332, -7.998572826385498, -7.209360122680664, -6.420147895812988, -5.6309356689453125, -4.8417229652404785, -4.0525102615356445, -3.2632980346679688, -2.474085569381714, -1.684873104095459, -0.8956606388092041, -0.10644817352294922, 0.6827642917633057, 1.4719767570495605, 2.2611894607543945, 3.0504016876220703, 3.839614152908325, 4.62882661819458, 5.418039321899414, 6.20725154876709, 6.996463775634766, 7.7856764793396, 8.574889183044434, 9.36410140991211, 10.153313636779785, 10.942525863647461, 11.731739044189453, 12.520951271057129, 13.310163497924805, 14.099376678466797, 14.888588905334473, 15.677801132202148]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 3.0, 8.0, 11.0, 14.0, 13.0, 18.0, 19.0, 28.0, 21.0, 25.0, 30.0, 27.0, 24.0, 40.0, 34.0, 37.0, 40.0, 38.0, 46.0, 26.0, 42.0, 40.0, 38.0, 30.0, 49.0, 28.0, 30.0, 23.0, 23.0, 23.0, 24.0, 25.0, 15.0, 13.0, 13.0, 16.0, 15.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.446737766265869, -3.3314435482025146, -3.21614933013916, -3.1008553504943848, -2.9855611324310303, -2.870266914367676, -2.7549726963043213, -2.639678478240967, -2.5243844985961914, -2.409090280532837, -2.2937960624694824, -2.178502082824707, -2.0632078647613525, -1.947913646697998, -1.8326194286346436, -1.717325210571289, -1.6020309925079346, -1.48673677444458, -1.3714426755905151, -1.2561484575271606, -1.1408543586730957, -1.0255601406097412, -0.9102659225463867, -0.794971764087677, -0.6796776056289673, -0.5643834471702576, -0.44908925890922546, -0.33379507064819336, -0.21850091218948364, -0.10320675373077393, 0.012087464332580566, 0.12738162279129028, 0.24267578125, 0.3579699397087097, 0.4732641279697418, 0.5885583162307739, 0.7038524746894836, 0.8191466331481934, 0.9344408512115479, 1.0497350692749023, 1.1650291681289673, 1.2803233861923218, 1.3956174850463867, 1.5109117031097412, 1.6262059211730957, 1.7415000200271606, 1.8567942380905151, 1.97208833694458, 2.0873825550079346, 2.202676773071289, 2.3179709911346436, 2.433265209197998, 2.5485591888427734, 2.663853406906128, 2.7791476249694824, 2.894441843032837, 3.0097360610961914, 3.125030279159546, 3.2403244972229004, 3.355618476867676, 3.4709126949310303, 3.5862069129943848, 3.7015011310577393, 3.8167953491210938, 3.932089328765869]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 3.0, 14.0, 11.0, 29.0, 35.0, 46.0, 57.0, 101.0, 181.0, 308.0, 492.0, 1021.0, 2218.0, 5228.0, 13665.0, 39933.0, 122785.0, 309499.0, 335294.0, 143692.0, 47092.0, 15977.0, 5830.0, 2471.0, 1142.0, 542.0, 333.0, 195.0, 110.0, 68.0, 40.0, 31.0, 25.0, 27.0, 13.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.9375, -6.72119140625, -6.5048828125, -6.28857421875, -6.072265625, -5.85595703125, -5.6396484375, -5.42333984375, -5.20703125, -4.99072265625, -4.7744140625, -4.55810546875, -4.341796875, -4.12548828125, -3.9091796875, -3.69287109375, -3.4765625, -3.26025390625, -3.0439453125, -2.82763671875, -2.611328125, -2.39501953125, -2.1787109375, -1.96240234375, -1.74609375, -1.52978515625, -1.3134765625, -1.09716796875, -0.880859375, -0.66455078125, -0.4482421875, -0.23193359375, -0.015625, 0.20068359375, 0.4169921875, 0.63330078125, 0.849609375, 1.06591796875, 1.2822265625, 1.49853515625, 1.71484375, 1.93115234375, 2.1474609375, 2.36376953125, 2.580078125, 2.79638671875, 3.0126953125, 3.22900390625, 3.4453125, 3.66162109375, 3.8779296875, 4.09423828125, 4.310546875, 4.52685546875, 4.7431640625, 4.95947265625, 5.17578125, 5.39208984375, 5.6083984375, 5.82470703125, 6.041015625, 6.25732421875, 6.4736328125, 6.68994140625, 6.90625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 15.0, 13.0, 15.0, 13.0, 29.0, 30.0, 31.0, 46.0, 40.0, 46.0, 51.0, 56.0, 55.0, 69.0, 61.0, 59.0, 49.0, 48.0, 39.0, 34.0, 40.0, 36.0, 14.0, 27.0, 17.0, 11.0, 4.0, 10.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.13360595703125, -3.9976806640625, -3.86175537109375, -3.725830078125, -3.58990478515625, -3.4539794921875, -3.31805419921875, -3.18212890625, -3.04620361328125, -2.9102783203125, -2.77435302734375, -2.638427734375, -2.50250244140625, -2.3665771484375, -2.23065185546875, -2.0947265625, -1.95880126953125, -1.8228759765625, -1.68695068359375, -1.551025390625, -1.41510009765625, -1.2791748046875, -1.14324951171875, -1.00732421875, -0.87139892578125, -0.7354736328125, -0.59954833984375, -0.463623046875, -0.32769775390625, -0.1917724609375, -0.05584716796875, 0.080078125, 0.21600341796875, 0.3519287109375, 0.48785400390625, 0.623779296875, 0.75970458984375, 0.8956298828125, 1.03155517578125, 1.16748046875, 1.30340576171875, 1.4393310546875, 1.57525634765625, 1.711181640625, 1.84710693359375, 1.9830322265625, 2.11895751953125, 2.2548828125, 2.39080810546875, 2.5267333984375, 2.66265869140625, 2.798583984375, 2.93450927734375, 3.0704345703125, 3.20635986328125, 3.34228515625, 3.47821044921875, 3.6141357421875, 3.75006103515625, 3.885986328125, 4.02191162109375, 4.1578369140625, 4.29376220703125, 4.4296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 0.0, 3.0, 6.0, 14.0, 7.0, 18.0, 18.0, 23.0, 26.0, 49.0, 37.0, 60.0, 71.0, 120.0, 170.0, 236.0, 333.0, 458.0, 716.0, 1176.0, 2254.0, 5797.0, 21789.0, 117672.0, 558553.0, 274971.0, 45730.0, 10223.0, 3525.0, 1584.0, 920.0, 567.0, 373.0, 298.0, 191.0, 143.0, 120.0, 69.0, 55.0, 42.0, 32.0, 30.0, 15.0, 15.0, 7.0, 10.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.703125, -9.3973388671875, -9.091552734375, -8.7857666015625, -8.47998046875, -8.1741943359375, -7.868408203125, -7.5626220703125, -7.2568359375, -6.9510498046875, -6.645263671875, -6.3394775390625, -6.03369140625, -5.7279052734375, -5.422119140625, -5.1163330078125, -4.810546875, -4.5047607421875, -4.198974609375, -3.8931884765625, -3.58740234375, -3.2816162109375, -2.975830078125, -2.6700439453125, -2.3642578125, -2.0584716796875, -1.752685546875, -1.4468994140625, -1.14111328125, -0.8353271484375, -0.529541015625, -0.2237548828125, 0.08203125, 0.3878173828125, 0.693603515625, 0.9993896484375, 1.30517578125, 1.6109619140625, 1.916748046875, 2.2225341796875, 2.5283203125, 2.8341064453125, 3.139892578125, 3.4456787109375, 3.75146484375, 4.0572509765625, 4.363037109375, 4.6688232421875, 4.974609375, 5.2803955078125, 5.586181640625, 5.8919677734375, 6.19775390625, 6.5035400390625, 6.809326171875, 7.1151123046875, 7.4208984375, 7.7266845703125, 8.032470703125, 8.3382568359375, 8.64404296875, 8.9498291015625, 9.255615234375, 9.5614013671875, 9.8671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 4.0, 12.0, 12.0, 15.0, 14.0, 7.0, 21.0, 16.0, 19.0, 40.0, 36.0, 37.0, 27.0, 43.0, 52.0, 56.0, 40.0, 71.0, 50.0, 48.0, 56.0, 49.0, 46.0, 30.0, 34.0, 27.0, 31.0, 27.0, 18.0, 9.0, 12.0, 8.0, 5.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.296875, -17.725830078125, -17.15478515625, -16.583740234375, -16.0126953125, -15.441650390625, -14.87060546875, -14.299560546875, -13.728515625, -13.157470703125, -12.58642578125, -12.015380859375, -11.4443359375, -10.873291015625, -10.30224609375, -9.731201171875, -9.16015625, -8.589111328125, -8.01806640625, -7.447021484375, -6.8759765625, -6.304931640625, -5.73388671875, -5.162841796875, -4.591796875, -4.020751953125, -3.44970703125, -2.878662109375, -2.3076171875, -1.736572265625, -1.16552734375, -0.594482421875, -0.0234375, 0.547607421875, 1.11865234375, 1.689697265625, 2.2607421875, 2.831787109375, 3.40283203125, 3.973876953125, 4.544921875, 5.115966796875, 5.68701171875, 6.258056640625, 6.8291015625, 7.400146484375, 7.97119140625, 8.542236328125, 9.11328125, 9.684326171875, 10.25537109375, 10.826416015625, 11.3974609375, 11.968505859375, 12.53955078125, 13.110595703125, 13.681640625, 14.252685546875, 14.82373046875, 15.394775390625, 15.9658203125, 16.536865234375, 17.10791015625, 17.678955078125, 18.25]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 13.0, 10.0, 28.0, 49.0, 126.0, 412.0, 1737.0, 34403.0, 982393.0, 27160.0, 1547.0, 418.0, 129.0, 62.0, 35.0, 16.0, 12.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.8502197265625, -8.395751953125, -7.9412841796875, -7.48681640625, -7.0323486328125, -6.577880859375, -6.1234130859375, -5.6689453125, -5.2144775390625, -4.760009765625, -4.3055419921875, -3.85107421875, -3.3966064453125, -2.942138671875, -2.4876708984375, -2.033203125, -1.5787353515625, -1.124267578125, -0.6697998046875, -0.21533203125, 0.2391357421875, 0.693603515625, 1.1480712890625, 1.6025390625, 2.0570068359375, 2.511474609375, 2.9659423828125, 3.42041015625, 3.8748779296875, 4.329345703125, 4.7838134765625, 5.23828125, 5.6927490234375, 6.147216796875, 6.6016845703125, 7.05615234375, 7.5106201171875, 7.965087890625, 8.4195556640625, 8.8740234375, 9.3284912109375, 9.782958984375, 10.2374267578125, 10.69189453125, 11.1463623046875, 11.600830078125, 12.0552978515625, 12.509765625, 12.9642333984375, 13.418701171875, 13.8731689453125, 14.32763671875, 14.7821044921875, 15.236572265625, 15.6910400390625, 16.1455078125, 16.5999755859375, 17.054443359375, 17.5089111328125, 17.96337890625, 18.4178466796875, 18.872314453125, 19.3267822265625, 19.78125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 7.0, 12.0, 15.0, 28.0, 39.0, 51.0, 89.0, 108.0, 127.0, 135.0, 109.0, 87.0, 50.0, 32.0, 24.0, 21.0, 8.0, 17.0, 8.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010805130004882812, -0.0010535269975662231, -0.001026540994644165, -0.000999554991722107, -0.0009725689888000488, -0.0009455829858779907, -0.0009185969829559326, -0.0008916109800338745, -0.0008646249771118164, -0.0008376389741897583, -0.0008106529712677002, -0.0007836669683456421, -0.000756680965423584, -0.0007296949625015259, -0.0007027089595794678, -0.0006757229566574097, -0.0006487369537353516, -0.0006217509508132935, -0.0005947649478912354, -0.0005677789449691772, -0.0005407929420471191, -0.000513806939125061, -0.00048682093620300293, -0.0004598349332809448, -0.0004328489303588867, -0.0004058629274368286, -0.0003788769245147705, -0.0003518909215927124, -0.0003249049186706543, -0.0002979189157485962, -0.0002709329128265381, -0.00024394690990447998, -0.00021696090698242188, -0.00018997490406036377, -0.00016298890113830566, -0.00013600289821624756, -0.00010901689529418945, -8.203089237213135e-05, -5.504488945007324e-05, -2.8058886528015137e-05, -1.0728836059570312e-06, 2.5913119316101074e-05, 5.289912223815918e-05, 7.988512516021729e-05, 0.00010687112808227539, 0.0001338571310043335, 0.0001608431339263916, 0.0001878291368484497, 0.0002148151397705078, 0.00024180114269256592, 0.000268787145614624, 0.00029577314853668213, 0.00032275915145874023, 0.00034974515438079834, 0.00037673115730285645, 0.00040371716022491455, 0.00043070316314697266, 0.00045768916606903076, 0.00048467516899108887, 0.000511661171913147, 0.0005386471748352051, 0.0005656331777572632, 0.0005926191806793213, 0.0006196051836013794, 0.0006465911865234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 9.0, 12.0, 21.0, 27.0, 51.0, 73.0, 150.0, 290.0, 540.0, 1477.0, 6543.0, 83697.0, 873158.0, 73718.0, 6060.0, 1516.0, 595.0, 259.0, 129.0, 84.0, 47.0, 37.0, 13.0, 13.0, 8.0, 9.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -6.97247314453125, -6.6988525390625, -6.42523193359375, -6.151611328125, -5.87799072265625, -5.6043701171875, -5.33074951171875, -5.05712890625, -4.78350830078125, -4.5098876953125, -4.23626708984375, -3.962646484375, -3.68902587890625, -3.4154052734375, -3.14178466796875, -2.8681640625, -2.59454345703125, -2.3209228515625, -2.04730224609375, -1.773681640625, -1.50006103515625, -1.2264404296875, -0.95281982421875, -0.67919921875, -0.40557861328125, -0.1319580078125, 0.14166259765625, 0.415283203125, 0.68890380859375, 0.9625244140625, 1.23614501953125, 1.509765625, 1.78338623046875, 2.0570068359375, 2.33062744140625, 2.604248046875, 2.87786865234375, 3.1514892578125, 3.42510986328125, 3.69873046875, 3.97235107421875, 4.2459716796875, 4.51959228515625, 4.793212890625, 5.06683349609375, 5.3404541015625, 5.61407470703125, 5.8876953125, 6.16131591796875, 6.4349365234375, 6.70855712890625, 6.982177734375, 7.25579833984375, 7.5294189453125, 7.80303955078125, 8.07666015625, 8.35028076171875, 8.6239013671875, 8.89752197265625, 9.171142578125, 9.44476318359375, 9.7183837890625, 9.99200439453125, 10.265625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 9.0, 32.0, 54.0, 102.0, 163.0, 193.0, 183.0, 127.0, 67.0, 35.0, 18.0, 11.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.296875, -16.94244384765625, -16.5880126953125, -16.23358154296875, -15.879150390625, -15.52471923828125, -15.1702880859375, -14.81585693359375, -14.46142578125, -14.10699462890625, -13.7525634765625, -13.39813232421875, -13.043701171875, -12.68927001953125, -12.3348388671875, -11.98040771484375, -11.6259765625, -11.27154541015625, -10.9171142578125, -10.56268310546875, -10.208251953125, -9.85382080078125, -9.4993896484375, -9.14495849609375, -8.79052734375, -8.43609619140625, -8.0816650390625, -7.72723388671875, -7.372802734375, -7.01837158203125, -6.6639404296875, -6.30950927734375, -5.955078125, -5.60064697265625, -5.2462158203125, -4.89178466796875, -4.537353515625, -4.18292236328125, -3.8284912109375, -3.47406005859375, -3.11962890625, -2.76519775390625, -2.4107666015625, -2.05633544921875, -1.701904296875, -1.34747314453125, -0.9930419921875, -0.63861083984375, -0.2841796875, 0.07025146484375, 0.4246826171875, 0.77911376953125, 1.133544921875, 1.48797607421875, 1.8424072265625, 2.19683837890625, 2.55126953125, 2.90570068359375, 3.2601318359375, 3.61456298828125, 3.968994140625, 4.32342529296875, 4.6778564453125, 5.03228759765625, 5.38671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 16.0, 58.0, 108.0, 220.0, 259.0, 188.0, 83.0, 32.0, 14.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.9035186767578, -200.09164428710938, -195.27978515625, -190.46791076660156, -185.65603637695312, -180.84417724609375, -176.0323028564453, -171.22042846679688, -166.4085693359375, -161.59669494628906, -156.7848358154297, -151.97296142578125, -147.1610870361328, -142.34922790527344, -137.537353515625, -132.72549438476562, -127.91361236572266, -123.10174560546875, -118.28987121582031, -113.4780044555664, -108.6661376953125, -103.85426330566406, -99.04239654541016, -94.23052978515625, -89.41865539550781, -84.6067886352539, -79.79491424560547, -74.98304748535156, -70.17118072509766, -65.35931396484375, -60.54743957519531, -55.735572814941406, -50.92371368408203, -46.11184310913086, -41.29997634887695, -36.48810577392578, -31.676237106323242, -26.864368438720703, -22.05249786376953, -17.240631103515625, -12.428760528564453, -7.616891384124756, -2.8050222396850586, 2.006847381591797, 6.818716049194336, 11.630584716796875, 16.442455291748047, 21.254322052001953, 26.066192626953125, 30.878061294555664, 35.6899299621582, 40.501800537109375, 45.31366729736328, 50.12553787231445, 54.937408447265625, 59.74927520751953, 64.56114196777344, 69.37300872802734, 74.18488311767578, 78.99674987792969, 83.8086166381836, 88.6204833984375, 93.43235778808594, 98.24422454833984, 103.05609893798828]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 10.0, 10.0, 17.0, 16.0, 14.0, 20.0, 29.0, 25.0, 34.0, 45.0, 45.0, 44.0, 45.0, 40.0, 45.0, 40.0, 54.0, 39.0, 45.0, 32.0, 38.0, 40.0, 30.0, 30.0, 27.0, 22.0, 21.0, 15.0, 18.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-74.59950256347656, -72.32041931152344, -70.04133605957031, -67.76225280761719, -65.48316955566406, -63.20408248901367, -60.92499542236328, -58.645912170410156, -56.36682891845703, -54.087745666503906, -51.80866241455078, -49.52957534790039, -47.250492095947266, -44.97140884399414, -42.69232177734375, -40.413238525390625, -38.1341552734375, -35.855072021484375, -33.57598876953125, -31.29690170288086, -29.017818450927734, -26.73873519897461, -24.45965003967285, -22.180564880371094, -19.90148162841797, -17.622398376464844, -15.343313217163086, -13.064229011535645, -10.785144805908203, -8.506060600280762, -6.22697639465332, -3.947892189025879, -1.6688003540039062, 0.6102838516235352, 2.8893680572509766, 5.168452262878418, 7.447536468505859, 9.7266206741333, 12.005704879760742, 14.284789085388184, 16.563873291015625, 18.84295654296875, 21.122041702270508, 23.401126861572266, 25.68021011352539, 27.959293365478516, 30.238378524780273, 32.51746368408203, 34.796546936035156, 37.07563018798828, 39.354713439941406, 41.6338005065918, 43.91288375854492, 46.19196701049805, 48.47105407714844, 50.75013732910156, 53.02922058105469, 55.30830383300781, 57.58738708496094, 59.86647415161133, 62.14555740356445, 64.42464447021484, 66.70372772216797, 68.9828109741211, 71.26189422607422]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 21.0, 19.0, 39.0, 53.0, 77.0, 93.0, 168.0, 286.0, 428.0, 748.0, 1491.0, 3401.0, 9797.0, 51481.0, 4038489.0, 68637.0, 11448.0, 3781.0, 1648.0, 825.0, 467.0, 297.0, 183.0, 104.0, 75.0, 59.0, 46.0, 26.0, 17.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.880615234375, -8.51904296875, -8.157470703125, -7.7958984375, -7.434326171875, -7.07275390625, -6.711181640625, -6.349609375, -5.988037109375, -5.62646484375, -5.264892578125, -4.9033203125, -4.541748046875, -4.18017578125, -3.818603515625, -3.45703125, -3.095458984375, -2.73388671875, -2.372314453125, -2.0107421875, -1.649169921875, -1.28759765625, -0.926025390625, -0.564453125, -0.202880859375, 0.15869140625, 0.520263671875, 0.8818359375, 1.243408203125, 1.60498046875, 1.966552734375, 2.328125, 2.689697265625, 3.05126953125, 3.412841796875, 3.7744140625, 4.135986328125, 4.49755859375, 4.859130859375, 5.220703125, 5.582275390625, 5.94384765625, 6.305419921875, 6.6669921875, 7.028564453125, 7.39013671875, 7.751708984375, 8.11328125, 8.474853515625, 8.83642578125, 9.197998046875, 9.5595703125, 9.921142578125, 10.28271484375, 10.644287109375, 11.005859375, 11.367431640625, 11.72900390625, 12.090576171875, 12.4521484375, 12.813720703125, 13.17529296875, 13.536865234375, 13.8984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 2.0, 10.0, 10.0, 19.0, 11.0, 23.0, 25.0, 29.0, 45.0, 38.0, 50.0, 51.0, 59.0, 56.0, 69.0, 66.0, 72.0, 58.0, 54.0, 47.0, 33.0, 38.0, 34.0, 20.0, 25.0, 13.0, 10.0, 10.0, 13.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.87213134765625, -4.7286376953125, -4.58514404296875, -4.441650390625, -4.29815673828125, -4.1546630859375, -4.01116943359375, -3.86767578125, -3.72418212890625, -3.5806884765625, -3.43719482421875, -3.293701171875, -3.15020751953125, -3.0067138671875, -2.86322021484375, -2.7197265625, -2.57623291015625, -2.4327392578125, -2.28924560546875, -2.145751953125, -2.00225830078125, -1.8587646484375, -1.71527099609375, -1.57177734375, -1.42828369140625, -1.2847900390625, -1.14129638671875, -0.997802734375, -0.85430908203125, -0.7108154296875, -0.56732177734375, -0.423828125, -0.28033447265625, -0.1368408203125, 0.00665283203125, 0.150146484375, 0.29364013671875, 0.4371337890625, 0.58062744140625, 0.72412109375, 0.86761474609375, 1.0111083984375, 1.15460205078125, 1.298095703125, 1.44158935546875, 1.5850830078125, 1.72857666015625, 1.8720703125, 2.01556396484375, 2.1590576171875, 2.30255126953125, 2.446044921875, 2.58953857421875, 2.7330322265625, 2.87652587890625, 3.02001953125, 3.16351318359375, 3.3070068359375, 3.45050048828125, 3.593994140625, 3.73748779296875, 3.8809814453125, 4.02447509765625, 4.16796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 8.0, 10.0, 10.0, 26.0, 33.0, 48.0, 54.0, 69.0, 80.0, 105.0, 179.0, 274.0, 345.0, 514.0, 825.0, 1612.0, 3156.0, 7721.0, 25178.0, 206177.0, 3876970.0, 48860.0, 12179.0, 4436.0, 2107.0, 1106.0, 662.0, 401.0, 298.0, 220.0, 163.0, 114.0, 90.0, 61.0, 44.0, 31.0, 26.0, 21.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.08203125, -5.88067626953125, -5.6793212890625, -5.47796630859375, -5.276611328125, -5.07525634765625, -4.8739013671875, -4.67254638671875, -4.47119140625, -4.26983642578125, -4.0684814453125, -3.86712646484375, -3.665771484375, -3.46441650390625, -3.2630615234375, -3.06170654296875, -2.8603515625, -2.65899658203125, -2.4576416015625, -2.25628662109375, -2.054931640625, -1.85357666015625, -1.6522216796875, -1.45086669921875, -1.24951171875, -1.04815673828125, -0.8468017578125, -0.64544677734375, -0.444091796875, -0.24273681640625, -0.0413818359375, 0.15997314453125, 0.361328125, 0.56268310546875, 0.7640380859375, 0.96539306640625, 1.166748046875, 1.36810302734375, 1.5694580078125, 1.77081298828125, 1.97216796875, 2.17352294921875, 2.3748779296875, 2.57623291015625, 2.777587890625, 2.97894287109375, 3.1802978515625, 3.38165283203125, 3.5830078125, 3.78436279296875, 3.9857177734375, 4.18707275390625, 4.388427734375, 4.58978271484375, 4.7911376953125, 4.99249267578125, 5.19384765625, 5.39520263671875, 5.5965576171875, 5.79791259765625, 5.999267578125, 6.20062255859375, 6.4019775390625, 6.60333251953125, 6.8046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 7.0, 11.0, 18.0, 20.0, 39.0, 76.0, 207.0, 3344.0, 183.0, 74.0, 30.0, 12.0, 17.0, 8.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.375, -1.318817138671875, -1.26263427734375, -1.206451416015625, -1.1502685546875, -1.094085693359375, -1.03790283203125, -0.981719970703125, -0.925537109375, -0.869354248046875, -0.81317138671875, -0.756988525390625, -0.7008056640625, -0.644622802734375, -0.58843994140625, -0.532257080078125, -0.47607421875, -0.419891357421875, -0.36370849609375, -0.307525634765625, -0.2513427734375, -0.195159912109375, -0.13897705078125, -0.082794189453125, -0.026611328125, 0.029571533203125, 0.08575439453125, 0.141937255859375, 0.1981201171875, 0.254302978515625, 0.31048583984375, 0.366668701171875, 0.4228515625, 0.479034423828125, 0.53521728515625, 0.591400146484375, 0.6475830078125, 0.703765869140625, 0.75994873046875, 0.816131591796875, 0.872314453125, 0.928497314453125, 0.98468017578125, 1.040863037109375, 1.0970458984375, 1.153228759765625, 1.20941162109375, 1.265594482421875, 1.32177734375, 1.377960205078125, 1.43414306640625, 1.490325927734375, 1.5465087890625, 1.602691650390625, 1.65887451171875, 1.715057373046875, 1.771240234375, 1.827423095703125, 1.88360595703125, 1.939788818359375, 1.9959716796875, 2.052154541015625, 2.10833740234375, 2.164520263671875, 2.220703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 20.0, 95.0, 304.0, 340.0, 156.0, 57.0, 14.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.305152893066406, -24.706371307373047, -24.107587814331055, -23.508806228637695, -22.910022735595703, -22.311241149902344, -21.71245765686035, -21.113676071166992, -20.514892578125, -19.91611099243164, -19.31732749938965, -18.71854591369629, -18.119762420654297, -17.520980834960938, -16.922197341918945, -16.323415756225586, -15.724634170532227, -15.12585163116455, -14.527069091796875, -13.9282865524292, -13.329504013061523, -12.730722427368164, -12.131939888000488, -11.533157348632812, -10.934374809265137, -10.335592269897461, -9.736809730529785, -9.13802719116211, -8.53924560546875, -7.940462589263916, -7.341680526733398, -6.742897987365723, -6.144113540649414, -5.545331001281738, -4.9465484619140625, -4.347766399383545, -3.748983860015869, -3.1502013206481934, -2.5514190196990967, -1.95263671875, -1.3538541793823242, -0.755071759223938, -0.15628933906555176, 0.4424930810928345, 1.0412755012512207, 1.6400580406188965, 2.238840341567993, 2.83762264251709, 3.4364051818847656, 4.035187721252441, 4.633970260620117, 5.232752323150635, 5.8315348625183105, 6.430317401885986, 7.029099464416504, 7.62788200378418, 8.226664543151855, 8.825447082519531, 9.424229621887207, 10.023012161254883, 10.621793746948242, 11.220577239990234, 11.819358825683594, 12.41814136505127, 13.016923904418945]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 7.0, 3.0, 5.0, 8.0, 13.0, 7.0, 9.0, 12.0, 15.0, 23.0, 17.0, 35.0, 26.0, 36.0, 38.0, 40.0, 46.0, 46.0, 42.0, 49.0, 40.0, 45.0, 53.0, 43.0, 39.0, 35.0, 38.0, 29.0, 34.0, 34.0, 27.0, 21.0, 16.0, 13.0, 11.0, 13.0, 6.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556063652038574, -3.4452922344207764, -3.3345205783843994, -3.2237491607666016, -3.1129777431488037, -3.002206325531006, -2.891434669494629, -2.780663251876831, -2.669891834259033, -2.5591204166412354, -2.4483487606048584, -2.3375773429870605, -2.2268059253692627, -2.116034507751465, -2.005262851715088, -1.89449143409729, -1.7837198972702026, -1.6729483604431152, -1.5621769428253174, -1.45140540599823, -1.3406339883804321, -1.2298624515533447, -1.1190910339355469, -1.0083194971084595, -0.8975480198860168, -0.7867765426635742, -0.6760050654411316, -0.565233588218689, -0.45446208119392395, -0.34369057416915894, -0.2329190969467163, -0.12214761972427368, -0.011376142501831055, 0.09939534217119217, 0.2101668268442154, 0.3209383189678192, 0.43170979619026184, 0.5424813032150269, 0.6532527804374695, 0.7640242576599121, 0.8747957348823547, 0.9855672121047974, 1.0963387489318848, 1.2071101665496826, 1.31788170337677, 1.4286532402038574, 1.5394246578216553, 1.6501960754394531, 1.7609676122665405, 1.871739149093628, 1.9825105667114258, 2.0932819843292236, 2.2040536403656006, 2.3148250579833984, 2.4255964756011963, 2.536367893218994, 2.647139549255371, 2.757910966873169, 2.868682622909546, 2.9794540405273438, 3.0902254581451416, 3.2009968757629395, 3.3117685317993164, 3.4225399494171143, 3.533311367034912]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 16.0, 18.0, 51.0, 75.0, 118.0, 185.0, 303.0, 565.0, 1051.0, 2071.0, 4325.0, 9722.0, 23530.0, 62011.0, 157102.0, 313352.0, 272348.0, 121631.0, 47069.0, 18082.0, 7528.0, 3514.0, 1748.0, 921.0, 487.0, 259.0, 157.0, 103.0, 56.0, 54.0, 29.0, 16.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -5.00396728515625, -4.8243408203125, -4.64471435546875, -4.465087890625, -4.28546142578125, -4.1058349609375, -3.92620849609375, -3.74658203125, -3.56695556640625, -3.3873291015625, -3.20770263671875, -3.028076171875, -2.84844970703125, -2.6688232421875, -2.48919677734375, -2.3095703125, -2.12994384765625, -1.9503173828125, -1.77069091796875, -1.591064453125, -1.41143798828125, -1.2318115234375, -1.05218505859375, -0.87255859375, -0.69293212890625, -0.5133056640625, -0.33367919921875, -0.154052734375, 0.02557373046875, 0.2052001953125, 0.38482666015625, 0.564453125, 0.74407958984375, 0.9237060546875, 1.10333251953125, 1.282958984375, 1.46258544921875, 1.6422119140625, 1.82183837890625, 2.00146484375, 2.18109130859375, 2.3607177734375, 2.54034423828125, 2.719970703125, 2.89959716796875, 3.0792236328125, 3.25885009765625, 3.4384765625, 3.61810302734375, 3.7977294921875, 3.97735595703125, 4.156982421875, 4.33660888671875, 4.5162353515625, 4.69586181640625, 4.87548828125, 5.05511474609375, 5.2347412109375, 5.41436767578125, 5.593994140625, 5.77362060546875, 5.9532470703125, 6.13287353515625, 6.3125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 2.0, 8.0, 14.0, 11.0, 22.0, 24.0, 33.0, 35.0, 41.0, 39.0, 44.0, 50.0, 67.0, 51.0, 63.0, 68.0, 63.0, 60.0, 63.0, 29.0, 32.0, 33.0, 27.0, 29.0, 16.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.52178955078125, -4.3834228515625, -4.24505615234375, -4.106689453125, -3.96832275390625, -3.8299560546875, -3.69158935546875, -3.55322265625, -3.41485595703125, -3.2764892578125, -3.13812255859375, -2.999755859375, -2.86138916015625, -2.7230224609375, -2.58465576171875, -2.4462890625, -2.30792236328125, -2.1695556640625, -2.03118896484375, -1.892822265625, -1.75445556640625, -1.6160888671875, -1.47772216796875, -1.33935546875, -1.20098876953125, -1.0626220703125, -0.92425537109375, -0.785888671875, -0.64752197265625, -0.5091552734375, -0.37078857421875, -0.232421875, -0.09405517578125, 0.0443115234375, 0.18267822265625, 0.321044921875, 0.45941162109375, 0.5977783203125, 0.73614501953125, 0.87451171875, 1.01287841796875, 1.1512451171875, 1.28961181640625, 1.427978515625, 1.56634521484375, 1.7047119140625, 1.84307861328125, 1.9814453125, 2.11981201171875, 2.2581787109375, 2.39654541015625, 2.534912109375, 2.67327880859375, 2.8116455078125, 2.95001220703125, 3.08837890625, 3.22674560546875, 3.3651123046875, 3.50347900390625, 3.641845703125, 3.78021240234375, 3.9185791015625, 4.05694580078125, 4.1953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 7.0, 10.0, 14.0, 22.0, 38.0, 37.0, 46.0, 74.0, 95.0, 146.0, 200.0, 232.0, 317.0, 507.0, 864.0, 1430.0, 3451.0, 10261.0, 40759.0, 216758.0, 577547.0, 151351.0, 30031.0, 7906.0, 2767.0, 1310.0, 709.0, 472.0, 308.0, 251.0, 181.0, 134.0, 86.0, 51.0, 47.0, 33.0, 26.0, 16.0, 12.0, 11.0, 11.0, 5.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.140625, -7.88134765625, -7.6220703125, -7.36279296875, -7.103515625, -6.84423828125, -6.5849609375, -6.32568359375, -6.06640625, -5.80712890625, -5.5478515625, -5.28857421875, -5.029296875, -4.77001953125, -4.5107421875, -4.25146484375, -3.9921875, -3.73291015625, -3.4736328125, -3.21435546875, -2.955078125, -2.69580078125, -2.4365234375, -2.17724609375, -1.91796875, -1.65869140625, -1.3994140625, -1.14013671875, -0.880859375, -0.62158203125, -0.3623046875, -0.10302734375, 0.15625, 0.41552734375, 0.6748046875, 0.93408203125, 1.193359375, 1.45263671875, 1.7119140625, 1.97119140625, 2.23046875, 2.48974609375, 2.7490234375, 3.00830078125, 3.267578125, 3.52685546875, 3.7861328125, 4.04541015625, 4.3046875, 4.56396484375, 4.8232421875, 5.08251953125, 5.341796875, 5.60107421875, 5.8603515625, 6.11962890625, 6.37890625, 6.63818359375, 6.8974609375, 7.15673828125, 7.416015625, 7.67529296875, 7.9345703125, 8.19384765625, 8.453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 11.0, 8.0, 6.0, 9.0, 14.0, 16.0, 16.0, 27.0, 19.0, 25.0, 26.0, 33.0, 33.0, 41.0, 36.0, 36.0, 53.0, 42.0, 54.0, 47.0, 39.0, 41.0, 47.0, 50.0, 30.0, 28.0, 19.0, 24.0, 24.0, 19.0, 18.0, 21.0, 20.0, 15.0, 5.0, 9.0, 9.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.78125, -14.3316650390625, -13.882080078125, -13.4324951171875, -12.98291015625, -12.5333251953125, -12.083740234375, -11.6341552734375, -11.1845703125, -10.7349853515625, -10.285400390625, -9.8358154296875, -9.38623046875, -8.9366455078125, -8.487060546875, -8.0374755859375, -7.587890625, -7.1383056640625, -6.688720703125, -6.2391357421875, -5.78955078125, -5.3399658203125, -4.890380859375, -4.4407958984375, -3.9912109375, -3.5416259765625, -3.092041015625, -2.6424560546875, -2.19287109375, -1.7432861328125, -1.293701171875, -0.8441162109375, -0.39453125, 0.0550537109375, 0.504638671875, 0.9542236328125, 1.40380859375, 1.8533935546875, 2.302978515625, 2.7525634765625, 3.2021484375, 3.6517333984375, 4.101318359375, 4.5509033203125, 5.00048828125, 5.4500732421875, 5.899658203125, 6.3492431640625, 6.798828125, 7.2484130859375, 7.697998046875, 8.1475830078125, 8.59716796875, 9.0467529296875, 9.496337890625, 9.9459228515625, 10.3955078125, 10.8450927734375, 11.294677734375, 11.7442626953125, 12.19384765625, 12.6434326171875, 13.093017578125, 13.5426025390625, 13.9921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 18.0, 21.0, 53.0, 74.0, 134.0, 319.0, 612.0, 1728.0, 9623.0, 303314.0, 713103.0, 15759.0, 2347.0, 716.0, 320.0, 160.0, 77.0, 37.0, 29.0, 25.0, 17.0, 8.0, 6.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3671875, -12.0426025390625, -11.718017578125, -11.3934326171875, -11.06884765625, -10.7442626953125, -10.419677734375, -10.0950927734375, -9.7705078125, -9.4459228515625, -9.121337890625, -8.7967529296875, -8.47216796875, -8.1475830078125, -7.822998046875, -7.4984130859375, -7.173828125, -6.8492431640625, -6.524658203125, -6.2000732421875, -5.87548828125, -5.5509033203125, -5.226318359375, -4.9017333984375, -4.5771484375, -4.2525634765625, -3.927978515625, -3.6033935546875, -3.27880859375, -2.9542236328125, -2.629638671875, -2.3050537109375, -1.98046875, -1.6558837890625, -1.331298828125, -1.0067138671875, -0.68212890625, -0.3575439453125, -0.032958984375, 0.2916259765625, 0.6162109375, 0.9407958984375, 1.265380859375, 1.5899658203125, 1.91455078125, 2.2391357421875, 2.563720703125, 2.8883056640625, 3.212890625, 3.5374755859375, 3.862060546875, 4.1866455078125, 4.51123046875, 4.8358154296875, 5.160400390625, 5.4849853515625, 5.8095703125, 6.1341552734375, 6.458740234375, 6.7833251953125, 7.10791015625, 7.4324951171875, 7.757080078125, 8.0816650390625, 8.40625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 18.0, 14.0, 27.0, 34.0, 37.0, 39.0, 65.0, 91.0, 119.0, 110.0, 108.0, 76.0, 54.0, 43.0, 29.0, 21.0, 21.0, 7.0, 6.0, 10.0, 7.0, 10.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006155967712402344, -0.0005943924188613892, -0.0005731880664825439, -0.0005519837141036987, -0.0005307793617248535, -0.0005095750093460083, -0.0004883706569671631, -0.00046716630458831787, -0.00044596195220947266, -0.00042475759983062744, -0.0004035532474517822, -0.000382348895072937, -0.0003611445426940918, -0.0003399401903152466, -0.00031873583793640137, -0.00029753148555755615, -0.00027632713317871094, -0.0002551227807998657, -0.0002339184284210205, -0.0002127140760421753, -0.00019150972366333008, -0.00017030537128448486, -0.00014910101890563965, -0.00012789666652679443, -0.00010669231414794922, -8.5487961769104e-05, -6.428360939025879e-05, -4.3079257011413574e-05, -2.187490463256836e-05, -6.705522537231445e-07, 2.053380012512207e-05, 4.1738152503967285e-05, 6.29425048828125e-05, 8.414685726165771e-05, 0.00010535120964050293, 0.00012655556201934814, 0.00014775991439819336, 0.00016896426677703857, 0.0001901686191558838, 0.000211372971534729, 0.00023257732391357422, 0.00025378167629241943, 0.00027498602867126465, 0.00029619038105010986, 0.0003173947334289551, 0.0003385990858078003, 0.0003598034381866455, 0.0003810077905654907, 0.00040221214294433594, 0.00042341649532318115, 0.00044462084770202637, 0.0004658252000808716, 0.0004870295524597168, 0.000508233904838562, 0.0005294382572174072, 0.0005506426095962524, 0.0005718469619750977, 0.0005930513143539429, 0.0006142556667327881, 0.0006354600191116333, 0.0006566643714904785, 0.0006778687238693237, 0.0006990730762481689, 0.0007202774286270142, 0.0007414817810058594]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 12.0, 32.0, 32.0, 76.0, 104.0, 189.0, 317.0, 723.0, 1610.0, 5339.0, 27110.0, 414917.0, 556090.0, 32485.0, 6055.0, 1895.0, 752.0, 330.0, 154.0, 95.0, 62.0, 45.0, 32.0, 24.0, 12.0, 5.0, 8.0, 5.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.5078125, -6.28375244140625, -6.0596923828125, -5.83563232421875, -5.611572265625, -5.38751220703125, -5.1634521484375, -4.93939208984375, -4.71533203125, -4.49127197265625, -4.2672119140625, -4.04315185546875, -3.819091796875, -3.59503173828125, -3.3709716796875, -3.14691162109375, -2.9228515625, -2.69879150390625, -2.4747314453125, -2.25067138671875, -2.026611328125, -1.80255126953125, -1.5784912109375, -1.35443115234375, -1.13037109375, -0.90631103515625, -0.6822509765625, -0.45819091796875, -0.234130859375, -0.01007080078125, 0.2139892578125, 0.43804931640625, 0.662109375, 0.88616943359375, 1.1102294921875, 1.33428955078125, 1.558349609375, 1.78240966796875, 2.0064697265625, 2.23052978515625, 2.45458984375, 2.67864990234375, 2.9027099609375, 3.12677001953125, 3.350830078125, 3.57489013671875, 3.7989501953125, 4.02301025390625, 4.2470703125, 4.47113037109375, 4.6951904296875, 4.91925048828125, 5.143310546875, 5.36737060546875, 5.5914306640625, 5.81549072265625, 6.03955078125, 6.26361083984375, 6.4876708984375, 6.71173095703125, 6.935791015625, 7.15985107421875, 7.3839111328125, 7.60797119140625, 7.83203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 17.0, 25.0, 32.0, 53.0, 81.0, 101.0, 150.0, 137.0, 111.0, 86.0, 71.0, 37.0, 27.0, 12.0, 8.0, 11.0, 7.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.621826171875, -9.37646484375, -9.131103515625, -8.8857421875, -8.640380859375, -8.39501953125, -8.149658203125, -7.904296875, -7.658935546875, -7.41357421875, -7.168212890625, -6.9228515625, -6.677490234375, -6.43212890625, -6.186767578125, -5.94140625, -5.696044921875, -5.45068359375, -5.205322265625, -4.9599609375, -4.714599609375, -4.46923828125, -4.223876953125, -3.978515625, -3.733154296875, -3.48779296875, -3.242431640625, -2.9970703125, -2.751708984375, -2.50634765625, -2.260986328125, -2.015625, -1.770263671875, -1.52490234375, -1.279541015625, -1.0341796875, -0.788818359375, -0.54345703125, -0.298095703125, -0.052734375, 0.192626953125, 0.43798828125, 0.683349609375, 0.9287109375, 1.174072265625, 1.41943359375, 1.664794921875, 1.91015625, 2.155517578125, 2.40087890625, 2.646240234375, 2.8916015625, 3.136962890625, 3.38232421875, 3.627685546875, 3.873046875, 4.118408203125, 4.36376953125, 4.609130859375, 4.8544921875, 5.099853515625, 5.34521484375, 5.590576171875, 5.8359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 12.0, 24.0, 111.0, 354.0, 356.0, 116.0, 23.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.74440002441406, -240.87088012695312, -233.9973602294922, -227.12384033203125, -220.25030517578125, -213.3767852783203, -206.50326538085938, -199.62974548339844, -192.7562255859375, -185.88270568847656, -179.00918579101562, -172.13565063476562, -165.2621307373047, -158.38861083984375, -151.5150909423828, -144.64157104492188, -137.76803588867188, -130.89451599121094, -124.02098846435547, -117.14746856689453, -110.27394104003906, -103.40042114257812, -96.52690124511719, -89.65338134765625, -82.77985382080078, -75.90633392333984, -69.03280639648438, -62.15928649902344, -55.285762786865234, -48.41223907470703, -41.538719177246094, -34.66519546508789, -27.79168701171875, -20.918163299560547, -14.044641494750977, -7.171119689941406, -0.2975959777832031, 6.575927734375, 13.449447631835938, 20.32297134399414, 27.196495056152344, 34.07001876831055, 40.94354248046875, 47.81706237792969, 54.69058609008789, 61.564109802246094, 68.43762969970703, 75.3111572265625, 82.18467712402344, 89.05819702148438, 95.93172454833984, 102.80524444580078, 109.67877197265625, 116.55229187011719, 123.42581176757812, 130.29933166503906, 137.1728515625, 144.04637145996094, 150.91989135742188, 157.79342651367188, 164.6669464111328, 171.54046630859375, 178.4139862060547, 185.28750610351562, 192.16104125976562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 20.0, 19.0, 14.0, 14.0, 21.0, 24.0, 25.0, 28.0, 35.0, 37.0, 42.0, 41.0, 49.0, 62.0, 58.0, 46.0, 52.0, 58.0, 49.0, 45.0, 44.0, 36.0, 34.0, 26.0, 24.0, 12.0, 16.0, 12.0, 14.0, 8.0, 6.0, 8.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.04206848144531, -72.6947250366211, -70.34737396240234, -68.00003051757812, -65.65267944335938, -63.30533218383789, -60.957984924316406, -58.61064147949219, -56.26329040527344, -53.91594314575195, -51.56859588623047, -49.221248626708984, -46.8739013671875, -44.526554107666016, -42.17920684814453, -39.83186340332031, -37.48451614379883, -35.137168884277344, -32.78982162475586, -30.442474365234375, -28.09512710571289, -25.747779846191406, -23.400434494018555, -21.05308723449707, -18.705739974975586, -16.3583927154541, -14.011045455932617, -11.66369915008545, -9.316351890563965, -6.9690046310424805, -4.6216583251953125, -2.274311065673828, 0.07303619384765625, 2.4203832149505615, 4.767730236053467, 7.115077018737793, 9.462424278259277, 11.809771537780762, 14.15711784362793, 16.504465103149414, 18.8518123626709, 21.199159622192383, 23.546506881713867, 25.89385223388672, 28.241199493408203, 30.588546752929688, 32.93589401245117, 35.283241271972656, 37.63058853149414, 39.977935791015625, 42.32528305053711, 44.672630310058594, 47.01997756958008, 49.36732482910156, 51.71466827392578, 54.06201934814453, 56.40936279296875, 58.756710052490234, 61.10405731201172, 63.4514045715332, 65.79875183105469, 68.1460952758789, 70.49344635009766, 72.84078979492188, 75.18814086914062]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 12.0, 6.0, 12.0, 9.0, 15.0, 15.0, 38.0, 45.0, 55.0, 93.0, 144.0, 206.0, 303.0, 551.0, 983.0, 1817.0, 3995.0, 9575.0, 32837.0, 402330.0, 3673607.0, 46299.0, 11938.0, 4528.0, 2051.0, 1146.0, 625.0, 366.0, 215.0, 128.0, 96.0, 56.0, 48.0, 30.0, 17.0, 19.0, 9.0, 12.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9608154296875, -7.687255859375, -7.4136962890625, -7.14013671875, -6.8665771484375, -6.593017578125, -6.3194580078125, -6.0458984375, -5.7723388671875, -5.498779296875, -5.2252197265625, -4.95166015625, -4.6781005859375, -4.404541015625, -4.1309814453125, -3.857421875, -3.5838623046875, -3.310302734375, -3.0367431640625, -2.76318359375, -2.4896240234375, -2.216064453125, -1.9425048828125, -1.6689453125, -1.3953857421875, -1.121826171875, -0.8482666015625, -0.57470703125, -0.3011474609375, -0.027587890625, 0.2459716796875, 0.51953125, 0.7930908203125, 1.066650390625, 1.3402099609375, 1.61376953125, 1.8873291015625, 2.160888671875, 2.4344482421875, 2.7080078125, 2.9815673828125, 3.255126953125, 3.5286865234375, 3.80224609375, 4.0758056640625, 4.349365234375, 4.6229248046875, 4.896484375, 5.1700439453125, 5.443603515625, 5.7171630859375, 5.99072265625, 6.2642822265625, 6.537841796875, 6.8114013671875, 7.0849609375, 7.3585205078125, 7.632080078125, 7.9056396484375, 8.17919921875, 8.4527587890625, 8.726318359375, 8.9998779296875, 9.2734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 7.0, 6.0, 9.0, 10.0, 17.0, 20.0, 21.0, 19.0, 34.0, 30.0, 42.0, 55.0, 49.0, 42.0, 47.0, 67.0, 60.0, 56.0, 45.0, 53.0, 49.0, 43.0, 32.0, 32.0, 25.0, 15.0, 18.0, 22.0, 14.0, 10.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.26171875, -4.137115478515625, -4.01251220703125, -3.887908935546875, -3.7633056640625, -3.638702392578125, -3.51409912109375, -3.389495849609375, -3.264892578125, -3.140289306640625, -3.01568603515625, -2.891082763671875, -2.7664794921875, -2.641876220703125, -2.51727294921875, -2.392669677734375, -2.26806640625, -2.143463134765625, -2.01885986328125, -1.894256591796875, -1.7696533203125, -1.645050048828125, -1.52044677734375, -1.395843505859375, -1.271240234375, -1.146636962890625, -1.02203369140625, -0.897430419921875, -0.7728271484375, -0.648223876953125, -0.52362060546875, -0.399017333984375, -0.2744140625, -0.149810791015625, -0.02520751953125, 0.099395751953125, 0.2239990234375, 0.348602294921875, 0.47320556640625, 0.597808837890625, 0.722412109375, 0.847015380859375, 0.97161865234375, 1.096221923828125, 1.2208251953125, 1.345428466796875, 1.47003173828125, 1.594635009765625, 1.71923828125, 1.843841552734375, 1.96844482421875, 2.093048095703125, 2.2176513671875, 2.342254638671875, 2.46685791015625, 2.591461181640625, 2.716064453125, 2.840667724609375, 2.96527099609375, 3.089874267578125, 3.2144775390625, 3.339080810546875, 3.46368408203125, 3.588287353515625, 3.712890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 12.0, 8.0, 12.0, 22.0, 30.0, 24.0, 35.0, 45.0, 51.0, 59.0, 71.0, 75.0, 66.0, 73.0, 85.0, 93.0, 153.0, 877.0, 21994.0, 4160036.0, 9029.0, 565.0, 118.0, 78.0, 56.0, 73.0, 65.0, 64.0, 58.0, 47.0, 54.0, 46.0, 37.0, 32.0, 31.0, 22.0, 13.0, 14.0, 7.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-37.78125, -36.77099609375, -35.7607421875, -34.75048828125, -33.740234375, -32.72998046875, -31.7197265625, -30.70947265625, -29.69921875, -28.68896484375, -27.6787109375, -26.66845703125, -25.658203125, -24.64794921875, -23.6376953125, -22.62744140625, -21.6171875, -20.60693359375, -19.5966796875, -18.58642578125, -17.576171875, -16.56591796875, -15.5556640625, -14.54541015625, -13.53515625, -12.52490234375, -11.5146484375, -10.50439453125, -9.494140625, -8.48388671875, -7.4736328125, -6.46337890625, -5.453125, -4.44287109375, -3.4326171875, -2.42236328125, -1.412109375, -0.40185546875, 0.6083984375, 1.61865234375, 2.62890625, 3.63916015625, 4.6494140625, 5.65966796875, 6.669921875, 7.68017578125, 8.6904296875, 9.70068359375, 10.7109375, 11.72119140625, 12.7314453125, 13.74169921875, 14.751953125, 15.76220703125, 16.7724609375, 17.78271484375, 18.79296875, 19.80322265625, 20.8134765625, 21.82373046875, 22.833984375, 23.84423828125, 24.8544921875, 25.86474609375, 26.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 13.0, 40.0, 3528.0, 467.0, 32.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -33.7091064453125, -33.105712890625, -32.5023193359375, -31.89892578125, -31.2955322265625, -30.692138671875, -30.0887451171875, -29.4853515625, -28.8819580078125, -28.278564453125, -27.6751708984375, -27.07177734375, -26.4683837890625, -25.864990234375, -25.2615966796875, -24.658203125, -24.0548095703125, -23.451416015625, -22.8480224609375, -22.24462890625, -21.6412353515625, -21.037841796875, -20.4344482421875, -19.8310546875, -19.2276611328125, -18.624267578125, -18.0208740234375, -17.41748046875, -16.8140869140625, -16.210693359375, -15.6072998046875, -15.00390625, -14.4005126953125, -13.797119140625, -13.1937255859375, -12.59033203125, -11.9869384765625, -11.383544921875, -10.7801513671875, -10.1767578125, -9.5733642578125, -8.969970703125, -8.3665771484375, -7.76318359375, -7.1597900390625, -6.556396484375, -5.9530029296875, -5.349609375, -4.7462158203125, -4.142822265625, -3.5394287109375, -2.93603515625, -2.3326416015625, -1.729248046875, -1.1258544921875, -0.5224609375, 0.0809326171875, 0.684326171875, 1.2877197265625, 1.89111328125, 2.4945068359375, 3.097900390625, 3.7012939453125, 4.3046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 14.0, 74.0, 257.0, 461.0, 144.0, 36.0, 11.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.0317611694336, -98.79784393310547, -96.56392669677734, -94.33000946044922, -92.0960922241211, -89.86217498779297, -87.62825775146484, -85.39434051513672, -83.1604232788086, -80.92650604248047, -78.69258880615234, -76.45867156982422, -74.2247543334961, -71.99083709716797, -69.75691986083984, -67.52300262451172, -65.2890853881836, -63.05516815185547, -60.821250915527344, -58.58733367919922, -56.353416442871094, -54.11949920654297, -51.885581970214844, -49.65166473388672, -47.417747497558594, -45.18383026123047, -42.949913024902344, -40.71599578857422, -38.482078552246094, -36.24816131591797, -34.014244079589844, -31.78032684326172, -29.546401977539062, -27.312484741210938, -25.078567504882812, -22.844650268554688, -20.610733032226562, -18.376815795898438, -16.142898559570312, -13.908981323242188, -11.675064086914062, -9.441146850585938, -7.2072296142578125, -4.9733123779296875, -2.7393951416015625, -0.5054779052734375, 1.7284393310546875, 3.9623565673828125, 6.1962738037109375, 8.430191040039062, 10.664108276367188, 12.898025512695312, 15.131942749023438, 17.365859985351562, 19.599777221679688, 21.833694458007812, 24.067611694335938, 26.301528930664062, 28.535446166992188, 30.769363403320312, 33.00328063964844, 35.23719787597656, 37.47111511230469, 39.70503234863281, 41.93894958496094]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 8.0, 17.0, 11.0, 18.0, 23.0, 39.0, 60.0, 76.0, 98.0, 130.0, 119.0, 111.0, 73.0, 72.0, 46.0, 29.0, 21.0, 12.0, 14.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.319488525390625, -44.61859130859375, -42.917694091796875, -41.216796875, -39.515899658203125, -37.81500244140625, -36.114105224609375, -34.4132080078125, -32.712310791015625, -31.01141357421875, -29.310516357421875, -27.609619140625, -25.908721923828125, -24.20782470703125, -22.506929397583008, -20.806032180786133, -19.10513687133789, -17.404239654541016, -15.70334243774414, -14.002446174621582, -12.301548957824707, -10.600651741027832, -8.899755477905273, -7.198858261108398, -5.497961044311523, -3.7970640659332275, -2.0961670875549316, -0.39527034759521484, 1.3056268692016602, 3.006524085998535, 4.707420349121094, 6.408317565917969, 8.109214782714844, 9.810111999511719, 11.511009216308594, 13.211905479431152, 14.912802696228027, 16.61370086669922, 18.31459617614746, 20.015493392944336, 21.71639060974121, 23.417287826538086, 25.11818504333496, 26.819080352783203, 28.519977569580078, 30.220874786376953, 31.921772003173828, 33.6226692199707, 35.32356643676758, 37.02446365356445, 38.72536087036133, 40.4262580871582, 42.12715530395508, 43.82805252075195, 45.52894592285156, 47.22984313964844, 48.93074035644531, 50.63163757324219, 52.33253479003906, 54.03343200683594, 55.73432922363281, 57.43522644042969, 59.13612365722656, 60.83702087402344, 62.53791809082031]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 15.0, 13.0, 18.0, 23.0, 42.0, 49.0, 77.0, 125.0, 180.0, 303.0, 499.0, 819.0, 1602.0, 3050.0, 7055.0, 18360.0, 57426.0, 209445.0, 448010.0, 210926.0, 58036.0, 18580.0, 6973.0, 3087.0, 1593.0, 843.0, 483.0, 287.0, 189.0, 128.0, 74.0, 73.0, 52.0, 35.0, 21.0, 12.0, 10.0, 7.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.50390625, -7.24957275390625, -6.9952392578125, -6.74090576171875, -6.486572265625, -6.23223876953125, -5.9779052734375, -5.72357177734375, -5.46923828125, -5.21490478515625, -4.9605712890625, -4.70623779296875, -4.451904296875, -4.19757080078125, -3.9432373046875, -3.68890380859375, -3.4345703125, -3.18023681640625, -2.9259033203125, -2.67156982421875, -2.417236328125, -2.16290283203125, -1.9085693359375, -1.65423583984375, -1.39990234375, -1.14556884765625, -0.8912353515625, -0.63690185546875, -0.382568359375, -0.12823486328125, 0.1260986328125, 0.38043212890625, 0.634765625, 0.88909912109375, 1.1434326171875, 1.39776611328125, 1.652099609375, 1.90643310546875, 2.1607666015625, 2.41510009765625, 2.66943359375, 2.92376708984375, 3.1781005859375, 3.43243408203125, 3.686767578125, 3.94110107421875, 4.1954345703125, 4.44976806640625, 4.7041015625, 4.95843505859375, 5.2127685546875, 5.46710205078125, 5.721435546875, 5.97576904296875, 6.2301025390625, 6.48443603515625, 6.73876953125, 6.99310302734375, 7.2474365234375, 7.50177001953125, 7.756103515625, 8.01043701171875, 8.2647705078125, 8.51910400390625, 8.7734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 7.0, 14.0, 14.0, 15.0, 20.0, 38.0, 38.0, 47.0, 59.0, 74.0, 82.0, 78.0, 93.0, 93.0, 59.0, 55.0, 41.0, 43.0, 33.0, 27.0, 15.0, 19.0, 3.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.67578125, -7.45562744140625, -7.2354736328125, -7.01531982421875, -6.795166015625, -6.57501220703125, -6.3548583984375, -6.13470458984375, -5.91455078125, -5.69439697265625, -5.4742431640625, -5.25408935546875, -5.033935546875, -4.81378173828125, -4.5936279296875, -4.37347412109375, -4.1533203125, -3.93316650390625, -3.7130126953125, -3.49285888671875, -3.272705078125, -3.05255126953125, -2.8323974609375, -2.61224365234375, -2.39208984375, -2.17193603515625, -1.9517822265625, -1.73162841796875, -1.511474609375, -1.29132080078125, -1.0711669921875, -0.85101318359375, -0.630859375, -0.41070556640625, -0.1905517578125, 0.02960205078125, 0.249755859375, 0.46990966796875, 0.6900634765625, 0.91021728515625, 1.13037109375, 1.35052490234375, 1.5706787109375, 1.79083251953125, 2.010986328125, 2.23114013671875, 2.4512939453125, 2.67144775390625, 2.8916015625, 3.11175537109375, 3.3319091796875, 3.55206298828125, 3.772216796875, 3.99237060546875, 4.2125244140625, 4.43267822265625, 4.65283203125, 4.87298583984375, 5.0931396484375, 5.31329345703125, 5.533447265625, 5.75360107421875, 5.9737548828125, 6.19390869140625, 6.4140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 10.0, 11.0, 22.0, 34.0, 101.0, 181.0, 490.0, 1504.0, 9091.0, 929437.0, 102979.0, 3292.0, 869.0, 304.0, 103.0, 54.0, 28.0, 13.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.59375, -39.31591796875, -38.0380859375, -36.76025390625, -35.482421875, -34.20458984375, -32.9267578125, -31.64892578125, -30.37109375, -29.09326171875, -27.8154296875, -26.53759765625, -25.259765625, -23.98193359375, -22.7041015625, -21.42626953125, -20.1484375, -18.87060546875, -17.5927734375, -16.31494140625, -15.037109375, -13.75927734375, -12.4814453125, -11.20361328125, -9.92578125, -8.64794921875, -7.3701171875, -6.09228515625, -4.814453125, -3.53662109375, -2.2587890625, -0.98095703125, 0.296875, 1.57470703125, 2.8525390625, 4.13037109375, 5.408203125, 6.68603515625, 7.9638671875, 9.24169921875, 10.51953125, 11.79736328125, 13.0751953125, 14.35302734375, 15.630859375, 16.90869140625, 18.1865234375, 19.46435546875, 20.7421875, 22.02001953125, 23.2978515625, 24.57568359375, 25.853515625, 27.13134765625, 28.4091796875, 29.68701171875, 30.96484375, 32.24267578125, 33.5205078125, 34.79833984375, 36.076171875, 37.35400390625, 38.6318359375, 39.90966796875, 41.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 8.0, 23.0, 45.0, 79.0, 127.0, 159.0, 169.0, 149.0, 115.0, 74.0, 26.0, 18.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.4013671875, -63.302734375, -61.2041015625, -59.10546875, -57.0068359375, -54.908203125, -52.8095703125, -50.7109375, -48.6123046875, -46.513671875, -44.4150390625, -42.31640625, -40.2177734375, -38.119140625, -36.0205078125, -33.921875, -31.8232421875, -29.724609375, -27.6259765625, -25.52734375, -23.4287109375, -21.330078125, -19.2314453125, -17.1328125, -15.0341796875, -12.935546875, -10.8369140625, -8.73828125, -6.6396484375, -4.541015625, -2.4423828125, -0.34375, 1.7548828125, 3.853515625, 5.9521484375, 8.05078125, 10.1494140625, 12.248046875, 14.3466796875, 16.4453125, 18.5439453125, 20.642578125, 22.7412109375, 24.83984375, 26.9384765625, 29.037109375, 31.1357421875, 33.234375, 35.3330078125, 37.431640625, 39.5302734375, 41.62890625, 43.7275390625, 45.826171875, 47.9248046875, 50.0234375, 52.1220703125, 54.220703125, 56.3193359375, 58.41796875, 60.5166015625, 62.615234375, 64.7138671875, 66.8125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 10.0, 11.0, 23.0, 20.0, 45.0, 63.0, 98.0, 201.0, 402.0, 784.0, 2193.0, 8460.0, 77056.0, 829644.0, 114784.0, 10420.0, 2427.0, 961.0, 411.0, 209.0, 106.0, 71.0, 41.0, 35.0, 22.0, 19.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1953125, -6.0107421875, -5.826171875, -5.6416015625, -5.45703125, -5.2724609375, -5.087890625, -4.9033203125, -4.71875, -4.5341796875, -4.349609375, -4.1650390625, -3.98046875, -3.7958984375, -3.611328125, -3.4267578125, -3.2421875, -3.0576171875, -2.873046875, -2.6884765625, -2.50390625, -2.3193359375, -2.134765625, -1.9501953125, -1.765625, -1.5810546875, -1.396484375, -1.2119140625, -1.02734375, -0.8427734375, -0.658203125, -0.4736328125, -0.2890625, -0.1044921875, 0.080078125, 0.2646484375, 0.44921875, 0.6337890625, 0.818359375, 1.0029296875, 1.1875, 1.3720703125, 1.556640625, 1.7412109375, 1.92578125, 2.1103515625, 2.294921875, 2.4794921875, 2.6640625, 2.8486328125, 3.033203125, 3.2177734375, 3.40234375, 3.5869140625, 3.771484375, 3.9560546875, 4.140625, 4.3251953125, 4.509765625, 4.6943359375, 4.87890625, 5.0634765625, 5.248046875, 5.4326171875, 5.6171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 9.0, 13.0, 11.0, 23.0, 25.0, 35.0, 40.0, 47.0, 82.0, 103.0, 131.0, 108.0, 83.0, 60.0, 46.0, 34.0, 22.0, 24.0, 14.0, 11.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007433891296386719, -0.000720590353012085, -0.000697791576385498, -0.0006749927997589111, -0.0006521940231323242, -0.0006293952465057373, -0.0006065964698791504, -0.0005837976932525635, -0.0005609989166259766, -0.0005382001399993896, -0.0005154013633728027, -0.0004926025867462158, -0.0004698038101196289, -0.000447005033493042, -0.0004242062568664551, -0.00040140748023986816, -0.00037860870361328125, -0.00035580992698669434, -0.0003330111503601074, -0.0003102123737335205, -0.0002874135971069336, -0.0002646148204803467, -0.00024181604385375977, -0.00021901726722717285, -0.00019621849060058594, -0.00017341971397399902, -0.0001506209373474121, -0.0001278221607208252, -0.00010502338409423828, -8.222460746765137e-05, -5.942583084106445e-05, -3.662705421447754e-05, -1.3828277587890625e-05, 8.970499038696289e-06, 3.17692756652832e-05, 5.456805229187012e-05, 7.736682891845703e-05, 0.00010016560554504395, 0.00012296438217163086, 0.00014576315879821777, 0.0001685619354248047, 0.0001913607120513916, 0.00021415948867797852, 0.00023695826530456543, 0.00025975704193115234, 0.00028255581855773926, 0.00030535459518432617, 0.0003281533718109131, 0.0003509521484375, 0.0003737509250640869, 0.00039654970169067383, 0.00041934847831726074, 0.00044214725494384766, 0.00046494603157043457, 0.0004877448081970215, 0.0005105435848236084, 0.0005333423614501953, 0.0005561411380767822, 0.0005789399147033691, 0.0006017386913299561, 0.000624537467956543, 0.0006473362445831299, 0.0006701350212097168, 0.0006929337978363037, 0.0007157325744628906]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 5.0, 7.0, 10.0, 13.0, 27.0, 28.0, 43.0, 53.0, 76.0, 116.0, 211.0, 384.0, 716.0, 1551.0, 3778.0, 13208.0, 93204.0, 727052.0, 179175.0, 20221.0, 4876.0, 1810.0, 851.0, 457.0, 249.0, 141.0, 91.0, 57.0, 29.0, 28.0, 26.0, 10.0, 10.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.84765625, -4.69439697265625, -4.5411376953125, -4.38787841796875, -4.234619140625, -4.08135986328125, -3.9281005859375, -3.77484130859375, -3.62158203125, -3.46832275390625, -3.3150634765625, -3.16180419921875, -3.008544921875, -2.85528564453125, -2.7020263671875, -2.54876708984375, -2.3955078125, -2.24224853515625, -2.0889892578125, -1.93572998046875, -1.782470703125, -1.62921142578125, -1.4759521484375, -1.32269287109375, -1.16943359375, -1.01617431640625, -0.8629150390625, -0.70965576171875, -0.556396484375, -0.40313720703125, -0.2498779296875, -0.09661865234375, 0.056640625, 0.20989990234375, 0.3631591796875, 0.51641845703125, 0.669677734375, 0.82293701171875, 0.9761962890625, 1.12945556640625, 1.28271484375, 1.43597412109375, 1.5892333984375, 1.74249267578125, 1.895751953125, 2.04901123046875, 2.2022705078125, 2.35552978515625, 2.5087890625, 2.66204833984375, 2.8153076171875, 2.96856689453125, 3.121826171875, 3.27508544921875, 3.4283447265625, 3.58160400390625, 3.73486328125, 3.88812255859375, 4.0413818359375, 4.19464111328125, 4.347900390625, 4.50115966796875, 4.6544189453125, 4.80767822265625, 4.9609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 18.0, 41.0, 48.0, 86.0, 103.0, 133.0, 126.0, 111.0, 102.0, 74.0, 47.0, 30.0, 23.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.88372802734375, -8.6580810546875, -8.43243408203125, -8.206787109375, -7.98114013671875, -7.7554931640625, -7.52984619140625, -7.30419921875, -7.07855224609375, -6.8529052734375, -6.62725830078125, -6.401611328125, -6.17596435546875, -5.9503173828125, -5.72467041015625, -5.4990234375, -5.27337646484375, -5.0477294921875, -4.82208251953125, -4.596435546875, -4.37078857421875, -4.1451416015625, -3.91949462890625, -3.69384765625, -3.46820068359375, -3.2425537109375, -3.01690673828125, -2.791259765625, -2.56561279296875, -2.3399658203125, -2.11431884765625, -1.888671875, -1.66302490234375, -1.4373779296875, -1.21173095703125, -0.986083984375, -0.76043701171875, -0.5347900390625, -0.30914306640625, -0.08349609375, 0.14215087890625, 0.3677978515625, 0.59344482421875, 0.819091796875, 1.04473876953125, 1.2703857421875, 1.49603271484375, 1.7216796875, 1.94732666015625, 2.1729736328125, 2.39862060546875, 2.624267578125, 2.84991455078125, 3.0755615234375, 3.30120849609375, 3.52685546875, 3.75250244140625, 3.9781494140625, 4.20379638671875, 4.429443359375, 4.65509033203125, 4.8807373046875, 5.10638427734375, 5.33203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 18.0, 58.0, 254.0, 438.0, 165.0, 42.0, 14.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.3667907714844, -251.2064208984375, -242.04605102539062, -232.88568115234375, -223.7252960205078, -214.56492614746094, -205.40455627441406, -196.24417114257812, -187.08380126953125, -177.92343139648438, -168.7630615234375, -159.60269165039062, -150.4423065185547, -141.2819366455078, -132.12156677246094, -122.96118927001953, -113.80082702636719, -104.64045715332031, -95.4800796508789, -86.31970977783203, -77.15933227539062, -67.99896240234375, -58.838592529296875, -49.67821502685547, -40.517845153808594, -31.357471466064453, -22.197099685668945, -13.036727905273438, -3.876354217529297, 5.284019470214844, 14.444389343261719, 23.604766845703125, 32.76513671875, 41.92551040649414, 51.08588409423828, 60.246253967285156, 69.40663146972656, 78.56700134277344, 87.72737121582031, 96.88774871826172, 106.0481185913086, 115.20848846435547, 124.36886596679688, 133.52923583984375, 142.68960571289062, 151.8499755859375, 161.01034545898438, 170.1707305908203, 179.3311004638672, 188.49147033691406, 197.65184020996094, 206.81222534179688, 215.97259521484375, 225.13296508789062, 234.2933349609375, 243.45370483398438, 252.61407470703125, 261.7744445800781, 270.934814453125, 280.0951843261719, 289.25555419921875, 298.41595458984375, 307.5762939453125, 316.7366943359375, 325.8970642089844]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 20.0, 30.0, 35.0, 28.0, 36.0, 52.0, 38.0, 60.0, 61.0, 65.0, 61.0, 62.0, 62.0, 48.0, 49.0, 49.0, 32.0, 31.0, 25.0, 17.0, 15.0, 17.0, 11.0, 7.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-152.39544677734375, -147.9127197265625, -143.4299774169922, -138.94725036621094, -134.46450805664062, -129.98178100585938, -125.4990463256836, -121.01631164550781, -116.53358459472656, -112.05084991455078, -107.568115234375, -103.08538818359375, -98.60265350341797, -94.11991882324219, -89.6371841430664, -85.15444946289062, -80.67171478271484, -76.18898010253906, -71.70624542236328, -67.2235107421875, -62.74078369140625, -58.25804901123047, -53.77531433105469, -49.292579650878906, -44.80984878540039, -40.32711410522461, -35.844383239746094, -31.361648559570312, -26.878915786743164, -22.396183013916016, -17.913448333740234, -13.430715560913086, -8.947982788085938, -4.465249538421631, 0.01748371124267578, 4.500217437744141, 8.982950210571289, 13.465682983398438, 17.94841766357422, 22.431150436401367, 26.913883209228516, 31.396615982055664, 35.87934875488281, 40.362083435058594, 44.844818115234375, 49.32754898071289, 53.81028366088867, 58.29301452636719, 62.77574920654297, 67.25848388671875, 71.74121856689453, 76.22395324707031, 80.70668029785156, 85.18941497802734, 89.67214965820312, 94.1548843383789, 98.63761901855469, 103.12035369873047, 107.60308837890625, 112.0858154296875, 116.56855010986328, 121.05128479003906, 125.53401947021484, 130.01675415039062, 134.49948120117188]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 13.0, 21.0, 24.0, 51.0, 90.0, 134.0, 293.0, 685.0, 1731.0, 5304.0, 20725.0, 213643.0, 3836827.0, 93643.0, 14574.0, 3921.0, 1391.0, 594.0, 268.0, 140.0, 79.0, 48.0, 25.0, 18.0, 8.0, 10.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6328125, -11.2735595703125, -10.914306640625, -10.5550537109375, -10.19580078125, -9.8365478515625, -9.477294921875, -9.1180419921875, -8.7587890625, -8.3995361328125, -8.040283203125, -7.6810302734375, -7.32177734375, -6.9625244140625, -6.603271484375, -6.2440185546875, -5.884765625, -5.5255126953125, -5.166259765625, -4.8070068359375, -4.44775390625, -4.0885009765625, -3.729248046875, -3.3699951171875, -3.0107421875, -2.6514892578125, -2.292236328125, -1.9329833984375, -1.57373046875, -1.2144775390625, -0.855224609375, -0.4959716796875, -0.13671875, 0.2225341796875, 0.581787109375, 0.9410400390625, 1.30029296875, 1.6595458984375, 2.018798828125, 2.3780517578125, 2.7373046875, 3.0965576171875, 3.455810546875, 3.8150634765625, 4.17431640625, 4.5335693359375, 4.892822265625, 5.2520751953125, 5.611328125, 5.9705810546875, 6.329833984375, 6.6890869140625, 7.04833984375, 7.4075927734375, 7.766845703125, 8.1260986328125, 8.4853515625, 8.8446044921875, 9.203857421875, 9.5631103515625, 9.92236328125, 10.2816162109375, 10.640869140625, 11.0001220703125, 11.359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 14.0, 15.0, 42.0, 34.0, 55.0, 67.0, 77.0, 96.0, 94.0, 110.0, 93.0, 81.0, 64.0, 39.0, 33.0, 17.0, 20.0, 13.0, 6.0, 5.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.830322265625, -7.60595703125, -7.381591796875, -7.1572265625, -6.932861328125, -6.70849609375, -6.484130859375, -6.259765625, -6.035400390625, -5.81103515625, -5.586669921875, -5.3623046875, -5.137939453125, -4.91357421875, -4.689208984375, -4.46484375, -4.240478515625, -4.01611328125, -3.791748046875, -3.5673828125, -3.343017578125, -3.11865234375, -2.894287109375, -2.669921875, -2.445556640625, -2.22119140625, -1.996826171875, -1.7724609375, -1.548095703125, -1.32373046875, -1.099365234375, -0.875, -0.650634765625, -0.42626953125, -0.201904296875, 0.0224609375, 0.246826171875, 0.47119140625, 0.695556640625, 0.919921875, 1.144287109375, 1.36865234375, 1.593017578125, 1.8173828125, 2.041748046875, 2.26611328125, 2.490478515625, 2.71484375, 2.939208984375, 3.16357421875, 3.387939453125, 3.6123046875, 3.836669921875, 4.06103515625, 4.285400390625, 4.509765625, 4.734130859375, 4.95849609375, 5.182861328125, 5.4072265625, 5.631591796875, 5.85595703125, 6.080322265625, 6.3046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 11.0, 16.0, 22.0, 34.0, 47.0, 111.0, 226.0, 604.0, 2145.0, 13689.0, 308026.0, 3833708.0, 31101.0, 3326.0, 711.0, 239.0, 102.0, 51.0, 33.0, 15.0, 21.0, 14.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.189208984375, -17.56591796875, -16.942626953125, -16.3193359375, -15.696044921875, -15.07275390625, -14.449462890625, -13.826171875, -13.202880859375, -12.57958984375, -11.956298828125, -11.3330078125, -10.709716796875, -10.08642578125, -9.463134765625, -8.83984375, -8.216552734375, -7.59326171875, -6.969970703125, -6.3466796875, -5.723388671875, -5.10009765625, -4.476806640625, -3.853515625, -3.230224609375, -2.60693359375, -1.983642578125, -1.3603515625, -0.737060546875, -0.11376953125, 0.509521484375, 1.1328125, 1.756103515625, 2.37939453125, 3.002685546875, 3.6259765625, 4.249267578125, 4.87255859375, 5.495849609375, 6.119140625, 6.742431640625, 7.36572265625, 7.989013671875, 8.6123046875, 9.235595703125, 9.85888671875, 10.482177734375, 11.10546875, 11.728759765625, 12.35205078125, 12.975341796875, 13.5986328125, 14.221923828125, 14.84521484375, 15.468505859375, 16.091796875, 16.715087890625, 17.33837890625, 17.961669921875, 18.5849609375, 19.208251953125, 19.83154296875, 20.454833984375, 21.078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 11.0, 16.0, 21.0, 28.0, 33.0, 76.0, 175.0, 813.0, 2301.0, 378.0, 110.0, 43.0, 29.0, 16.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.74951171875, -22.1552734375, -21.56103515625, -20.966796875, -20.37255859375, -19.7783203125, -19.18408203125, -18.58984375, -17.99560546875, -17.4013671875, -16.80712890625, -16.212890625, -15.61865234375, -15.0244140625, -14.43017578125, -13.8359375, -13.24169921875, -12.6474609375, -12.05322265625, -11.458984375, -10.86474609375, -10.2705078125, -9.67626953125, -9.08203125, -8.48779296875, -7.8935546875, -7.29931640625, -6.705078125, -6.11083984375, -5.5166015625, -4.92236328125, -4.328125, -3.73388671875, -3.1396484375, -2.54541015625, -1.951171875, -1.35693359375, -0.7626953125, -0.16845703125, 0.42578125, 1.02001953125, 1.6142578125, 2.20849609375, 2.802734375, 3.39697265625, 3.9912109375, 4.58544921875, 5.1796875, 5.77392578125, 6.3681640625, 6.96240234375, 7.556640625, 8.15087890625, 8.7451171875, 9.33935546875, 9.93359375, 10.52783203125, 11.1220703125, 11.71630859375, 12.310546875, 12.90478515625, 13.4990234375, 14.09326171875, 14.6875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 23.0, 46.0, 83.0, 139.0, 176.0, 188.0, 146.0, 77.0, 52.0, 25.0, 11.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.96214294433594, -72.40230560302734, -69.84246063232422, -67.28262329101562, -64.7227783203125, -62.162940979003906, -59.60309982299805, -57.04325866699219, -54.48341751098633, -51.92357635498047, -49.36373519897461, -46.80389404296875, -44.244056701660156, -41.68421173095703, -39.12437438964844, -36.56453323364258, -34.00469207763672, -31.44485092163086, -28.885009765625, -26.325170516967773, -23.765329360961914, -21.205488204956055, -18.645648956298828, -16.08580780029297, -13.52596664428711, -10.96612548828125, -8.406285285949707, -5.846444606781006, -3.2866039276123047, -0.7267627716064453, 1.8330774307250977, 4.392917633056641, 6.9527587890625, 9.51259994506836, 12.072440147399902, 14.632280349731445, 17.192121505737305, 19.751962661743164, 22.31180191040039, 24.87164306640625, 27.43148422241211, 29.99132537841797, 32.55116653442383, 35.11100769042969, 37.67084503173828, 40.230690002441406, 42.79052734375, 45.35036849975586, 47.91020965576172, 50.47005081176758, 53.02989196777344, 55.5897331237793, 58.149574279785156, 60.70941162109375, 63.26925277709961, 65.82909393310547, 68.38893127441406, 70.94876861572266, 73.50861358642578, 76.06845092773438, 78.6282958984375, 81.1881332397461, 83.74797821044922, 86.30781555175781, 88.86766052246094]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 9.0, 12.0, 16.0, 38.0, 31.0, 33.0, 47.0, 52.0, 65.0, 66.0, 59.0, 74.0, 82.0, 64.0, 70.0, 50.0, 51.0, 38.0, 36.0, 20.0, 15.0, 18.0, 15.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46385192871094, -45.46003341674805, -43.45621109008789, -41.452392578125, -39.448570251464844, -37.44475173950195, -35.44093322753906, -33.437110900878906, -31.433292388916016, -29.429471969604492, -27.42565155029297, -25.421833038330078, -23.418012619018555, -21.41419219970703, -19.41037368774414, -17.406553268432617, -15.402732849121094, -13.39891242980957, -11.395092964172363, -9.391273498535156, -7.387453079223633, -5.383632659912109, -3.3798131942749023, -1.3759937286376953, 0.6278266906738281, 2.6316466331481934, 4.635466575622559, 6.639286518096924, 8.643106460571289, 10.646926879882812, 12.65074634552002, 14.654565811157227, 16.65838623046875, 18.662206649780273, 20.666027069091797, 22.669845581054688, 24.67366600036621, 26.677486419677734, 28.681304931640625, 30.68512535095215, 32.68894577026367, 34.69276428222656, 36.69658660888672, 38.70040512084961, 40.7042236328125, 42.708045959472656, 44.71186447143555, 46.71568298339844, 48.719505310058594, 50.723323822021484, 52.72714614868164, 54.73096466064453, 56.73478698730469, 58.73860549926758, 60.74242401123047, 62.746246337890625, 64.75006103515625, 66.7538833618164, 68.75769805908203, 70.76152038574219, 72.76534271240234, 74.7691650390625, 76.77297973632812, 78.77680206298828, 80.78062438964844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 7.0, 7.0, 14.0, 23.0, 32.0, 39.0, 54.0, 100.0, 136.0, 214.0, 321.0, 541.0, 1008.0, 1741.0, 3303.0, 6737.0, 14351.0, 32271.0, 76168.0, 189862.0, 366958.0, 206547.0, 82315.0, 35035.0, 15613.0, 7149.0, 3555.0, 1823.0, 979.0, 567.0, 376.0, 245.0, 143.0, 97.0, 76.0, 41.0, 31.0, 21.0, 14.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.38616943359375, -5.2098388671875, -5.03350830078125, -4.857177734375, -4.68084716796875, -4.5045166015625, -4.32818603515625, -4.15185546875, -3.97552490234375, -3.7991943359375, -3.62286376953125, -3.446533203125, -3.27020263671875, -3.0938720703125, -2.91754150390625, -2.7412109375, -2.56488037109375, -2.3885498046875, -2.21221923828125, -2.035888671875, -1.85955810546875, -1.6832275390625, -1.50689697265625, -1.33056640625, -1.15423583984375, -0.9779052734375, -0.80157470703125, -0.625244140625, -0.44891357421875, -0.2725830078125, -0.09625244140625, 0.080078125, 0.25640869140625, 0.4327392578125, 0.60906982421875, 0.785400390625, 0.96173095703125, 1.1380615234375, 1.31439208984375, 1.49072265625, 1.66705322265625, 1.8433837890625, 2.01971435546875, 2.196044921875, 2.37237548828125, 2.5487060546875, 2.72503662109375, 2.9013671875, 3.07769775390625, 3.2540283203125, 3.43035888671875, 3.606689453125, 3.78302001953125, 3.9593505859375, 4.13568115234375, 4.31201171875, 4.48834228515625, 4.6646728515625, 4.84100341796875, 5.017333984375, 5.19366455078125, 5.3699951171875, 5.54632568359375, 5.72265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 14.0, 14.0, 24.0, 22.0, 37.0, 27.0, 33.0, 47.0, 47.0, 64.0, 61.0, 67.0, 72.0, 86.0, 60.0, 46.0, 54.0, 40.0, 33.0, 33.0, 20.0, 16.0, 18.0, 11.0, 9.0, 8.0, 11.0, 7.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.92523193359375, -3.7762451171875, -3.62725830078125, -3.478271484375, -3.32928466796875, -3.1802978515625, -3.03131103515625, -2.88232421875, -2.73333740234375, -2.5843505859375, -2.43536376953125, -2.286376953125, -2.13739013671875, -1.9884033203125, -1.83941650390625, -1.6904296875, -1.54144287109375, -1.3924560546875, -1.24346923828125, -1.094482421875, -0.94549560546875, -0.7965087890625, -0.64752197265625, -0.49853515625, -0.34954833984375, -0.2005615234375, -0.05157470703125, 0.097412109375, 0.24639892578125, 0.3953857421875, 0.54437255859375, 0.693359375, 0.84234619140625, 0.9913330078125, 1.14031982421875, 1.289306640625, 1.43829345703125, 1.5872802734375, 1.73626708984375, 1.88525390625, 2.03424072265625, 2.1832275390625, 2.33221435546875, 2.481201171875, 2.63018798828125, 2.7791748046875, 2.92816162109375, 3.0771484375, 3.22613525390625, 3.3751220703125, 3.52410888671875, 3.673095703125, 3.82208251953125, 3.9710693359375, 4.12005615234375, 4.26904296875, 4.41802978515625, 4.5670166015625, 4.71600341796875, 4.864990234375, 5.01397705078125, 5.1629638671875, 5.31195068359375, 5.4609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 16.0, 18.0, 32.0, 47.0, 87.0, 85.0, 172.0, 234.0, 346.0, 601.0, 1167.0, 2661.0, 8867.0, 66841.0, 749833.0, 191780.0, 18016.0, 3974.0, 1642.0, 819.0, 459.0, 268.0, 169.0, 107.0, 71.0, 51.0, 43.0, 22.0, 30.0, 19.0, 4.0, 13.0, 3.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.596923828125, -13.13916015625, -12.681396484375, -12.2236328125, -11.765869140625, -11.30810546875, -10.850341796875, -10.392578125, -9.934814453125, -9.47705078125, -9.019287109375, -8.5615234375, -8.103759765625, -7.64599609375, -7.188232421875, -6.73046875, -6.272705078125, -5.81494140625, -5.357177734375, -4.8994140625, -4.441650390625, -3.98388671875, -3.526123046875, -3.068359375, -2.610595703125, -2.15283203125, -1.695068359375, -1.2373046875, -0.779541015625, -0.32177734375, 0.135986328125, 0.59375, 1.051513671875, 1.50927734375, 1.967041015625, 2.4248046875, 2.882568359375, 3.34033203125, 3.798095703125, 4.255859375, 4.713623046875, 5.17138671875, 5.629150390625, 6.0869140625, 6.544677734375, 7.00244140625, 7.460205078125, 7.91796875, 8.375732421875, 8.83349609375, 9.291259765625, 9.7490234375, 10.206787109375, 10.66455078125, 11.122314453125, 11.580078125, 12.037841796875, 12.49560546875, 12.953369140625, 13.4111328125, 13.868896484375, 14.32666015625, 14.784423828125, 15.2421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 11.0, 10.0, 14.0, 21.0, 20.0, 31.0, 34.0, 52.0, 43.0, 61.0, 63.0, 79.0, 69.0, 83.0, 41.0, 52.0, 47.0, 53.0, 50.0, 34.0, 32.0, 24.0, 22.0, 12.0, 9.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.75, -20.064453125, -19.37890625, -18.693359375, -18.0078125, -17.322265625, -16.63671875, -15.951171875, -15.265625, -14.580078125, -13.89453125, -13.208984375, -12.5234375, -11.837890625, -11.15234375, -10.466796875, -9.78125, -9.095703125, -8.41015625, -7.724609375, -7.0390625, -6.353515625, -5.66796875, -4.982421875, -4.296875, -3.611328125, -2.92578125, -2.240234375, -1.5546875, -0.869140625, -0.18359375, 0.501953125, 1.1875, 1.873046875, 2.55859375, 3.244140625, 3.9296875, 4.615234375, 5.30078125, 5.986328125, 6.671875, 7.357421875, 8.04296875, 8.728515625, 9.4140625, 10.099609375, 10.78515625, 11.470703125, 12.15625, 12.841796875, 13.52734375, 14.212890625, 14.8984375, 15.583984375, 16.26953125, 16.955078125, 17.640625, 18.326171875, 19.01171875, 19.697265625, 20.3828125, 21.068359375, 21.75390625, 22.439453125, 23.125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 16.0, 20.0, 34.0, 60.0, 87.0, 166.0, 402.0, 1022.0, 4293.0, 35798.0, 886615.0, 108928.0, 8354.0, 1687.0, 556.0, 222.0, 92.0, 75.0, 48.0, 21.0, 19.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.314453125, -6.05859375, -5.802734375, -5.546875, -5.291015625, -5.03515625, -4.779296875, -4.5234375, -4.267578125, -4.01171875, -3.755859375, -3.5, -3.244140625, -2.98828125, -2.732421875, -2.4765625, -2.220703125, -1.96484375, -1.708984375, -1.453125, -1.197265625, -0.94140625, -0.685546875, -0.4296875, -0.173828125, 0.08203125, 0.337890625, 0.59375, 0.849609375, 1.10546875, 1.361328125, 1.6171875, 1.873046875, 2.12890625, 2.384765625, 2.640625, 2.896484375, 3.15234375, 3.408203125, 3.6640625, 3.919921875, 4.17578125, 4.431640625, 4.6875, 4.943359375, 5.19921875, 5.455078125, 5.7109375, 5.966796875, 6.22265625, 6.478515625, 6.734375, 6.990234375, 7.24609375, 7.501953125, 7.7578125, 8.013671875, 8.26953125, 8.525390625, 8.78125, 9.037109375, 9.29296875, 9.548828125, 9.8046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 4.0, 5.0, 6.0, 14.0, 11.0, 20.0, 29.0, 36.0, 60.0, 135.0, 217.0, 163.0, 124.0, 45.0, 35.0, 23.0, 15.0, 14.0, 12.0, 8.0, 6.0, 1.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012950897216796875, -0.001256793737411499, -0.0012184977531433105, -0.001180201768875122, -0.0011419057846069336, -0.0011036098003387451, -0.0010653138160705566, -0.0010270178318023682, -0.0009887218475341797, -0.0009504258632659912, -0.0009121298789978027, -0.0008738338947296143, -0.0008355379104614258, -0.0007972419261932373, -0.0007589459419250488, -0.0007206499576568604, -0.0006823539733886719, -0.0006440579891204834, -0.0006057620048522949, -0.0005674660205841064, -0.000529170036315918, -0.0004908740520477295, -0.000452578067779541, -0.00041428208351135254, -0.00037598609924316406, -0.0003376901149749756, -0.0002993941307067871, -0.00026109814643859863, -0.00022280216217041016, -0.00018450617790222168, -0.0001462101936340332, -0.00010791420936584473, -6.961822509765625e-05, -3.1322240829467773e-05, 6.973743438720703e-06, 4.526972770690918e-05, 8.356571197509766e-05, 0.00012186169624328613, 0.0001601576805114746, 0.00019845366477966309, 0.00023674964904785156, 0.00027504563331604004, 0.0003133416175842285, 0.000351637601852417, 0.00038993358612060547, 0.00042822957038879395, 0.0004665255546569824, 0.0005048215389251709, 0.0005431175231933594, 0.0005814135074615479, 0.0006197094917297363, 0.0006580054759979248, 0.0006963014602661133, 0.0007345974445343018, 0.0007728934288024902, 0.0008111894130706787, 0.0008494853973388672, 0.0008877813816070557, 0.0009260773658752441, 0.0009643733501434326, 0.001002669334411621, 0.0010409653186798096, 0.001079261302947998, 0.0011175572872161865, 0.001155853271484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 9.0, 2.0, 3.0, 11.0, 13.0, 20.0, 17.0, 32.0, 64.0, 81.0, 125.0, 157.0, 295.0, 513.0, 1023.0, 2297.0, 5680.0, 19700.0, 124904.0, 766511.0, 100288.0, 17222.0, 5289.0, 2074.0, 938.0, 482.0, 277.0, 161.0, 100.0, 75.0, 56.0, 25.0, 30.0, 29.0, 18.0, 14.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.51702880859375, -4.3582763671875, -4.19952392578125, -4.040771484375, -3.88201904296875, -3.7232666015625, -3.56451416015625, -3.40576171875, -3.24700927734375, -3.0882568359375, -2.92950439453125, -2.770751953125, -2.61199951171875, -2.4532470703125, -2.29449462890625, -2.1357421875, -1.97698974609375, -1.8182373046875, -1.65948486328125, -1.500732421875, -1.34197998046875, -1.1832275390625, -1.02447509765625, -0.86572265625, -0.70697021484375, -0.5482177734375, -0.38946533203125, -0.230712890625, -0.07196044921875, 0.0867919921875, 0.24554443359375, 0.404296875, 0.56304931640625, 0.7218017578125, 0.88055419921875, 1.039306640625, 1.19805908203125, 1.3568115234375, 1.51556396484375, 1.67431640625, 1.83306884765625, 1.9918212890625, 2.15057373046875, 2.309326171875, 2.46807861328125, 2.6268310546875, 2.78558349609375, 2.9443359375, 3.10308837890625, 3.2618408203125, 3.42059326171875, 3.579345703125, 3.73809814453125, 3.8968505859375, 4.05560302734375, 4.21435546875, 4.37310791015625, 4.5318603515625, 4.69061279296875, 4.849365234375, 5.00811767578125, 5.1668701171875, 5.32562255859375, 5.484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 6.0, 9.0, 13.0, 16.0, 24.0, 28.0, 28.0, 45.0, 60.0, 68.0, 83.0, 113.0, 106.0, 73.0, 74.0, 59.0, 33.0, 25.0, 23.0, 14.0, 14.0, 12.0, 13.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.17578125, -4.03521728515625, -3.8946533203125, -3.75408935546875, -3.613525390625, -3.47296142578125, -3.3323974609375, -3.19183349609375, -3.05126953125, -2.91070556640625, -2.7701416015625, -2.62957763671875, -2.489013671875, -2.34844970703125, -2.2078857421875, -2.06732177734375, -1.9267578125, -1.78619384765625, -1.6456298828125, -1.50506591796875, -1.364501953125, -1.22393798828125, -1.0833740234375, -0.94281005859375, -0.80224609375, -0.66168212890625, -0.5211181640625, -0.38055419921875, -0.239990234375, -0.09942626953125, 0.0411376953125, 0.18170166015625, 0.322265625, 0.46282958984375, 0.6033935546875, 0.74395751953125, 0.884521484375, 1.02508544921875, 1.1656494140625, 1.30621337890625, 1.44677734375, 1.58734130859375, 1.7279052734375, 1.86846923828125, 2.009033203125, 2.14959716796875, 2.2901611328125, 2.43072509765625, 2.5712890625, 2.71185302734375, 2.8524169921875, 2.99298095703125, 3.133544921875, 3.27410888671875, 3.4146728515625, 3.55523681640625, 3.69580078125, 3.83636474609375, 3.9769287109375, 4.11749267578125, 4.258056640625, 4.39862060546875, 4.5391845703125, 4.67974853515625, 4.8203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 20.0, 35.0, 80.0, 169.0, 255.0, 200.0, 133.0, 52.0, 15.0, 9.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.1579818725586, -96.41535949707031, -92.6727294921875, -88.93009948730469, -85.1874771118164, -81.44485473632812, -77.70222473144531, -73.9595947265625, -70.21697235107422, -66.47434997558594, -62.731719970703125, -58.98909378051758, -55.24646759033203, -51.503841400146484, -47.76121520996094, -44.01858901977539, -40.275962829589844, -36.5333366394043, -32.79071044921875, -29.048084259033203, -25.305458068847656, -21.56283187866211, -17.820205688476562, -14.077579498291016, -10.334953308105469, -6.592327117919922, -2.849700927734375, 0.8929252624511719, 4.635551452636719, 8.378177642822266, 12.120803833007812, 15.86343002319336, 19.606063842773438, 23.348690032958984, 27.09131622314453, 30.833942413330078, 34.576568603515625, 38.31919479370117, 42.06182098388672, 45.804447174072266, 49.54707336425781, 53.28969955444336, 57.032325744628906, 60.77495193481445, 64.517578125, 68.26020812988281, 72.0028305053711, 75.74545288085938, 79.48808288574219, 83.230712890625, 86.97333526611328, 90.71595764160156, 94.45858764648438, 98.20121765136719, 101.94384002685547, 105.68646240234375, 109.42909240722656, 113.17172241210938, 116.91434478759766, 120.65696716308594, 124.39959716796875, 128.14222717285156, 131.88485717773438, 135.62747192382812, 139.37010192871094]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 10.0, 14.0, 11.0, 11.0, 25.0, 23.0, 27.0, 26.0, 53.0, 47.0, 54.0, 86.0, 71.0, 68.0, 69.0, 65.0, 48.0, 51.0, 33.0, 40.0, 33.0, 19.0, 26.0, 13.0, 9.0, 11.0, 12.0, 8.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-107.50023651123047, -104.55801391601562, -101.61579132080078, -98.67356872558594, -95.7313461303711, -92.78912353515625, -89.84689331054688, -86.90467834472656, -83.96244812011719, -81.02022552490234, -78.0780029296875, -75.13578033447266, -72.19355773925781, -69.25133514404297, -66.30911254882812, -63.366886138916016, -60.42466735839844, -57.482444763183594, -54.54022216796875, -51.597999572753906, -48.65577697753906, -45.71355438232422, -42.77132797241211, -39.829105377197266, -36.88688278198242, -33.94466018676758, -31.002437591552734, -28.060213088989258, -25.117990493774414, -22.17576789855957, -19.233543395996094, -16.29132080078125, -13.349098205566406, -10.406875610351562, -7.464652061462402, -4.522428512573242, -1.5802059173583984, 1.3620166778564453, 4.304241180419922, 7.246463775634766, 10.18868637084961, 13.130908966064453, 16.073131561279297, 19.015356063842773, 21.957578659057617, 24.89980125427246, 27.842025756835938, 30.78424835205078, 33.726470947265625, 36.66869354248047, 39.61091613769531, 42.553138732910156, 45.495361328125, 48.437583923339844, 51.37981033325195, 54.3220329284668, 57.26425552368164, 60.206478118896484, 63.14870071411133, 66.09092712402344, 69.03314971923828, 71.97537231445312, 74.91759490966797, 77.85981750488281, 80.80204010009766]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 14.0, 19.0, 24.0, 43.0, 62.0, 89.0, 126.0, 219.0, 519.0, 1741.0, 14787.0, 3951857.0, 217147.0, 5881.0, 918.0, 330.0, 166.0, 111.0, 67.0, 36.0, 28.0, 20.0, 17.0, 8.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.283935546875, -18.53662109375, -17.789306640625, -17.0419921875, -16.294677734375, -15.54736328125, -14.800048828125, -14.052734375, -13.305419921875, -12.55810546875, -11.810791015625, -11.0634765625, -10.316162109375, -9.56884765625, -8.821533203125, -8.07421875, -7.326904296875, -6.57958984375, -5.832275390625, -5.0849609375, -4.337646484375, -3.59033203125, -2.843017578125, -2.095703125, -1.348388671875, -0.60107421875, 0.146240234375, 0.8935546875, 1.640869140625, 2.38818359375, 3.135498046875, 3.8828125, 4.630126953125, 5.37744140625, 6.124755859375, 6.8720703125, 7.619384765625, 8.36669921875, 9.114013671875, 9.861328125, 10.608642578125, 11.35595703125, 12.103271484375, 12.8505859375, 13.597900390625, 14.34521484375, 15.092529296875, 15.83984375, 16.587158203125, 17.33447265625, 18.081787109375, 18.8291015625, 19.576416015625, 20.32373046875, 21.071044921875, 21.818359375, 22.565673828125, 23.31298828125, 24.060302734375, 24.8076171875, 25.554931640625, 26.30224609375, 27.049560546875, 27.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 6.0, 15.0, 30.0, 43.0, 66.0, 94.0, 131.0, 162.0, 152.0, 113.0, 74.0, 47.0, 28.0, 15.0, 11.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.2421875, -14.892333984375, -14.54248046875, -14.192626953125, -13.8427734375, -13.492919921875, -13.14306640625, -12.793212890625, -12.443359375, -12.093505859375, -11.74365234375, -11.393798828125, -11.0439453125, -10.694091796875, -10.34423828125, -9.994384765625, -9.64453125, -9.294677734375, -8.94482421875, -8.594970703125, -8.2451171875, -7.895263671875, -7.54541015625, -7.195556640625, -6.845703125, -6.495849609375, -6.14599609375, -5.796142578125, -5.4462890625, -5.096435546875, -4.74658203125, -4.396728515625, -4.046875, -3.697021484375, -3.34716796875, -2.997314453125, -2.6474609375, -2.297607421875, -1.94775390625, -1.597900390625, -1.248046875, -0.898193359375, -0.54833984375, -0.198486328125, 0.1513671875, 0.501220703125, 0.85107421875, 1.200927734375, 1.55078125, 1.900634765625, 2.25048828125, 2.600341796875, 2.9501953125, 3.300048828125, 3.64990234375, 3.999755859375, 4.349609375, 4.699462890625, 5.04931640625, 5.399169921875, 5.7490234375, 6.098876953125, 6.44873046875, 6.798583984375, 7.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 14.0, 11.0, 21.0, 24.0, 58.0, 64.0, 109.0, 156.0, 251.0, 461.0, 883.0, 1888.0, 4337.0, 11718.0, 39069.0, 256930.0, 3543980.0, 275769.0, 39888.0, 10939.0, 3925.0, 1667.0, 793.0, 415.0, 309.0, 171.0, 123.0, 86.0, 62.0, 39.0, 34.0, 34.0, 9.0, 14.0, 8.0, 8.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12890625, -6.87884521484375, -6.6287841796875, -6.37872314453125, -6.128662109375, -5.87860107421875, -5.6285400390625, -5.37847900390625, -5.12841796875, -4.87835693359375, -4.6282958984375, -4.37823486328125, -4.128173828125, -3.87811279296875, -3.6280517578125, -3.37799072265625, -3.1279296875, -2.87786865234375, -2.6278076171875, -2.37774658203125, -2.127685546875, -1.87762451171875, -1.6275634765625, -1.37750244140625, -1.12744140625, -0.87738037109375, -0.6273193359375, -0.37725830078125, -0.127197265625, 0.12286376953125, 0.3729248046875, 0.62298583984375, 0.873046875, 1.12310791015625, 1.3731689453125, 1.62322998046875, 1.873291015625, 2.12335205078125, 2.3734130859375, 2.62347412109375, 2.87353515625, 3.12359619140625, 3.3736572265625, 3.62371826171875, 3.873779296875, 4.12384033203125, 4.3739013671875, 4.62396240234375, 4.8740234375, 5.12408447265625, 5.3741455078125, 5.62420654296875, 5.874267578125, 6.12432861328125, 6.3743896484375, 6.62445068359375, 6.87451171875, 7.12457275390625, 7.3746337890625, 7.62469482421875, 7.874755859375, 8.12481689453125, 8.3748779296875, 8.62493896484375, 8.875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 18.0, 16.0, 34.0, 52.0, 113.0, 355.0, 1442.0, 1415.0, 366.0, 113.0, 76.0, 21.0, 15.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.495849609375, -10.03857421875, -9.581298828125, -9.1240234375, -8.666748046875, -8.20947265625, -7.752197265625, -7.294921875, -6.837646484375, -6.38037109375, -5.923095703125, -5.4658203125, -5.008544921875, -4.55126953125, -4.093994140625, -3.63671875, -3.179443359375, -2.72216796875, -2.264892578125, -1.8076171875, -1.350341796875, -0.89306640625, -0.435791015625, 0.021484375, 0.478759765625, 0.93603515625, 1.393310546875, 1.8505859375, 2.307861328125, 2.76513671875, 3.222412109375, 3.6796875, 4.136962890625, 4.59423828125, 5.051513671875, 5.5087890625, 5.966064453125, 6.42333984375, 6.880615234375, 7.337890625, 7.795166015625, 8.25244140625, 8.709716796875, 9.1669921875, 9.624267578125, 10.08154296875, 10.538818359375, 10.99609375, 11.453369140625, 11.91064453125, 12.367919921875, 12.8251953125, 13.282470703125, 13.73974609375, 14.197021484375, 14.654296875, 15.111572265625, 15.56884765625, 16.026123046875, 16.4833984375, 16.940673828125, 17.39794921875, 17.855224609375, 18.3125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 28.0, 68.0, 184.0, 234.0, 223.0, 124.0, 62.0, 32.0, 11.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-122.49754333496094, -119.62767791748047, -116.75782012939453, -113.88795471191406, -111.01809692382812, -108.14823150634766, -105.27836608886719, -102.40850830078125, -99.53864288330078, -96.66877746582031, -93.79891967773438, -90.9290542602539, -88.05918884277344, -85.1893310546875, -82.31946563720703, -79.44960021972656, -76.57974243164062, -73.70987701416016, -70.84001922607422, -67.97015380859375, -65.10029602050781, -62.230430603027344, -59.360565185546875, -56.49070358276367, -53.62084197998047, -50.750980377197266, -47.88111877441406, -45.011253356933594, -42.14139175415039, -39.27153015136719, -36.40166473388672, -33.531803131103516, -30.661949157714844, -27.79208755493164, -24.922224044799805, -22.05236053466797, -19.182498931884766, -16.312637329101562, -13.442773818969727, -10.57291030883789, -7.7030487060546875, -4.833186149597168, -1.9633235931396484, 0.9065389633178711, 3.7764015197753906, 6.64626407623291, 9.51612663269043, 12.385990142822266, 15.255851745605469, 18.125713348388672, 20.995576858520508, 23.865440368652344, 26.735301971435547, 29.60516357421875, 32.47502899169922, 35.34489059448242, 38.214752197265625, 41.08461380004883, 43.95447540283203, 46.8243408203125, 49.6942024230957, 52.564064025878906, 55.433929443359375, 58.30379104614258, 61.17365264892578]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 14.0, 14.0, 15.0, 28.0, 25.0, 34.0, 47.0, 59.0, 62.0, 57.0, 67.0, 76.0, 67.0, 51.0, 51.0, 48.0, 57.0, 37.0, 30.0, 31.0, 25.0, 25.0, 18.0, 13.0, 13.0, 8.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78485107421875, -32.36203384399414, -30.9392147064209, -29.516395568847656, -28.093578338623047, -26.670761108398438, -25.247941970825195, -23.825122833251953, -22.402305603027344, -20.979488372802734, -19.556669235229492, -18.13385009765625, -16.71103286743164, -15.288214683532715, -13.865396499633789, -12.442578315734863, -11.019760131835938, -9.596941947937012, -8.174123764038086, -6.75130558013916, -5.328487396240234, -3.9056692123413086, -2.482851028442383, -1.060032844543457, 0.36278533935546875, 1.7856035232543945, 3.2084217071533203, 4.631239891052246, 6.054058074951172, 7.476876258850098, 8.899694442749023, 10.32251262664795, 11.74532699584961, 13.168145179748535, 14.590963363647461, 16.013782501220703, 17.436599731445312, 18.859416961669922, 20.282236099243164, 21.705055236816406, 23.127872467041016, 24.550689697265625, 25.973508834838867, 27.39632797241211, 28.81914520263672, 30.241962432861328, 31.66478157043457, 33.08760070800781, 34.51041793823242, 35.93323516845703, 37.356056213378906, 38.778873443603516, 40.201690673828125, 41.624507904052734, 43.047325134277344, 44.47014617919922, 45.89296340942383, 47.31578063964844, 48.73860168457031, 50.16141891479492, 51.58423614501953, 53.00705337524414, 54.42987060546875, 55.852691650390625, 57.275508880615234]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 14.0, 8.0, 16.0, 32.0, 34.0, 58.0, 78.0, 131.0, 169.0, 265.0, 465.0, 738.0, 1345.0, 2485.0, 4837.0, 9789.0, 21434.0, 50626.0, 129081.0, 335383.0, 299191.0, 110865.0, 43944.0, 19058.0, 8666.0, 4389.0, 2311.0, 1272.0, 691.0, 381.0, 270.0, 156.0, 116.0, 74.0, 64.0, 24.0, 24.0, 20.0, 12.0, 5.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.53582763671875, -5.3568115234375, -5.17779541015625, -4.998779296875, -4.81976318359375, -4.6407470703125, -4.46173095703125, -4.28271484375, -4.10369873046875, -3.9246826171875, -3.74566650390625, -3.566650390625, -3.38763427734375, -3.2086181640625, -3.02960205078125, -2.8505859375, -2.67156982421875, -2.4925537109375, -2.31353759765625, -2.134521484375, -1.95550537109375, -1.7764892578125, -1.59747314453125, -1.41845703125, -1.23944091796875, -1.0604248046875, -0.88140869140625, -0.702392578125, -0.52337646484375, -0.3443603515625, -0.16534423828125, 0.013671875, 0.19268798828125, 0.3717041015625, 0.55072021484375, 0.729736328125, 0.90875244140625, 1.0877685546875, 1.26678466796875, 1.44580078125, 1.62481689453125, 1.8038330078125, 1.98284912109375, 2.161865234375, 2.34088134765625, 2.5198974609375, 2.69891357421875, 2.8779296875, 3.05694580078125, 3.2359619140625, 3.41497802734375, 3.593994140625, 3.77301025390625, 3.9520263671875, 4.13104248046875, 4.31005859375, 4.48907470703125, 4.6680908203125, 4.84710693359375, 5.026123046875, 5.20513916015625, 5.3841552734375, 5.56317138671875, 5.7421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 14.0, 12.0, 19.0, 16.0, 39.0, 43.0, 63.0, 81.0, 78.0, 87.0, 92.0, 96.0, 84.0, 75.0, 68.0, 47.0, 25.0, 23.0, 14.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.859375, -8.63421630859375, -8.4090576171875, -8.18389892578125, -7.958740234375, -7.73358154296875, -7.5084228515625, -7.28326416015625, -7.05810546875, -6.83294677734375, -6.6077880859375, -6.38262939453125, -6.157470703125, -5.93231201171875, -5.7071533203125, -5.48199462890625, -5.2568359375, -5.03167724609375, -4.8065185546875, -4.58135986328125, -4.356201171875, -4.13104248046875, -3.9058837890625, -3.68072509765625, -3.45556640625, -3.23040771484375, -3.0052490234375, -2.78009033203125, -2.554931640625, -2.32977294921875, -2.1046142578125, -1.87945556640625, -1.654296875, -1.42913818359375, -1.2039794921875, -0.97882080078125, -0.753662109375, -0.52850341796875, -0.3033447265625, -0.07818603515625, 0.14697265625, 0.37213134765625, 0.5972900390625, 0.82244873046875, 1.047607421875, 1.27276611328125, 1.4979248046875, 1.72308349609375, 1.9482421875, 2.17340087890625, 2.3985595703125, 2.62371826171875, 2.848876953125, 3.07403564453125, 3.2991943359375, 3.52435302734375, 3.74951171875, 3.97467041015625, 4.1998291015625, 4.42498779296875, 4.650146484375, 4.87530517578125, 5.1004638671875, 5.32562255859375, 5.55078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 4.0, 10.0, 21.0, 17.0, 40.0, 43.0, 83.0, 91.0, 146.0, 286.0, 433.0, 909.0, 2121.0, 7047.0, 34178.0, 299846.0, 626811.0, 60440.0, 10437.0, 3049.0, 1215.0, 559.0, 294.0, 154.0, 103.0, 76.0, 39.0, 32.0, 19.0, 14.0, 9.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.662353515625, -11.26220703125, -10.862060546875, -10.4619140625, -10.061767578125, -9.66162109375, -9.261474609375, -8.861328125, -8.461181640625, -8.06103515625, -7.660888671875, -7.2607421875, -6.860595703125, -6.46044921875, -6.060302734375, -5.66015625, -5.260009765625, -4.85986328125, -4.459716796875, -4.0595703125, -3.659423828125, -3.25927734375, -2.859130859375, -2.458984375, -2.058837890625, -1.65869140625, -1.258544921875, -0.8583984375, -0.458251953125, -0.05810546875, 0.342041015625, 0.7421875, 1.142333984375, 1.54248046875, 1.942626953125, 2.3427734375, 2.742919921875, 3.14306640625, 3.543212890625, 3.943359375, 4.343505859375, 4.74365234375, 5.143798828125, 5.5439453125, 5.944091796875, 6.34423828125, 6.744384765625, 7.14453125, 7.544677734375, 7.94482421875, 8.344970703125, 8.7451171875, 9.145263671875, 9.54541015625, 9.945556640625, 10.345703125, 10.745849609375, 11.14599609375, 11.546142578125, 11.9462890625, 12.346435546875, 12.74658203125, 13.146728515625, 13.546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 1.0, 7.0, 7.0, 12.0, 13.0, 17.0, 18.0, 24.0, 30.0, 41.0, 38.0, 51.0, 54.0, 72.0, 58.0, 60.0, 72.0, 72.0, 67.0, 50.0, 40.0, 36.0, 26.0, 33.0, 19.0, 22.0, 12.0, 12.0, 8.0, 10.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.28125, -21.6396484375, -20.998046875, -20.3564453125, -19.71484375, -19.0732421875, -18.431640625, -17.7900390625, -17.1484375, -16.5068359375, -15.865234375, -15.2236328125, -14.58203125, -13.9404296875, -13.298828125, -12.6572265625, -12.015625, -11.3740234375, -10.732421875, -10.0908203125, -9.44921875, -8.8076171875, -8.166015625, -7.5244140625, -6.8828125, -6.2412109375, -5.599609375, -4.9580078125, -4.31640625, -3.6748046875, -3.033203125, -2.3916015625, -1.75, -1.1083984375, -0.466796875, 0.1748046875, 0.81640625, 1.4580078125, 2.099609375, 2.7412109375, 3.3828125, 4.0244140625, 4.666015625, 5.3076171875, 5.94921875, 6.5908203125, 7.232421875, 7.8740234375, 8.515625, 9.1572265625, 9.798828125, 10.4404296875, 11.08203125, 11.7236328125, 12.365234375, 13.0068359375, 13.6484375, 14.2900390625, 14.931640625, 15.5732421875, 16.21484375, 16.8564453125, 17.498046875, 18.1396484375, 18.78125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 8.0, 14.0, 16.0, 27.0, 47.0, 122.0, 202.0, 644.0, 2596.0, 30944.0, 1004871.0, 6950.0, 1369.0, 392.0, 146.0, 69.0, 40.0, 23.0, 18.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3125, -24.4765625, -23.640625, -22.8046875, -21.96875, -21.1328125, -20.296875, -19.4609375, -18.625, -17.7890625, -16.953125, -16.1171875, -15.28125, -14.4453125, -13.609375, -12.7734375, -11.9375, -11.1015625, -10.265625, -9.4296875, -8.59375, -7.7578125, -6.921875, -6.0859375, -5.25, -4.4140625, -3.578125, -2.7421875, -1.90625, -1.0703125, -0.234375, 0.6015625, 1.4375, 2.2734375, 3.109375, 3.9453125, 4.78125, 5.6171875, 6.453125, 7.2890625, 8.125, 8.9609375, 9.796875, 10.6328125, 11.46875, 12.3046875, 13.140625, 13.9765625, 14.8125, 15.6484375, 16.484375, 17.3203125, 18.15625, 18.9921875, 19.828125, 20.6640625, 21.5, 22.3359375, 23.171875, 24.0078125, 24.84375, 25.6796875, 26.515625, 27.3515625, 28.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 10.0, 19.0, 41.0, 95.0, 270.0, 322.0, 122.0, 45.0, 24.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.003551483154296875, -0.003474414348602295, -0.003397345542907715, -0.0033202767372131348, -0.0032432079315185547, -0.0031661391258239746, -0.0030890703201293945, -0.0030120015144348145, -0.0029349327087402344, -0.0028578639030456543, -0.0027807950973510742, -0.002703726291656494, -0.002626657485961914, -0.002549588680267334, -0.002472519874572754, -0.002395451068878174, -0.0023183822631835938, -0.0022413134574890137, -0.0021642446517944336, -0.0020871758460998535, -0.0020101070404052734, -0.0019330382347106934, -0.0018559694290161133, -0.0017789006233215332, -0.0017018318176269531, -0.001624763011932373, -0.001547694206237793, -0.0014706254005432129, -0.0013935565948486328, -0.0013164877891540527, -0.0012394189834594727, -0.0011623501777648926, -0.0010852813720703125, -0.0010082125663757324, -0.0009311437606811523, -0.0008540749549865723, -0.0007770061492919922, -0.0006999373435974121, -0.000622868537902832, -0.000545799732208252, -0.0004687309265136719, -0.0003916621208190918, -0.0003145933151245117, -0.00023752450942993164, -0.00016045570373535156, -8.338689804077148e-05, -6.318092346191406e-06, 7.075071334838867e-05, 0.00014781951904296875, 0.00022488832473754883, 0.0003019571304321289, 0.000379025936126709, 0.00045609474182128906, 0.0005331635475158691, 0.0006102323532104492, 0.0006873011589050293, 0.0007643699645996094, 0.0008414387702941895, 0.0009185075759887695, 0.0009955763816833496, 0.0010726451873779297, 0.0011497139930725098, 0.0012267827987670898, 0.00130385160446167, 0.00138092041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 24.0, 25.0, 55.0, 86.0, 173.0, 344.0, 1170.0, 6873.0, 964426.0, 71123.0, 2934.0, 737.0, 279.0, 123.0, 72.0, 34.0, 22.0, 11.0, 10.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.6875, -29.953369140625, -29.21923828125, -28.485107421875, -27.7509765625, -27.016845703125, -26.28271484375, -25.548583984375, -24.814453125, -24.080322265625, -23.34619140625, -22.612060546875, -21.8779296875, -21.143798828125, -20.40966796875, -19.675537109375, -18.94140625, -18.207275390625, -17.47314453125, -16.739013671875, -16.0048828125, -15.270751953125, -14.53662109375, -13.802490234375, -13.068359375, -12.334228515625, -11.60009765625, -10.865966796875, -10.1318359375, -9.397705078125, -8.66357421875, -7.929443359375, -7.1953125, -6.461181640625, -5.72705078125, -4.992919921875, -4.2587890625, -3.524658203125, -2.79052734375, -2.056396484375, -1.322265625, -0.588134765625, 0.14599609375, 0.880126953125, 1.6142578125, 2.348388671875, 3.08251953125, 3.816650390625, 4.55078125, 5.284912109375, 6.01904296875, 6.753173828125, 7.4873046875, 8.221435546875, 8.95556640625, 9.689697265625, 10.423828125, 11.157958984375, 11.89208984375, 12.626220703125, 13.3603515625, 14.094482421875, 14.82861328125, 15.562744140625, 16.296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 25.0, 41.0, 107.0, 235.0, 296.0, 166.0, 63.0, 19.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.5390625, -8.09375, -7.6484375, -7.203125, -6.7578125, -6.3125, -5.8671875, -5.421875, -4.9765625, -4.53125, -4.0859375, -3.640625, -3.1953125, -2.75, -2.3046875, -1.859375, -1.4140625, -0.96875, -0.5234375, -0.078125, 0.3671875, 0.8125, 1.2578125, 1.703125, 2.1484375, 2.59375, 3.0390625, 3.484375, 3.9296875, 4.375, 4.8203125, 5.265625, 5.7109375, 6.15625, 6.6015625, 7.046875, 7.4921875, 7.9375, 8.3828125, 8.828125, 9.2734375, 9.71875, 10.1640625, 10.609375, 11.0546875, 11.5, 11.9453125, 12.390625, 12.8359375, 13.28125, 13.7265625, 14.171875, 14.6171875, 15.0625, 15.5078125, 15.953125, 16.3984375, 16.84375, 17.2890625, 17.734375, 18.1796875, 18.625, 19.0703125, 19.515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 17.0, 67.0, 140.0, 387.0, 267.0, 79.0, 14.0, 10.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.15481567382812, -235.982177734375, -228.8095245361328, -221.6368865966797, -214.4642333984375, -207.29159545898438, -200.11895751953125, -192.94631958007812, -185.77366638183594, -178.6010284423828, -171.42837524414062, -164.2557373046875, -157.08309936523438, -149.9104461669922, -142.73780822753906, -135.56515502929688, -128.39251708984375, -121.2198715209961, -114.04722595214844, -106.87458801269531, -99.70194244384766, -92.529296875, -85.35665893554688, -78.18401336669922, -71.01136779785156, -63.838722229003906, -56.666080474853516, -49.493438720703125, -42.32079315185547, -35.14814758300781, -27.975505828857422, -20.80286407470703, -13.630218505859375, -6.457574844360352, 0.7150688171386719, 7.887712478637695, 15.060356140136719, 22.233001708984375, 29.405643463134766, 36.578285217285156, 43.75093078613281, 50.92357635498047, 58.09621810913086, 65.26885986328125, 72.4415054321289, 79.61415100097656, 86.78678894042969, 93.95943450927734, 101.132080078125, 108.30472564697266, 115.47737121582031, 122.65000915527344, 129.82266235351562, 136.99530029296875, 144.16793823242188, 151.340576171875, 158.5132293701172, 165.6858673095703, 172.8585205078125, 180.03115844726562, 187.20379638671875, 194.37644958496094, 201.54908752441406, 208.72174072265625, 215.89437866210938]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 2.0, 11.0, 7.0, 6.0, 6.0, 20.0, 20.0, 19.0, 26.0, 37.0, 36.0, 50.0, 43.0, 44.0, 62.0, 81.0, 86.0, 60.0, 42.0, 42.0, 44.0, 32.0, 38.0, 19.0, 41.0, 29.0, 17.0, 14.0, 18.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-80.77488708496094, -78.02449798583984, -75.27410125732422, -72.52371215820312, -69.7733154296875, -67.0229263305664, -64.27253723144531, -61.52214431762695, -58.771751403808594, -56.021358489990234, -53.270965576171875, -50.52057647705078, -47.77018356323242, -45.01979064941406, -42.26940155029297, -39.51900863647461, -36.76861572265625, -34.01822280883789, -31.267831802368164, -28.517440795898438, -25.767047882080078, -23.01665496826172, -20.266263961791992, -17.515872955322266, -14.765480041503906, -12.015088081359863, -9.26469612121582, -6.514304161071777, -3.7639122009277344, -1.0135202407836914, 1.7368717193603516, 4.487262725830078, 7.237663269042969, 9.988055229187012, 12.738447189331055, 15.488839149475098, 18.23923110961914, 20.9896240234375, 23.740015029907227, 26.490406036376953, 29.240798950195312, 31.991191864013672, 34.74158477783203, 37.491973876953125, 40.242366790771484, 42.992759704589844, 45.74314880371094, 48.4935417175293, 51.243934631347656, 53.994327545166016, 56.744720458984375, 59.49510955810547, 62.24550247192383, 64.99589538574219, 67.74628448486328, 70.49667358398438, 73.2470703125, 75.9974594116211, 78.74785614013672, 81.49824523925781, 84.24864196777344, 86.99903106689453, 89.74942016601562, 92.49981689453125, 95.25020599365234]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 12.0, 16.0, 18.0, 27.0, 38.0, 60.0, 110.0, 199.0, 529.0, 1823.0, 8421.0, 66376.0, 3255858.0, 823553.0, 30389.0, 4894.0, 1144.0, 401.0, 178.0, 67.0, 58.0, 27.0, 25.0, 12.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8228759765625, -9.442626953125, -9.0623779296875, -8.68212890625, -8.3018798828125, -7.921630859375, -7.5413818359375, -7.1611328125, -6.7808837890625, -6.400634765625, -6.0203857421875, -5.64013671875, -5.2598876953125, -4.879638671875, -4.4993896484375, -4.119140625, -3.7388916015625, -3.358642578125, -2.9783935546875, -2.59814453125, -2.2178955078125, -1.837646484375, -1.4573974609375, -1.0771484375, -0.6968994140625, -0.316650390625, 0.0635986328125, 0.44384765625, 0.8240966796875, 1.204345703125, 1.5845947265625, 1.96484375, 2.3450927734375, 2.725341796875, 3.1055908203125, 3.48583984375, 3.8660888671875, 4.246337890625, 4.6265869140625, 5.0068359375, 5.3870849609375, 5.767333984375, 6.1475830078125, 6.52783203125, 6.9080810546875, 7.288330078125, 7.6685791015625, 8.048828125, 8.4290771484375, 8.809326171875, 9.1895751953125, 9.56982421875, 9.9500732421875, 10.330322265625, 10.7105712890625, 11.0908203125, 11.4710693359375, 11.851318359375, 12.2315673828125, 12.61181640625, 12.9920654296875, 13.372314453125, 13.7525634765625, 14.1328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 9.0, 8.0, 11.0, 16.0, 34.0, 39.0, 40.0, 51.0, 70.0, 84.0, 65.0, 97.0, 77.0, 98.0, 64.0, 77.0, 44.0, 26.0, 31.0, 28.0, 15.0, 8.0, 10.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73046875, -3.55059814453125, -3.3707275390625, -3.19085693359375, -3.010986328125, -2.83111572265625, -2.6512451171875, -2.47137451171875, -2.29150390625, -2.11163330078125, -1.9317626953125, -1.75189208984375, -1.572021484375, -1.39215087890625, -1.2122802734375, -1.03240966796875, -0.8525390625, -0.67266845703125, -0.4927978515625, -0.31292724609375, -0.133056640625, 0.04681396484375, 0.2266845703125, 0.40655517578125, 0.58642578125, 0.76629638671875, 0.9461669921875, 1.12603759765625, 1.305908203125, 1.48577880859375, 1.6656494140625, 1.84552001953125, 2.025390625, 2.20526123046875, 2.3851318359375, 2.56500244140625, 2.744873046875, 2.92474365234375, 3.1046142578125, 3.28448486328125, 3.46435546875, 3.64422607421875, 3.8240966796875, 4.00396728515625, 4.183837890625, 4.36370849609375, 4.5435791015625, 4.72344970703125, 4.9033203125, 5.08319091796875, 5.2630615234375, 5.44293212890625, 5.622802734375, 5.80267333984375, 5.9825439453125, 6.16241455078125, 6.34228515625, 6.52215576171875, 6.7020263671875, 6.88189697265625, 7.061767578125, 7.24163818359375, 7.4215087890625, 7.60137939453125, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 5.0, 11.0, 17.0, 18.0, 28.0, 43.0, 59.0, 102.0, 177.0, 373.0, 772.0, 1877.0, 5885.0, 24604.0, 149394.0, 3286537.0, 659434.0, 49822.0, 9915.0, 2919.0, 1101.0, 512.0, 238.0, 152.0, 88.0, 63.0, 42.0, 29.0, 19.0, 13.0, 10.0, 6.0, 5.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.6015625, -10.296630859375, -9.99169921875, -9.686767578125, -9.3818359375, -9.076904296875, -8.77197265625, -8.467041015625, -8.162109375, -7.857177734375, -7.55224609375, -7.247314453125, -6.9423828125, -6.637451171875, -6.33251953125, -6.027587890625, -5.72265625, -5.417724609375, -5.11279296875, -4.807861328125, -4.5029296875, -4.197998046875, -3.89306640625, -3.588134765625, -3.283203125, -2.978271484375, -2.67333984375, -2.368408203125, -2.0634765625, -1.758544921875, -1.45361328125, -1.148681640625, -0.84375, -0.538818359375, -0.23388671875, 0.071044921875, 0.3759765625, 0.680908203125, 0.98583984375, 1.290771484375, 1.595703125, 1.900634765625, 2.20556640625, 2.510498046875, 2.8154296875, 3.120361328125, 3.42529296875, 3.730224609375, 4.03515625, 4.340087890625, 4.64501953125, 4.949951171875, 5.2548828125, 5.559814453125, 5.86474609375, 6.169677734375, 6.474609375, 6.779541015625, 7.08447265625, 7.389404296875, 7.6943359375, 7.999267578125, 8.30419921875, 8.609130859375, 8.9140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 5.0, 5.0, 8.0, 9.0, 12.0, 14.0, 14.0, 24.0, 31.0, 38.0, 49.0, 67.0, 94.0, 118.0, 200.0, 341.0, 603.0, 855.0, 624.0, 406.0, 193.0, 109.0, 74.0, 54.0, 21.0, 26.0, 7.0, 7.0, 11.0, 6.0, 6.0, 7.0, 6.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.5716552734375, -7.322998046875, -7.0743408203125, -6.82568359375, -6.5770263671875, -6.328369140625, -6.0797119140625, -5.8310546875, -5.5823974609375, -5.333740234375, -5.0850830078125, -4.83642578125, -4.5877685546875, -4.339111328125, -4.0904541015625, -3.841796875, -3.5931396484375, -3.344482421875, -3.0958251953125, -2.84716796875, -2.5985107421875, -2.349853515625, -2.1011962890625, -1.8525390625, -1.6038818359375, -1.355224609375, -1.1065673828125, -0.85791015625, -0.6092529296875, -0.360595703125, -0.1119384765625, 0.13671875, 0.3853759765625, 0.634033203125, 0.8826904296875, 1.13134765625, 1.3800048828125, 1.628662109375, 1.8773193359375, 2.1259765625, 2.3746337890625, 2.623291015625, 2.8719482421875, 3.12060546875, 3.3692626953125, 3.617919921875, 3.8665771484375, 4.115234375, 4.3638916015625, 4.612548828125, 4.8612060546875, 5.10986328125, 5.3585205078125, 5.607177734375, 5.8558349609375, 6.1044921875, 6.3531494140625, 6.601806640625, 6.8504638671875, 7.09912109375, 7.3477783203125, 7.596435546875, 7.8450927734375, 8.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 13.0, 18.0, 64.0, 98.0, 219.0, 256.0, 169.0, 89.0, 32.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-171.29298400878906, -167.5221405029297, -163.7512969970703, -159.98045349121094, -156.20960998535156, -152.4387664794922, -148.6679229736328, -144.89707946777344, -141.12623596191406, -137.3553924560547, -133.5845489501953, -129.81370544433594, -126.04286193847656, -122.27201843261719, -118.50117492675781, -114.73033142089844, -110.95948791503906, -107.18864440917969, -103.41780090332031, -99.64695739746094, -95.87611389160156, -92.10527038574219, -88.33442687988281, -84.56358337402344, -80.79273223876953, -77.02188873291016, -73.25104522705078, -69.4802017211914, -65.70935821533203, -61.938514709472656, -58.16767120361328, -54.396827697753906, -50.62598419189453, -46.855140686035156, -43.08429718017578, -39.313453674316406, -35.54261016845703, -31.771764755249023, -28.00092124938965, -24.230077743530273, -20.4592342376709, -16.688390731811523, -12.917547225952148, -9.146702766418457, -5.375859260559082, -1.6050148010253906, 2.1658287048339844, 5.936672210693359, 9.707515716552734, 13.47835922241211, 17.249202728271484, 21.02004623413086, 24.790889739990234, 28.561735153198242, 32.33258056640625, 36.103424072265625, 39.874267578125, 43.645111083984375, 47.41595458984375, 51.186798095703125, 54.9576416015625, 58.728485107421875, 62.49932861328125, 66.27017211914062, 70.041015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 1.0, 5.0, 6.0, 12.0, 17.0, 23.0, 13.0, 19.0, 29.0, 49.0, 47.0, 43.0, 49.0, 45.0, 35.0, 62.0, 50.0, 55.0, 52.0, 49.0, 58.0, 47.0, 42.0, 38.0, 39.0, 24.0, 19.0, 18.0, 16.0, 4.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.02311706542969, -59.32658386230469, -57.63005065917969, -55.93351364135742, -54.23698043823242, -52.54044723510742, -50.843910217285156, -49.147377014160156, -47.450843811035156, -45.754310607910156, -44.057777404785156, -42.36124038696289, -40.66470718383789, -38.96817398071289, -37.271636962890625, -35.575103759765625, -33.878570556640625, -32.182037353515625, -30.485502243041992, -28.78896713256836, -27.09243392944336, -25.39590072631836, -23.699365615844727, -22.002830505371094, -20.306297302246094, -18.609764099121094, -16.91322898864746, -15.216694831848145, -13.520160675048828, -11.823626518249512, -10.127092361450195, -8.430558204650879, -6.734020233154297, -5.0374860763549805, -3.340951919555664, -1.6444177627563477, 0.05211639404296875, 1.7486505508422852, 3.4451847076416016, 5.141718864440918, 6.838253021240234, 8.53478717803955, 10.231321334838867, 11.927855491638184, 13.6243896484375, 15.320923805236816, 17.017457962036133, 18.713993072509766, 20.410526275634766, 22.107059478759766, 23.8035945892334, 25.50012969970703, 27.19666290283203, 28.89319610595703, 30.589731216430664, 32.2862663269043, 33.9827995300293, 35.6793327331543, 37.37586975097656, 39.07240295410156, 40.76893615722656, 42.46546936035156, 44.16200256347656, 45.85853958129883, 47.55507278442383]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 18.0, 28.0, 37.0, 66.0, 101.0, 153.0, 230.0, 376.0, 576.0, 1029.0, 1886.0, 3602.0, 7184.0, 14418.0, 29942.0, 62879.0, 130906.0, 256986.0, 268575.0, 139363.0, 66953.0, 31813.0, 15372.0, 7474.0, 3743.0, 2008.0, 1167.0, 622.0, 335.0, 242.0, 148.0, 81.0, 59.0, 42.0, 36.0, 18.0, 11.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.5, -4.35955810546875, -4.2191162109375, -4.07867431640625, -3.938232421875, -3.79779052734375, -3.6573486328125, -3.51690673828125, -3.37646484375, -3.23602294921875, -3.0955810546875, -2.95513916015625, -2.814697265625, -2.67425537109375, -2.5338134765625, -2.39337158203125, -2.2529296875, -2.11248779296875, -1.9720458984375, -1.83160400390625, -1.691162109375, -1.55072021484375, -1.4102783203125, -1.26983642578125, -1.12939453125, -0.98895263671875, -0.8485107421875, -0.70806884765625, -0.567626953125, -0.42718505859375, -0.2867431640625, -0.14630126953125, -0.005859375, 0.13458251953125, 0.2750244140625, 0.41546630859375, 0.555908203125, 0.69635009765625, 0.8367919921875, 0.97723388671875, 1.11767578125, 1.25811767578125, 1.3985595703125, 1.53900146484375, 1.679443359375, 1.81988525390625, 1.9603271484375, 2.10076904296875, 2.2412109375, 2.38165283203125, 2.5220947265625, 2.66253662109375, 2.802978515625, 2.94342041015625, 3.0838623046875, 3.22430419921875, 3.36474609375, 3.50518798828125, 3.6456298828125, 3.78607177734375, 3.926513671875, 4.06695556640625, 4.2073974609375, 4.34783935546875, 4.48828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 9.0, 12.0, 10.0, 20.0, 14.0, 17.0, 22.0, 36.0, 27.0, 52.0, 39.0, 41.0, 48.0, 51.0, 52.0, 45.0, 46.0, 54.0, 52.0, 53.0, 39.0, 28.0, 32.0, 27.0, 25.0, 23.0, 16.0, 17.0, 12.0, 17.0, 12.0, 6.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.638671875, -3.539398193359375, -3.44012451171875, -3.340850830078125, -3.2415771484375, -3.142303466796875, -3.04302978515625, -2.943756103515625, -2.844482421875, -2.745208740234375, -2.64593505859375, -2.546661376953125, -2.4473876953125, -2.348114013671875, -2.24884033203125, -2.149566650390625, -2.05029296875, -1.951019287109375, -1.85174560546875, -1.752471923828125, -1.6531982421875, -1.553924560546875, -1.45465087890625, -1.355377197265625, -1.256103515625, -1.156829833984375, -1.05755615234375, -0.958282470703125, -0.8590087890625, -0.759735107421875, -0.66046142578125, -0.561187744140625, -0.4619140625, -0.362640380859375, -0.26336669921875, -0.164093017578125, -0.0648193359375, 0.034454345703125, 0.13372802734375, 0.233001708984375, 0.332275390625, 0.431549072265625, 0.53082275390625, 0.630096435546875, 0.7293701171875, 0.828643798828125, 0.92791748046875, 1.027191162109375, 1.12646484375, 1.225738525390625, 1.32501220703125, 1.424285888671875, 1.5235595703125, 1.622833251953125, 1.72210693359375, 1.821380615234375, 1.920654296875, 2.019927978515625, 2.11920166015625, 2.218475341796875, 2.3177490234375, 2.417022705078125, 2.51629638671875, 2.615570068359375, 2.71484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 8.0, 7.0, 8.0, 16.0, 24.0, 31.0, 40.0, 50.0, 62.0, 97.0, 107.0, 171.0, 222.0, 273.0, 353.0, 559.0, 757.0, 1203.0, 2070.0, 4212.0, 11807.0, 46240.0, 225574.0, 600794.0, 113238.0, 25130.0, 7305.0, 3022.0, 1683.0, 974.0, 682.0, 431.0, 348.0, 264.0, 202.0, 150.0, 126.0, 73.0, 59.0, 35.0, 39.0, 27.0, 24.0, 12.0, 16.0, 8.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.421875, -8.1527099609375, -7.883544921875, -7.6143798828125, -7.34521484375, -7.0760498046875, -6.806884765625, -6.5377197265625, -6.2685546875, -5.9993896484375, -5.730224609375, -5.4610595703125, -5.19189453125, -4.9227294921875, -4.653564453125, -4.3843994140625, -4.115234375, -3.8460693359375, -3.576904296875, -3.3077392578125, -3.03857421875, -2.7694091796875, -2.500244140625, -2.2310791015625, -1.9619140625, -1.6927490234375, -1.423583984375, -1.1544189453125, -0.88525390625, -0.6160888671875, -0.346923828125, -0.0777587890625, 0.19140625, 0.4605712890625, 0.729736328125, 0.9989013671875, 1.26806640625, 1.5372314453125, 1.806396484375, 2.0755615234375, 2.3447265625, 2.6138916015625, 2.883056640625, 3.1522216796875, 3.42138671875, 3.6905517578125, 3.959716796875, 4.2288818359375, 4.498046875, 4.7672119140625, 5.036376953125, 5.3055419921875, 5.57470703125, 5.8438720703125, 6.113037109375, 6.3822021484375, 6.6513671875, 6.9205322265625, 7.189697265625, 7.4588623046875, 7.72802734375, 7.9971923828125, 8.266357421875, 8.5355224609375, 8.8046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 9.0, 7.0, 10.0, 18.0, 11.0, 23.0, 22.0, 24.0, 31.0, 31.0, 34.0, 41.0, 45.0, 40.0, 41.0, 47.0, 50.0, 53.0, 36.0, 40.0, 43.0, 40.0, 36.0, 37.0, 23.0, 28.0, 17.0, 14.0, 26.0, 19.0, 23.0, 16.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.6015625, -12.192138671875, -11.78271484375, -11.373291015625, -10.9638671875, -10.554443359375, -10.14501953125, -9.735595703125, -9.326171875, -8.916748046875, -8.50732421875, -8.097900390625, -7.6884765625, -7.279052734375, -6.86962890625, -6.460205078125, -6.05078125, -5.641357421875, -5.23193359375, -4.822509765625, -4.4130859375, -4.003662109375, -3.59423828125, -3.184814453125, -2.775390625, -2.365966796875, -1.95654296875, -1.547119140625, -1.1376953125, -0.728271484375, -0.31884765625, 0.090576171875, 0.5, 0.909423828125, 1.31884765625, 1.728271484375, 2.1376953125, 2.547119140625, 2.95654296875, 3.365966796875, 3.775390625, 4.184814453125, 4.59423828125, 5.003662109375, 5.4130859375, 5.822509765625, 6.23193359375, 6.641357421875, 7.05078125, 7.460205078125, 7.86962890625, 8.279052734375, 8.6884765625, 9.097900390625, 9.50732421875, 9.916748046875, 10.326171875, 10.735595703125, 11.14501953125, 11.554443359375, 11.9638671875, 12.373291015625, 12.78271484375, 13.192138671875, 13.6015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 8.0, 8.0, 7.0, 10.0, 12.0, 28.0, 33.0, 51.0, 75.0, 115.0, 175.0, 310.0, 477.0, 853.0, 1846.0, 4872.0, 15736.0, 74247.0, 711578.0, 193740.0, 30669.0, 7925.0, 2883.0, 1229.0, 623.0, 360.0, 238.0, 140.0, 107.0, 53.0, 42.0, 39.0, 17.0, 9.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.8828125, -4.733642578125, -4.58447265625, -4.435302734375, -4.2861328125, -4.136962890625, -3.98779296875, -3.838623046875, -3.689453125, -3.540283203125, -3.39111328125, -3.241943359375, -3.0927734375, -2.943603515625, -2.79443359375, -2.645263671875, -2.49609375, -2.346923828125, -2.19775390625, -2.048583984375, -1.8994140625, -1.750244140625, -1.60107421875, -1.451904296875, -1.302734375, -1.153564453125, -1.00439453125, -0.855224609375, -0.7060546875, -0.556884765625, -0.40771484375, -0.258544921875, -0.109375, 0.039794921875, 0.18896484375, 0.338134765625, 0.4873046875, 0.636474609375, 0.78564453125, 0.934814453125, 1.083984375, 1.233154296875, 1.38232421875, 1.531494140625, 1.6806640625, 1.829833984375, 1.97900390625, 2.128173828125, 2.27734375, 2.426513671875, 2.57568359375, 2.724853515625, 2.8740234375, 3.023193359375, 3.17236328125, 3.321533203125, 3.470703125, 3.619873046875, 3.76904296875, 3.918212890625, 4.0673828125, 4.216552734375, 4.36572265625, 4.514892578125, 4.6640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 19.0, 22.0, 24.0, 23.0, 38.0, 53.0, 96.0, 156.0, 178.0, 103.0, 61.0, 49.0, 45.0, 27.0, 18.0, 14.0, 14.0, 8.0, 10.0, 9.0, 5.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008721351623535156, -0.0008265599608421326, -0.0007809847593307495, -0.0007354095578193665, -0.0006898343563079834, -0.0006442591547966003, -0.0005986839532852173, -0.0005531087517738342, -0.0005075335502624512, -0.0004619583487510681, -0.00041638314723968506, -0.000370807945728302, -0.00032523274421691895, -0.0002796575427055359, -0.00023408234119415283, -0.00018850713968276978, -0.00014293193817138672, -9.735673666000366e-05, -5.1781535148620605e-05, -6.206333637237549e-06, 3.936886787414551e-05, 8.494406938552856e-05, 0.00013051927089691162, 0.00017609447240829468, 0.00022166967391967773, 0.0002672448754310608, 0.00031282007694244385, 0.0003583952784538269, 0.00040397047996520996, 0.000449545681476593, 0.0004951208829879761, 0.0005406960844993591, 0.0005862712860107422, 0.0006318464875221252, 0.0006774216890335083, 0.0007229968905448914, 0.0007685720920562744, 0.0008141472935676575, 0.0008597224950790405, 0.0009052976965904236, 0.0009508728981018066, 0.0009964480996131897, 0.0010420233011245728, 0.0010875985026359558, 0.0011331737041473389, 0.001178748905658722, 0.001224324107170105, 0.001269899308681488, 0.001315474510192871, 0.0013610497117042542, 0.0014066249132156372, 0.0014522001147270203, 0.0014977753162384033, 0.0015433505177497864, 0.0015889257192611694, 0.0016345009207725525, 0.0016800761222839355, 0.0017256513237953186, 0.0017712265253067017, 0.0018168017268180847, 0.0018623769283294678, 0.0019079521298408508, 0.001953527331352234, 0.001999102532863617, 0.002044677734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 10.0, 16.0, 16.0, 24.0, 34.0, 49.0, 83.0, 140.0, 218.0, 429.0, 888.0, 1943.0, 4447.0, 12619.0, 48727.0, 394445.0, 512498.0, 50501.0, 12957.0, 4531.0, 1904.0, 941.0, 425.0, 277.0, 143.0, 111.0, 57.0, 39.0, 16.0, 20.0, 17.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2216796875, -4.076171875, -3.9306640625, -3.78515625, -3.6396484375, -3.494140625, -3.3486328125, -3.203125, -3.0576171875, -2.912109375, -2.7666015625, -2.62109375, -2.4755859375, -2.330078125, -2.1845703125, -2.0390625, -1.8935546875, -1.748046875, -1.6025390625, -1.45703125, -1.3115234375, -1.166015625, -1.0205078125, -0.875, -0.7294921875, -0.583984375, -0.4384765625, -0.29296875, -0.1474609375, -0.001953125, 0.1435546875, 0.2890625, 0.4345703125, 0.580078125, 0.7255859375, 0.87109375, 1.0166015625, 1.162109375, 1.3076171875, 1.453125, 1.5986328125, 1.744140625, 1.8896484375, 2.03515625, 2.1806640625, 2.326171875, 2.4716796875, 2.6171875, 2.7626953125, 2.908203125, 3.0537109375, 3.19921875, 3.3447265625, 3.490234375, 3.6357421875, 3.78125, 3.9267578125, 4.072265625, 4.2177734375, 4.36328125, 4.5087890625, 4.654296875, 4.7998046875, 4.9453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 14.0, 9.0, 7.0, 5.0, 10.0, 20.0, 23.0, 43.0, 52.0, 55.0, 49.0, 95.0, 114.0, 92.0, 97.0, 67.0, 55.0, 38.0, 29.0, 28.0, 18.0, 22.0, 8.0, 8.0, 11.0, 3.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.53094482421875, -4.3939208984375, -4.25689697265625, -4.119873046875, -3.98284912109375, -3.8458251953125, -3.70880126953125, -3.57177734375, -3.43475341796875, -3.2977294921875, -3.16070556640625, -3.023681640625, -2.88665771484375, -2.7496337890625, -2.61260986328125, -2.4755859375, -2.33856201171875, -2.2015380859375, -2.06451416015625, -1.927490234375, -1.79046630859375, -1.6534423828125, -1.51641845703125, -1.37939453125, -1.24237060546875, -1.1053466796875, -0.96832275390625, -0.831298828125, -0.69427490234375, -0.5572509765625, -0.42022705078125, -0.283203125, -0.14617919921875, -0.0091552734375, 0.12786865234375, 0.264892578125, 0.40191650390625, 0.5389404296875, 0.67596435546875, 0.81298828125, 0.95001220703125, 1.0870361328125, 1.22406005859375, 1.361083984375, 1.49810791015625, 1.6351318359375, 1.77215576171875, 1.9091796875, 2.04620361328125, 2.1832275390625, 2.32025146484375, 2.457275390625, 2.59429931640625, 2.7313232421875, 2.86834716796875, 3.00537109375, 3.14239501953125, 3.2794189453125, 3.41644287109375, 3.553466796875, 3.69049072265625, 3.8275146484375, 3.96453857421875, 4.1015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 7.0, 13.0, 38.0, 99.0, 228.0, 265.0, 154.0, 90.0, 43.0, 21.0, 24.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-142.86318969726562, -139.10525512695312, -135.34732055664062, -131.58938598632812, -127.83145141601562, -124.07351684570312, -120.3155746459961, -116.5576400756836, -112.7997055053711, -109.0417709350586, -105.2838363647461, -101.5259017944336, -97.76795959472656, -94.01002502441406, -90.25209045410156, -86.49415588378906, -82.73622131347656, -78.97828674316406, -75.22035217285156, -71.46241760253906, -67.70448303222656, -63.9465446472168, -60.18860626220703, -56.43067169189453, -52.67273712158203, -48.91480255126953, -45.15686798095703, -41.398929595947266, -37.640995025634766, -33.883060455322266, -30.125123977661133, -26.3671875, -22.60924530029297, -18.85131072998047, -15.093374252319336, -11.33543872833252, -7.577503204345703, -3.819568634033203, -0.06163215637207031, 3.6963043212890625, 7.4542388916015625, 11.212174415588379, 14.970109939575195, 18.728046417236328, 22.485980987548828, 26.243915557861328, 30.00185203552246, 33.759788513183594, 37.517723083496094, 41.275657653808594, 45.033592224121094, 48.79153060913086, 52.54946517944336, 56.30739974975586, 60.065338134765625, 63.823272705078125, 67.58120727539062, 71.33914184570312, 75.09707641601562, 78.85501098632812, 82.61294555664062, 86.37088012695312, 90.12882232666016, 93.88675689697266, 97.64469146728516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 6.0, 7.0, 5.0, 16.0, 14.0, 16.0, 14.0, 28.0, 25.0, 31.0, 29.0, 19.0, 34.0, 42.0, 43.0, 62.0, 69.0, 92.0, 76.0, 53.0, 33.0, 35.0, 36.0, 32.0, 28.0, 25.0, 25.0, 19.0, 23.0, 12.0, 6.0, 13.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-73.421630859375, -71.5413589477539, -69.66108703613281, -67.78080749511719, -65.9005355834961, -64.020263671875, -62.139991760253906, -60.25971984863281, -58.37944412231445, -56.49917221069336, -54.618896484375, -52.738624572753906, -50.85835266113281, -48.97807693481445, -47.09780502319336, -45.217529296875, -43.337257385253906, -41.45698547363281, -39.57670974731445, -37.69643783569336, -35.816162109375, -33.935890197753906, -32.05561828613281, -30.175344467163086, -28.29507064819336, -26.414796829223633, -24.534523010253906, -22.654251098632812, -20.773977279663086, -18.89370346069336, -17.013431549072266, -15.133157730102539, -13.252883911132812, -11.372610092163086, -9.492337226867676, -7.612063884735107, -5.731790542602539, -3.8515167236328125, -1.9712438583374023, -0.09097099304199219, 1.7893028259277344, 3.6695761680603027, 5.549849510192871, 7.4301228523254395, 9.310396194458008, 11.190670013427734, 13.070942878723145, 14.951215744018555, 16.83148956298828, 18.711763381958008, 20.592037200927734, 22.472309112548828, 24.352582931518555, 26.23285675048828, 28.113128662109375, 29.9934024810791, 31.873676300048828, 33.75394821166992, 35.63422393798828, 37.514495849609375, 39.39476776123047, 41.27504348754883, 43.15531539916992, 45.03559112548828, 46.915863037109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 9.0, 19.0, 29.0, 39.0, 65.0, 104.0, 143.0, 261.0, 539.0, 1083.0, 2521.0, 6557.0, 21658.0, 104413.0, 1990193.0, 1928892.0, 103682.0, 22445.0, 6823.0, 2554.0, 1137.0, 489.0, 241.0, 135.0, 74.0, 57.0, 32.0, 29.0, 14.0, 11.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.9263916015625, -4.712158203125, -4.4979248046875, -4.28369140625, -4.0694580078125, -3.855224609375, -3.6409912109375, -3.4267578125, -3.2125244140625, -2.998291015625, -2.7840576171875, -2.56982421875, -2.3555908203125, -2.141357421875, -1.9271240234375, -1.712890625, -1.4986572265625, -1.284423828125, -1.0701904296875, -0.85595703125, -0.6417236328125, -0.427490234375, -0.2132568359375, 0.0009765625, 0.2152099609375, 0.429443359375, 0.6436767578125, 0.85791015625, 1.0721435546875, 1.286376953125, 1.5006103515625, 1.71484375, 1.9290771484375, 2.143310546875, 2.3575439453125, 2.57177734375, 2.7860107421875, 3.000244140625, 3.2144775390625, 3.4287109375, 3.6429443359375, 3.857177734375, 4.0714111328125, 4.28564453125, 4.4998779296875, 4.714111328125, 4.9283447265625, 5.142578125, 5.3568115234375, 5.571044921875, 5.7852783203125, 5.99951171875, 6.2137451171875, 6.427978515625, 6.6422119140625, 6.8564453125, 7.0706787109375, 7.284912109375, 7.4991455078125, 7.71337890625, 7.9276123046875, 8.141845703125, 8.3560791015625, 8.5703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 15.0, 15.0, 26.0, 31.0, 37.0, 42.0, 38.0, 53.0, 57.0, 65.0, 77.0, 62.0, 63.0, 71.0, 56.0, 59.0, 43.0, 34.0, 28.0, 27.0, 22.0, 23.0, 12.0, 9.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.0234375, -4.90264892578125, -4.7818603515625, -4.66107177734375, -4.540283203125, -4.41949462890625, -4.2987060546875, -4.17791748046875, -4.05712890625, -3.93634033203125, -3.8155517578125, -3.69476318359375, -3.573974609375, -3.45318603515625, -3.3323974609375, -3.21160888671875, -3.0908203125, -2.97003173828125, -2.8492431640625, -2.72845458984375, -2.607666015625, -2.48687744140625, -2.3660888671875, -2.24530029296875, -2.12451171875, -2.00372314453125, -1.8829345703125, -1.76214599609375, -1.641357421875, -1.52056884765625, -1.3997802734375, -1.27899169921875, -1.158203125, -1.03741455078125, -0.9166259765625, -0.79583740234375, -0.675048828125, -0.55426025390625, -0.4334716796875, -0.31268310546875, -0.19189453125, -0.07110595703125, 0.0496826171875, 0.17047119140625, 0.291259765625, 0.41204833984375, 0.5328369140625, 0.65362548828125, 0.7744140625, 0.89520263671875, 1.0159912109375, 1.13677978515625, 1.257568359375, 1.37835693359375, 1.4991455078125, 1.61993408203125, 1.74072265625, 1.86151123046875, 1.9822998046875, 2.10308837890625, 2.223876953125, 2.34466552734375, 2.4654541015625, 2.58624267578125, 2.70703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 7.0, 9.0, 12.0, 19.0, 28.0, 25.0, 41.0, 67.0, 107.0, 210.0, 350.0, 762.0, 1672.0, 4300.0, 12204.0, 45491.0, 274287.0, 3339343.0, 441286.0, 54485.0, 12873.0, 3871.0, 1380.0, 631.0, 305.0, 169.0, 99.0, 64.0, 43.0, 35.0, 25.0, 21.0, 15.0, 11.0, 10.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5, -7.2698974609375, -7.039794921875, -6.8096923828125, -6.57958984375, -6.3494873046875, -6.119384765625, -5.8892822265625, -5.6591796875, -5.4290771484375, -5.198974609375, -4.9688720703125, -4.73876953125, -4.5086669921875, -4.278564453125, -4.0484619140625, -3.818359375, -3.5882568359375, -3.358154296875, -3.1280517578125, -2.89794921875, -2.6678466796875, -2.437744140625, -2.2076416015625, -1.9775390625, -1.7474365234375, -1.517333984375, -1.2872314453125, -1.05712890625, -0.8270263671875, -0.596923828125, -0.3668212890625, -0.13671875, 0.0933837890625, 0.323486328125, 0.5535888671875, 0.78369140625, 1.0137939453125, 1.243896484375, 1.4739990234375, 1.7041015625, 1.9342041015625, 2.164306640625, 2.3944091796875, 2.62451171875, 2.8546142578125, 3.084716796875, 3.3148193359375, 3.544921875, 3.7750244140625, 4.005126953125, 4.2352294921875, 4.46533203125, 4.6954345703125, 4.925537109375, 5.1556396484375, 5.3857421875, 5.6158447265625, 5.845947265625, 6.0760498046875, 6.30615234375, 6.5362548828125, 6.766357421875, 6.9964599609375, 7.2265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 7.0, 5.0, 10.0, 5.0, 11.0, 10.0, 7.0, 18.0, 24.0, 36.0, 41.0, 42.0, 71.0, 97.0, 138.0, 220.0, 332.0, 625.0, 719.0, 611.0, 415.0, 199.0, 127.0, 81.0, 65.0, 41.0, 24.0, 22.0, 17.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5860595703125, -6.383056640625, -6.1800537109375, -5.97705078125, -5.7740478515625, -5.571044921875, -5.3680419921875, -5.1650390625, -4.9620361328125, -4.759033203125, -4.5560302734375, -4.35302734375, -4.1500244140625, -3.947021484375, -3.7440185546875, -3.541015625, -3.3380126953125, -3.135009765625, -2.9320068359375, -2.72900390625, -2.5260009765625, -2.322998046875, -2.1199951171875, -1.9169921875, -1.7139892578125, -1.510986328125, -1.3079833984375, -1.10498046875, -0.9019775390625, -0.698974609375, -0.4959716796875, -0.29296875, -0.0899658203125, 0.113037109375, 0.3160400390625, 0.51904296875, 0.7220458984375, 0.925048828125, 1.1280517578125, 1.3310546875, 1.5340576171875, 1.737060546875, 1.9400634765625, 2.14306640625, 2.3460693359375, 2.549072265625, 2.7520751953125, 2.955078125, 3.1580810546875, 3.361083984375, 3.5640869140625, 3.76708984375, 3.9700927734375, 4.173095703125, 4.3760986328125, 4.5791015625, 4.7821044921875, 4.985107421875, 5.1881103515625, 5.39111328125, 5.5941162109375, 5.797119140625, 6.0001220703125, 6.203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 23.0, 28.0, 76.0, 193.0, 279.0, 205.0, 119.0, 32.0, 15.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5028839111328, -132.88723754882812, -129.2716064453125, -125.65596008300781, -122.04031372070312, -118.42467498779297, -114.80903625488281, -111.19338989257812, -107.57774353027344, -103.96210479736328, -100.3464584350586, -96.73081970214844, -93.11517333984375, -89.4995346069336, -85.88389587402344, -82.26824951171875, -78.6526107788086, -75.03697204589844, -71.42132568359375, -67.8056869506836, -64.1900405883789, -60.57440185546875, -56.95875930786133, -53.343116760253906, -49.727474212646484, -46.11183166503906, -42.49618911743164, -38.88054656982422, -35.26490783691406, -31.649263381958008, -28.03362274169922, -24.417980194091797, -20.802337646484375, -17.186695098876953, -13.571053504943848, -9.955411911010742, -6.33976936340332, -2.7241268157958984, 0.8915138244628906, 4.5071563720703125, 8.122798919677734, 11.738441467285156, 15.354083061218262, 18.969724655151367, 22.58536720275879, 26.20100975036621, 29.816650390625, 33.43229293823242, 37.047935485839844, 40.663578033447266, 44.27922058105469, 47.894859313964844, 51.51050567626953, 55.12614440917969, 58.74178695678711, 62.35742950439453, 65.97306823730469, 69.58870697021484, 73.20435333251953, 76.81999206542969, 80.43563842773438, 84.05127716064453, 87.66691589355469, 91.28256225585938, 94.89820861816406]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 4.0, 8.0, 9.0, 6.0, 10.0, 8.0, 23.0, 21.0, 20.0, 24.0, 29.0, 21.0, 35.0, 34.0, 29.0, 46.0, 52.0, 45.0, 45.0, 59.0, 57.0, 56.0, 51.0, 38.0, 38.0, 21.0, 32.0, 19.0, 26.0, 20.0, 14.0, 27.0, 13.0, 8.0, 11.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-37.55016326904297, -36.526187896728516, -35.50221252441406, -34.478233337402344, -33.45425796508789, -32.43028259277344, -31.40630531311035, -30.382328033447266, -29.358352661132812, -28.33437728881836, -27.310400009155273, -26.286422729492188, -25.262447357177734, -24.23847198486328, -23.214494705200195, -22.19051742553711, -21.166542053222656, -20.142566680908203, -19.118589401245117, -18.09461212158203, -17.070636749267578, -16.046661376953125, -15.022684097290039, -13.99870777130127, -12.9747314453125, -11.95075511932373, -10.926778793334961, -9.902802467346191, -8.878826141357422, -7.854849815368652, -6.830873489379883, -5.806897163391113, -4.782924652099609, -3.75894832611084, -2.7349720001220703, -1.7109956741333008, -0.6870193481445312, 0.3369569778442383, 1.3609333038330078, 2.3849096298217773, 3.408885955810547, 4.432862281799316, 5.456838607788086, 6.4808149337768555, 7.504791259765625, 8.528767585754395, 9.552743911743164, 10.576720237731934, 11.600696563720703, 12.624672889709473, 13.648649215698242, 14.672625541687012, 15.696601867675781, 16.720577239990234, 17.74455451965332, 18.768531799316406, 19.79250717163086, 20.816482543945312, 21.8404598236084, 22.864437103271484, 23.888412475585938, 24.91238784790039, 25.936365127563477, 26.960342407226562, 27.984317779541016]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 15.0, 16.0, 34.0, 40.0, 67.0, 106.0, 174.0, 256.0, 410.0, 700.0, 1201.0, 1932.0, 3747.0, 7128.0, 14783.0, 33068.0, 79777.0, 211525.0, 365141.0, 195636.0, 73536.0, 30591.0, 13546.0, 6599.0, 3583.0, 1957.0, 1152.0, 663.0, 439.0, 253.0, 155.0, 97.0, 76.0, 48.0, 32.0, 14.0, 11.0, 6.0, 9.0, 5.0, 5.0, 1.0, 8.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.17425537109375, -4.0164794921875, -3.85870361328125, -3.700927734375, -3.54315185546875, -3.3853759765625, -3.22760009765625, -3.06982421875, -2.91204833984375, -2.7542724609375, -2.59649658203125, -2.438720703125, -2.28094482421875, -2.1231689453125, -1.96539306640625, -1.8076171875, -1.64984130859375, -1.4920654296875, -1.33428955078125, -1.176513671875, -1.01873779296875, -0.8609619140625, -0.70318603515625, -0.54541015625, -0.38763427734375, -0.2298583984375, -0.07208251953125, 0.085693359375, 0.24346923828125, 0.4012451171875, 0.55902099609375, 0.716796875, 0.87457275390625, 1.0323486328125, 1.19012451171875, 1.347900390625, 1.50567626953125, 1.6634521484375, 1.82122802734375, 1.97900390625, 2.13677978515625, 2.2945556640625, 2.45233154296875, 2.610107421875, 2.76788330078125, 2.9256591796875, 3.08343505859375, 3.2412109375, 3.39898681640625, 3.5567626953125, 3.71453857421875, 3.872314453125, 4.03009033203125, 4.1878662109375, 4.34564208984375, 4.50341796875, 4.66119384765625, 4.8189697265625, 4.97674560546875, 5.134521484375, 5.29229736328125, 5.4500732421875, 5.60784912109375, 5.765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 12.0, 7.0, 5.0, 10.0, 12.0, 12.0, 11.0, 14.0, 19.0, 18.0, 27.0, 29.0, 34.0, 35.0, 32.0, 36.0, 46.0, 47.0, 39.0, 46.0, 51.0, 44.0, 46.0, 41.0, 40.0, 38.0, 34.0, 37.0, 25.0, 29.0, 25.0, 21.0, 11.0, 12.0, 12.0, 7.0, 10.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.45880126953125, -2.3746337890625, -2.29046630859375, -2.206298828125, -2.12213134765625, -2.0379638671875, -1.95379638671875, -1.86962890625, -1.78546142578125, -1.7012939453125, -1.61712646484375, -1.532958984375, -1.44879150390625, -1.3646240234375, -1.28045654296875, -1.1962890625, -1.11212158203125, -1.0279541015625, -0.94378662109375, -0.859619140625, -0.77545166015625, -0.6912841796875, -0.60711669921875, -0.52294921875, -0.43878173828125, -0.3546142578125, -0.27044677734375, -0.186279296875, -0.10211181640625, -0.0179443359375, 0.06622314453125, 0.150390625, 0.23455810546875, 0.3187255859375, 0.40289306640625, 0.487060546875, 0.57122802734375, 0.6553955078125, 0.73956298828125, 0.82373046875, 0.90789794921875, 0.9920654296875, 1.07623291015625, 1.160400390625, 1.24456787109375, 1.3287353515625, 1.41290283203125, 1.4970703125, 1.58123779296875, 1.6654052734375, 1.74957275390625, 1.833740234375, 1.91790771484375, 2.0020751953125, 2.08624267578125, 2.17041015625, 2.25457763671875, 2.3387451171875, 2.42291259765625, 2.507080078125, 2.59124755859375, 2.6754150390625, 2.75958251953125, 2.84375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 21.0, 21.0, 20.0, 32.0, 52.0, 64.0, 89.0, 118.0, 181.0, 234.0, 348.0, 517.0, 852.0, 1511.0, 3357.0, 9597.0, 39474.0, 244896.0, 636710.0, 83077.0, 16998.0, 5139.0, 2126.0, 1083.0, 613.0, 433.0, 274.0, 195.0, 154.0, 103.0, 67.0, 59.0, 35.0, 28.0, 15.0, 17.0, 12.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6953125, -10.4000244140625, -10.104736328125, -9.8094482421875, -9.51416015625, -9.2188720703125, -8.923583984375, -8.6282958984375, -8.3330078125, -8.0377197265625, -7.742431640625, -7.4471435546875, -7.15185546875, -6.8565673828125, -6.561279296875, -6.2659912109375, -5.970703125, -5.6754150390625, -5.380126953125, -5.0848388671875, -4.78955078125, -4.4942626953125, -4.198974609375, -3.9036865234375, -3.6083984375, -3.3131103515625, -3.017822265625, -2.7225341796875, -2.42724609375, -2.1319580078125, -1.836669921875, -1.5413818359375, -1.24609375, -0.9508056640625, -0.655517578125, -0.3602294921875, -0.06494140625, 0.2303466796875, 0.525634765625, 0.8209228515625, 1.1162109375, 1.4114990234375, 1.706787109375, 2.0020751953125, 2.29736328125, 2.5926513671875, 2.887939453125, 3.1832275390625, 3.478515625, 3.7738037109375, 4.069091796875, 4.3643798828125, 4.65966796875, 4.9549560546875, 5.250244140625, 5.5455322265625, 5.8408203125, 6.1361083984375, 6.431396484375, 6.7266845703125, 7.02197265625, 7.3172607421875, 7.612548828125, 7.9078369140625, 8.203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 2.0, 9.0, 4.0, 12.0, 22.0, 14.0, 18.0, 20.0, 25.0, 21.0, 33.0, 28.0, 32.0, 47.0, 51.0, 48.0, 49.0, 50.0, 48.0, 49.0, 54.0, 43.0, 32.0, 33.0, 36.0, 31.0, 31.0, 23.0, 15.0, 15.0, 10.0, 8.0, 13.0, 15.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.828125, -10.5023193359375, -10.176513671875, -9.8507080078125, -9.52490234375, -9.1990966796875, -8.873291015625, -8.5474853515625, -8.2216796875, -7.8958740234375, -7.570068359375, -7.2442626953125, -6.91845703125, -6.5926513671875, -6.266845703125, -5.9410400390625, -5.615234375, -5.2894287109375, -4.963623046875, -4.6378173828125, -4.31201171875, -3.9862060546875, -3.660400390625, -3.3345947265625, -3.0087890625, -2.6829833984375, -2.357177734375, -2.0313720703125, -1.70556640625, -1.3797607421875, -1.053955078125, -0.7281494140625, -0.40234375, -0.0765380859375, 0.249267578125, 0.5750732421875, 0.90087890625, 1.2266845703125, 1.552490234375, 1.8782958984375, 2.2041015625, 2.5299072265625, 2.855712890625, 3.1815185546875, 3.50732421875, 3.8331298828125, 4.158935546875, 4.4847412109375, 4.810546875, 5.1363525390625, 5.462158203125, 5.7879638671875, 6.11376953125, 6.4395751953125, 6.765380859375, 7.0911865234375, 7.4169921875, 7.7427978515625, 8.068603515625, 8.3944091796875, 8.72021484375, 9.0460205078125, 9.371826171875, 9.6976318359375, 10.0234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 7.0, 12.0, 18.0, 15.0, 28.0, 46.0, 63.0, 95.0, 155.0, 265.0, 576.0, 1247.0, 3308.0, 10134.0, 41115.0, 238736.0, 640841.0, 84419.0, 18532.0, 5284.0, 1919.0, 800.0, 361.0, 183.0, 136.0, 81.0, 50.0, 31.0, 29.0, 11.0, 15.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.6331787109375, -3.530029296875, -3.4268798828125, -3.32373046875, -3.2205810546875, -3.117431640625, -3.0142822265625, -2.9111328125, -2.8079833984375, -2.704833984375, -2.6016845703125, -2.49853515625, -2.3953857421875, -2.292236328125, -2.1890869140625, -2.0859375, -1.9827880859375, -1.879638671875, -1.7764892578125, -1.67333984375, -1.5701904296875, -1.467041015625, -1.3638916015625, -1.2607421875, -1.1575927734375, -1.054443359375, -0.9512939453125, -0.84814453125, -0.7449951171875, -0.641845703125, -0.5386962890625, -0.435546875, -0.3323974609375, -0.229248046875, -0.1260986328125, -0.02294921875, 0.0802001953125, 0.183349609375, 0.2864990234375, 0.3896484375, 0.4927978515625, 0.595947265625, 0.6990966796875, 0.80224609375, 0.9053955078125, 1.008544921875, 1.1116943359375, 1.21484375, 1.3179931640625, 1.421142578125, 1.5242919921875, 1.62744140625, 1.7305908203125, 1.833740234375, 1.9368896484375, 2.0400390625, 2.1431884765625, 2.246337890625, 2.3494873046875, 2.45263671875, 2.5557861328125, 2.658935546875, 2.7620849609375, 2.865234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 4.0, 10.0, 5.0, 10.0, 12.0, 11.0, 8.0, 16.0, 35.0, 32.0, 41.0, 71.0, 145.0, 169.0, 130.0, 92.0, 36.0, 43.0, 28.0, 16.0, 14.0, 15.0, 9.0, 7.0, 4.0, 4.0, 5.0, 8.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.0011634379625320435, -0.001125246286392212, -0.0010870546102523804, -0.0010488629341125488, -0.0010106712579727173, -0.0009724795818328857, -0.0009342879056930542, -0.0008960962295532227, -0.0008579045534133911, -0.0008197128772735596, -0.000781521201133728, -0.0007433295249938965, -0.0007051378488540649, -0.0006669461727142334, -0.0006287544965744019, -0.0005905628204345703, -0.0005523711442947388, -0.0005141794681549072, -0.0004759877920150757, -0.00043779611587524414, -0.0003996044397354126, -0.00036141276359558105, -0.0003232210874557495, -0.00028502941131591797, -0.0002468377351760864, -0.00020864605903625488, -0.00017045438289642334, -0.0001322627067565918, -9.407103061676025e-05, -5.587935447692871e-05, -1.7687678337097168e-05, 2.0503997802734375e-05, 5.869567394256592e-05, 9.688735008239746e-05, 0.000135079026222229, 0.00017327070236206055, 0.0002114623785018921, 0.00024965405464172363, 0.0002878457307815552, 0.0003260374069213867, 0.00036422908306121826, 0.0004024207592010498, 0.00044061243534088135, 0.0004788041114807129, 0.0005169957876205444, 0.000555187463760376, 0.0005933791399002075, 0.0006315708160400391, 0.0006697624921798706, 0.0007079541683197021, 0.0007461458444595337, 0.0007843375205993652, 0.0008225291967391968, 0.0008607208728790283, 0.0008989125490188599, 0.0009371042251586914, 0.000975295901298523, 0.0010134875774383545, 0.001051679253578186, 0.0010898709297180176, 0.0011280626058578491, 0.0011662542819976807, 0.0012044459581375122, 0.0012426376342773438]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 6.0, 5.0, 7.0, 11.0, 15.0, 21.0, 31.0, 27.0, 50.0, 74.0, 127.0, 161.0, 277.0, 393.0, 700.0, 1149.0, 2015.0, 3911.0, 8274.0, 19927.0, 61058.0, 252284.0, 549106.0, 97271.0, 29100.0, 11257.0, 5088.0, 2558.0, 1403.0, 787.0, 506.0, 293.0, 192.0, 142.0, 98.0, 62.0, 48.0, 24.0, 16.0, 17.0, 17.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.63671875, -2.552154541015625, -2.46759033203125, -2.383026123046875, -2.2984619140625, -2.213897705078125, -2.12933349609375, -2.044769287109375, -1.960205078125, -1.875640869140625, -1.79107666015625, -1.706512451171875, -1.6219482421875, -1.537384033203125, -1.45281982421875, -1.368255615234375, -1.28369140625, -1.199127197265625, -1.11456298828125, -1.029998779296875, -0.9454345703125, -0.860870361328125, -0.77630615234375, -0.691741943359375, -0.607177734375, -0.522613525390625, -0.43804931640625, -0.353485107421875, -0.2689208984375, -0.184356689453125, -0.09979248046875, -0.015228271484375, 0.0693359375, 0.153900146484375, 0.23846435546875, 0.323028564453125, 0.4075927734375, 0.492156982421875, 0.57672119140625, 0.661285400390625, 0.745849609375, 0.830413818359375, 0.91497802734375, 0.999542236328125, 1.0841064453125, 1.168670654296875, 1.25323486328125, 1.337799072265625, 1.42236328125, 1.506927490234375, 1.59149169921875, 1.676055908203125, 1.7606201171875, 1.845184326171875, 1.92974853515625, 2.014312744140625, 2.098876953125, 2.183441162109375, 2.26800537109375, 2.352569580078125, 2.4371337890625, 2.521697998046875, 2.60626220703125, 2.690826416015625, 2.775390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 13.0, 14.0, 14.0, 13.0, 21.0, 35.0, 27.0, 45.0, 58.0, 54.0, 88.0, 84.0, 85.0, 82.0, 71.0, 56.0, 42.0, 35.0, 29.0, 20.0, 27.0, 12.0, 12.0, 12.0, 8.0, 12.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.689453125, -3.59991455078125, -3.5103759765625, -3.42083740234375, -3.331298828125, -3.24176025390625, -3.1522216796875, -3.06268310546875, -2.97314453125, -2.88360595703125, -2.7940673828125, -2.70452880859375, -2.614990234375, -2.52545166015625, -2.4359130859375, -2.34637451171875, -2.2568359375, -2.16729736328125, -2.0777587890625, -1.98822021484375, -1.898681640625, -1.80914306640625, -1.7196044921875, -1.63006591796875, -1.54052734375, -1.45098876953125, -1.3614501953125, -1.27191162109375, -1.182373046875, -1.09283447265625, -1.0032958984375, -0.91375732421875, -0.82421875, -0.73468017578125, -0.6451416015625, -0.55560302734375, -0.466064453125, -0.37652587890625, -0.2869873046875, -0.19744873046875, -0.10791015625, -0.01837158203125, 0.0711669921875, 0.16070556640625, 0.250244140625, 0.33978271484375, 0.4293212890625, 0.51885986328125, 0.6083984375, 0.69793701171875, 0.7874755859375, 0.87701416015625, 0.966552734375, 1.05609130859375, 1.1456298828125, 1.23516845703125, 1.32470703125, 1.41424560546875, 1.5037841796875, 1.59332275390625, 1.682861328125, 1.77239990234375, 1.8619384765625, 1.95147705078125, 2.041015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 19.0, 26.0, 54.0, 49.0, 92.0, 160.0, 185.0, 116.0, 83.0, 59.0, 43.0, 27.0, 22.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.665138244628906, -52.0051155090332, -50.3450927734375, -48.6850700378418, -47.025047302246094, -45.365020751953125, -43.70499801635742, -42.04497528076172, -40.384952545166016, -38.72492980957031, -37.06490707397461, -35.404884338378906, -33.74485778808594, -32.0848388671875, -30.42481231689453, -28.764789581298828, -27.104766845703125, -25.444744110107422, -23.78472137451172, -22.124696731567383, -20.46467399597168, -18.804651260375977, -17.14462661743164, -15.484603881835938, -13.824581146240234, -12.164558410644531, -10.504534721374512, -8.844511032104492, -7.184488296508789, -5.524465560913086, -3.8644418716430664, -2.204418182373047, -0.5443954467773438, 1.1156277656555176, 2.775650978088379, 4.43567419052124, 6.095697402954102, 7.755720138549805, 9.415743827819824, 11.075767517089844, 12.735790252685547, 14.39581298828125, 16.055835723876953, 17.71586036682129, 19.375883102416992, 21.035905838012695, 22.69593048095703, 24.355953216552734, 26.015975952148438, 27.67599868774414, 29.336021423339844, 30.99604606628418, 32.65606689453125, 34.31609344482422, 35.97611618041992, 37.636138916015625, 39.29616165161133, 40.95618438720703, 42.616207122802734, 44.27622985839844, 45.936256408691406, 47.596275329589844, 49.25630187988281, 50.916324615478516, 52.57634735107422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 13.0, 10.0, 16.0, 16.0, 25.0, 15.0, 12.0, 25.0, 24.0, 33.0, 40.0, 40.0, 50.0, 54.0, 80.0, 77.0, 71.0, 53.0, 39.0, 46.0, 34.0, 32.0, 28.0, 20.0, 32.0, 21.0, 13.0, 12.0, 14.0, 15.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.35382080078125, -46.90304946899414, -45.45227813720703, -44.001502990722656, -42.55073165893555, -41.09996032714844, -39.64918899536133, -38.19841766357422, -36.747642517089844, -35.296871185302734, -33.846099853515625, -32.39532470703125, -30.94455337524414, -29.49378204345703, -28.043010711669922, -26.59223747253418, -25.14146614074707, -23.69069480895996, -22.23992156982422, -20.78915023803711, -19.338376998901367, -17.887605667114258, -16.436832427978516, -14.986061096191406, -13.53528881072998, -12.084516525268555, -10.633744239807129, -9.182971954345703, -7.7322001457214355, -6.28142786026001, -4.830656051635742, -3.3798837661743164, -1.9291114807128906, -0.4783393144607544, 0.9724328517913818, 2.4232048988342285, 3.8739771842956543, 5.32474946975708, 6.775521278381348, 8.226293563842773, 9.6770658493042, 11.127838134765625, 12.57861042022705, 14.029382705688477, 15.480154037475586, 16.930927276611328, 18.381698608398438, 19.832469940185547, 21.28324317932129, 22.7340145111084, 24.18478775024414, 25.63555908203125, 27.086332321166992, 28.5371036529541, 29.987876892089844, 31.438648223876953, 32.88941955566406, 34.34019088745117, 35.79096221923828, 37.241737365722656, 38.692508697509766, 40.143280029296875, 41.594051361083984, 43.044822692871094, 44.49559783935547]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 12.0, 3.0, 16.0, 21.0, 34.0, 54.0, 76.0, 175.0, 272.0, 569.0, 1206.0, 3064.0, 8897.0, 33097.0, 281033.0, 3308751.0, 493363.0, 45406.0, 11478.0, 3864.0, 1457.0, 686.0, 315.0, 155.0, 96.0, 65.0, 34.0, 23.0, 17.0, 12.0, 5.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9765625, -6.785888671875, -6.59521484375, -6.404541015625, -6.2138671875, -6.023193359375, -5.83251953125, -5.641845703125, -5.451171875, -5.260498046875, -5.06982421875, -4.879150390625, -4.6884765625, -4.497802734375, -4.30712890625, -4.116455078125, -3.92578125, -3.735107421875, -3.54443359375, -3.353759765625, -3.1630859375, -2.972412109375, -2.78173828125, -2.591064453125, -2.400390625, -2.209716796875, -2.01904296875, -1.828369140625, -1.6376953125, -1.447021484375, -1.25634765625, -1.065673828125, -0.875, -0.684326171875, -0.49365234375, -0.302978515625, -0.1123046875, 0.078369140625, 0.26904296875, 0.459716796875, 0.650390625, 0.841064453125, 1.03173828125, 1.222412109375, 1.4130859375, 1.603759765625, 1.79443359375, 1.985107421875, 2.17578125, 2.366455078125, 2.55712890625, 2.747802734375, 2.9384765625, 3.129150390625, 3.31982421875, 3.510498046875, 3.701171875, 3.891845703125, 4.08251953125, 4.273193359375, 4.4638671875, 4.654541015625, 4.84521484375, 5.035888671875, 5.2265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 5.0, 11.0, 8.0, 9.0, 16.0, 9.0, 14.0, 15.0, 28.0, 28.0, 35.0, 43.0, 52.0, 43.0, 47.0, 46.0, 47.0, 56.0, 51.0, 50.0, 50.0, 45.0, 42.0, 34.0, 45.0, 25.0, 23.0, 20.0, 18.0, 26.0, 15.0, 11.0, 13.0, 13.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.899993896484375, -2.81170654296875, -2.723419189453125, -2.6351318359375, -2.546844482421875, -2.45855712890625, -2.370269775390625, -2.281982421875, -2.193695068359375, -2.10540771484375, -2.017120361328125, -1.9288330078125, -1.840545654296875, -1.75225830078125, -1.663970947265625, -1.57568359375, -1.487396240234375, -1.39910888671875, -1.310821533203125, -1.2225341796875, -1.134246826171875, -1.04595947265625, -0.957672119140625, -0.869384765625, -0.781097412109375, -0.69281005859375, -0.604522705078125, -0.5162353515625, -0.427947998046875, -0.33966064453125, -0.251373291015625, -0.1630859375, -0.074798583984375, 0.01348876953125, 0.101776123046875, 0.1900634765625, 0.278350830078125, 0.36663818359375, 0.454925537109375, 0.543212890625, 0.631500244140625, 0.71978759765625, 0.808074951171875, 0.8963623046875, 0.984649658203125, 1.07293701171875, 1.161224365234375, 1.24951171875, 1.337799072265625, 1.42608642578125, 1.514373779296875, 1.6026611328125, 1.690948486328125, 1.77923583984375, 1.867523193359375, 1.955810546875, 2.044097900390625, 2.13238525390625, 2.220672607421875, 2.3089599609375, 2.397247314453125, 2.48553466796875, 2.573822021484375, 2.662109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 16.0, 11.0, 26.0, 21.0, 34.0, 54.0, 103.0, 145.0, 242.0, 726.0, 2290.0, 13604.0, 219988.0, 3861204.0, 85613.0, 7681.0, 1445.0, 456.0, 206.0, 101.0, 67.0, 47.0, 28.0, 34.0, 22.0, 27.0, 19.0, 11.0, 9.0, 2.0, 6.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.312255859375, -10.91357421875, -10.514892578125, -10.1162109375, -9.717529296875, -9.31884765625, -8.920166015625, -8.521484375, -8.122802734375, -7.72412109375, -7.325439453125, -6.9267578125, -6.528076171875, -6.12939453125, -5.730712890625, -5.33203125, -4.933349609375, -4.53466796875, -4.135986328125, -3.7373046875, -3.338623046875, -2.93994140625, -2.541259765625, -2.142578125, -1.743896484375, -1.34521484375, -0.946533203125, -0.5478515625, -0.149169921875, 0.24951171875, 0.648193359375, 1.046875, 1.445556640625, 1.84423828125, 2.242919921875, 2.6416015625, 3.040283203125, 3.43896484375, 3.837646484375, 4.236328125, 4.635009765625, 5.03369140625, 5.432373046875, 5.8310546875, 6.229736328125, 6.62841796875, 7.027099609375, 7.42578125, 7.824462890625, 8.22314453125, 8.621826171875, 9.0205078125, 9.419189453125, 9.81787109375, 10.216552734375, 10.615234375, 11.013916015625, 11.41259765625, 11.811279296875, 12.2099609375, 12.608642578125, 13.00732421875, 13.406005859375, 13.8046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 5.0, 5.0, 6.0, 7.0, 12.0, 19.0, 16.0, 26.0, 38.0, 49.0, 96.0, 125.0, 220.0, 396.0, 670.0, 877.0, 597.0, 368.0, 175.0, 103.0, 82.0, 54.0, 37.0, 19.0, 15.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.36614990234375, -5.1619873046875, -4.95782470703125, -4.753662109375, -4.54949951171875, -4.3453369140625, -4.14117431640625, -3.93701171875, -3.73284912109375, -3.5286865234375, -3.32452392578125, -3.120361328125, -2.91619873046875, -2.7120361328125, -2.50787353515625, -2.3037109375, -2.09954833984375, -1.8953857421875, -1.69122314453125, -1.487060546875, -1.28289794921875, -1.0787353515625, -0.87457275390625, -0.67041015625, -0.46624755859375, -0.2620849609375, -0.05792236328125, 0.146240234375, 0.35040283203125, 0.5545654296875, 0.75872802734375, 0.962890625, 1.16705322265625, 1.3712158203125, 1.57537841796875, 1.779541015625, 1.98370361328125, 2.1878662109375, 2.39202880859375, 2.59619140625, 2.80035400390625, 3.0045166015625, 3.20867919921875, 3.412841796875, 3.61700439453125, 3.8211669921875, 4.02532958984375, 4.2294921875, 4.43365478515625, 4.6378173828125, 4.84197998046875, 5.046142578125, 5.25030517578125, 5.4544677734375, 5.65863037109375, 5.86279296875, 6.06695556640625, 6.2711181640625, 6.47528076171875, 6.679443359375, 6.88360595703125, 7.0877685546875, 7.29193115234375, 7.49609375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 20.0, 54.0, 133.0, 261.0, 261.0, 147.0, 55.0, 26.0, 15.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.48782348632812, -102.0858383178711, -98.68384552001953, -95.2818603515625, -91.87986755371094, -88.4778823852539, -85.07589721679688, -81.67390441894531, -78.27191162109375, -74.86992645263672, -71.46793365478516, -68.06594848632812, -64.66395568847656, -61.26197052001953, -57.859981536865234, -54.45799255371094, -51.056007385253906, -47.65401840209961, -44.25202941894531, -40.85004425048828, -37.44805145263672, -34.04606628417969, -30.64407730102539, -27.242088317871094, -23.840099334716797, -20.4381103515625, -17.036121368408203, -13.634134292602539, -10.232145309448242, -6.830156326293945, -3.4281692504882812, -0.026180267333984375, 3.3758087158203125, 6.777797222137451, 10.17978572845459, 13.58177375793457, 16.983762741088867, 20.385751724243164, 23.787738800048828, 27.189727783203125, 30.591716766357422, 33.99370574951172, 37.395694732666016, 40.79768371582031, 44.199668884277344, 47.601661682128906, 51.00364685058594, 54.405635833740234, 57.80762481689453, 61.20961380004883, 64.61160278320312, 68.01358795166016, 71.41558074951172, 74.81756591796875, 78.21955871582031, 81.62154388427734, 85.02352905273438, 88.4255142211914, 91.82750701904297, 95.2294921875, 98.63148498535156, 102.0334701538086, 105.43545532226562, 108.83744812011719, 112.23944091796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 10.0, 10.0, 12.0, 15.0, 21.0, 25.0, 21.0, 30.0, 51.0, 52.0, 53.0, 48.0, 59.0, 57.0, 60.0, 56.0, 56.0, 61.0, 51.0, 47.0, 36.0, 24.0, 27.0, 20.0, 21.0, 18.0, 12.0, 2.0, 8.0, 9.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31557846069336, -28.257265090942383, -27.198951721191406, -26.140636444091797, -25.08232307434082, -24.024009704589844, -22.965694427490234, -21.907381057739258, -20.84906768798828, -19.790754318237305, -18.732440948486328, -17.67412567138672, -16.615812301635742, -15.557498931884766, -14.499184608459473, -13.44087028503418, -12.382556915283203, -11.324243545532227, -10.265929222106934, -9.20761489868164, -8.149301528930664, -7.090987682342529, -6.0326738357543945, -4.97435998916626, -3.916046142578125, -2.8577322959899902, -1.7994184494018555, -0.7411046028137207, 0.31720924377441406, 1.3755230903625488, 2.4338369369506836, 3.4921507835388184, 4.550464630126953, 5.608778476715088, 6.667092323303223, 7.725406169891357, 8.783720016479492, 9.842033386230469, 10.900347709655762, 11.958662033081055, 13.016975402832031, 14.075288772583008, 15.1336030960083, 16.191917419433594, 17.25023078918457, 18.308544158935547, 19.366859436035156, 20.425172805786133, 21.48348617553711, 22.541799545288086, 23.600112915039062, 24.658428192138672, 25.71674156188965, 26.775054931640625, 27.833370208740234, 28.89168357849121, 29.949996948242188, 31.008310317993164, 32.06662368774414, 33.12493896484375, 34.183250427246094, 35.2415657043457, 36.29988098144531, 37.358192443847656, 38.416507720947266]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 10.0, 21.0, 31.0, 67.0, 86.0, 183.0, 298.0, 562.0, 980.0, 2008.0, 4818.0, 11942.0, 38835.0, 152411.0, 435478.0, 290337.0, 75591.0, 21334.0, 7269.0, 3167.0, 1407.0, 748.0, 425.0, 226.0, 108.0, 74.0, 29.0, 28.0, 18.0, 14.0, 10.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.945556640625, -5.75830078125, -5.571044921875, -5.3837890625, -5.196533203125, -5.00927734375, -4.822021484375, -4.634765625, -4.447509765625, -4.26025390625, -4.072998046875, -3.8857421875, -3.698486328125, -3.51123046875, -3.323974609375, -3.13671875, -2.949462890625, -2.76220703125, -2.574951171875, -2.3876953125, -2.200439453125, -2.01318359375, -1.825927734375, -1.638671875, -1.451416015625, -1.26416015625, -1.076904296875, -0.8896484375, -0.702392578125, -0.51513671875, -0.327880859375, -0.140625, 0.046630859375, 0.23388671875, 0.421142578125, 0.6083984375, 0.795654296875, 0.98291015625, 1.170166015625, 1.357421875, 1.544677734375, 1.73193359375, 1.919189453125, 2.1064453125, 2.293701171875, 2.48095703125, 2.668212890625, 2.85546875, 3.042724609375, 3.22998046875, 3.417236328125, 3.6044921875, 3.791748046875, 3.97900390625, 4.166259765625, 4.353515625, 4.540771484375, 4.72802734375, 4.915283203125, 5.1025390625, 5.289794921875, 5.47705078125, 5.664306640625, 5.8515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 6.0, 7.0, 10.0, 10.0, 16.0, 15.0, 20.0, 31.0, 31.0, 27.0, 39.0, 48.0, 36.0, 41.0, 32.0, 49.0, 51.0, 44.0, 47.0, 37.0, 38.0, 38.0, 41.0, 39.0, 29.0, 28.0, 27.0, 23.0, 30.0, 16.0, 16.0, 16.0, 16.0, 8.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0078125, -2.923065185546875, -2.83831787109375, -2.753570556640625, -2.6688232421875, -2.584075927734375, -2.49932861328125, -2.414581298828125, -2.329833984375, -2.245086669921875, -2.16033935546875, -2.075592041015625, -1.9908447265625, -1.906097412109375, -1.82135009765625, -1.736602783203125, -1.65185546875, -1.567108154296875, -1.48236083984375, -1.397613525390625, -1.3128662109375, -1.228118896484375, -1.14337158203125, -1.058624267578125, -0.973876953125, -0.889129638671875, -0.80438232421875, -0.719635009765625, -0.6348876953125, -0.550140380859375, -0.46539306640625, -0.380645751953125, -0.2958984375, -0.211151123046875, -0.12640380859375, -0.041656494140625, 0.0430908203125, 0.127838134765625, 0.21258544921875, 0.297332763671875, 0.382080078125, 0.466827392578125, 0.55157470703125, 0.636322021484375, 0.7210693359375, 0.805816650390625, 0.89056396484375, 0.975311279296875, 1.06005859375, 1.144805908203125, 1.22955322265625, 1.314300537109375, 1.3990478515625, 1.483795166015625, 1.56854248046875, 1.653289794921875, 1.738037109375, 1.822784423828125, 1.90753173828125, 1.992279052734375, 2.0770263671875, 2.161773681640625, 2.24652099609375, 2.331268310546875, 2.416015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 13.0, 34.0, 28.0, 53.0, 82.0, 127.0, 210.0, 342.0, 649.0, 1312.0, 2811.0, 7522.0, 27042.0, 140306.0, 644818.0, 175272.0, 32871.0, 8722.0, 3174.0, 1434.0, 727.0, 371.0, 219.0, 131.0, 87.0, 51.0, 32.0, 23.0, 28.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9375, -6.71051025390625, -6.4835205078125, -6.25653076171875, -6.029541015625, -5.80255126953125, -5.5755615234375, -5.34857177734375, -5.12158203125, -4.89459228515625, -4.6676025390625, -4.44061279296875, -4.213623046875, -3.98663330078125, -3.7596435546875, -3.53265380859375, -3.3056640625, -3.07867431640625, -2.8516845703125, -2.62469482421875, -2.397705078125, -2.17071533203125, -1.9437255859375, -1.71673583984375, -1.48974609375, -1.26275634765625, -1.0357666015625, -0.80877685546875, -0.581787109375, -0.35479736328125, -0.1278076171875, 0.09918212890625, 0.326171875, 0.55316162109375, 0.7801513671875, 1.00714111328125, 1.234130859375, 1.46112060546875, 1.6881103515625, 1.91510009765625, 2.14208984375, 2.36907958984375, 2.5960693359375, 2.82305908203125, 3.050048828125, 3.27703857421875, 3.5040283203125, 3.73101806640625, 3.9580078125, 4.18499755859375, 4.4119873046875, 4.63897705078125, 4.865966796875, 5.09295654296875, 5.3199462890625, 5.54693603515625, 5.77392578125, 6.00091552734375, 6.2279052734375, 6.45489501953125, 6.681884765625, 6.90887451171875, 7.1358642578125, 7.36285400390625, 7.58984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 7.0, 8.0, 6.0, 18.0, 16.0, 24.0, 25.0, 35.0, 42.0, 30.0, 51.0, 51.0, 53.0, 60.0, 58.0, 67.0, 51.0, 39.0, 56.0, 40.0, 39.0, 35.0, 40.0, 23.0, 19.0, 26.0, 12.0, 9.0, 21.0, 8.0, 4.0, 2.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5545654296875, -11.202880859375, -10.8511962890625, -10.49951171875, -10.1478271484375, -9.796142578125, -9.4444580078125, -9.0927734375, -8.7410888671875, -8.389404296875, -8.0377197265625, -7.68603515625, -7.3343505859375, -6.982666015625, -6.6309814453125, -6.279296875, -5.9276123046875, -5.575927734375, -5.2242431640625, -4.87255859375, -4.5208740234375, -4.169189453125, -3.8175048828125, -3.4658203125, -3.1141357421875, -2.762451171875, -2.4107666015625, -2.05908203125, -1.7073974609375, -1.355712890625, -1.0040283203125, -0.65234375, -0.3006591796875, 0.051025390625, 0.4027099609375, 0.75439453125, 1.1060791015625, 1.457763671875, 1.8094482421875, 2.1611328125, 2.5128173828125, 2.864501953125, 3.2161865234375, 3.56787109375, 3.9195556640625, 4.271240234375, 4.6229248046875, 4.974609375, 5.3262939453125, 5.677978515625, 6.0296630859375, 6.38134765625, 6.7330322265625, 7.084716796875, 7.4364013671875, 7.7880859375, 8.1397705078125, 8.491455078125, 8.8431396484375, 9.19482421875, 9.5465087890625, 9.898193359375, 10.2498779296875, 10.6015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 12.0, 8.0, 21.0, 32.0, 35.0, 63.0, 102.0, 159.0, 253.0, 416.0, 804.0, 1399.0, 2894.0, 5766.0, 12863.0, 32104.0, 90996.0, 418502.0, 336029.0, 90100.0, 31527.0, 12667.0, 5673.0, 2778.0, 1446.0, 763.0, 473.0, 235.0, 148.0, 93.0, 44.0, 50.0, 26.0, 15.0, 16.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.962890625, -1.90679931640625, -1.8507080078125, -1.79461669921875, -1.738525390625, -1.68243408203125, -1.6263427734375, -1.57025146484375, -1.51416015625, -1.45806884765625, -1.4019775390625, -1.34588623046875, -1.289794921875, -1.23370361328125, -1.1776123046875, -1.12152099609375, -1.0654296875, -1.00933837890625, -0.9532470703125, -0.89715576171875, -0.841064453125, -0.78497314453125, -0.7288818359375, -0.67279052734375, -0.61669921875, -0.56060791015625, -0.5045166015625, -0.44842529296875, -0.392333984375, -0.33624267578125, -0.2801513671875, -0.22406005859375, -0.16796875, -0.11187744140625, -0.0557861328125, 0.00030517578125, 0.056396484375, 0.11248779296875, 0.1685791015625, 0.22467041015625, 0.28076171875, 0.33685302734375, 0.3929443359375, 0.44903564453125, 0.505126953125, 0.56121826171875, 0.6173095703125, 0.67340087890625, 0.7294921875, 0.78558349609375, 0.8416748046875, 0.89776611328125, 0.953857421875, 1.00994873046875, 1.0660400390625, 1.12213134765625, 1.17822265625, 1.23431396484375, 1.2904052734375, 1.34649658203125, 1.402587890625, 1.45867919921875, 1.5147705078125, 1.57086181640625, 1.626953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 8.0, 2.0, 10.0, 14.0, 17.0, 12.0, 22.0, 54.0, 76.0, 91.0, 146.0, 146.0, 112.0, 93.0, 55.0, 44.0, 27.0, 20.0, 8.0, 11.0, 5.0, 5.0, 9.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009098052978515625, -0.0008807331323623657, -0.0008516609668731689, -0.0008225888013839722, -0.0007935166358947754, -0.0007644444704055786, -0.0007353723049163818, -0.0007063001394271851, -0.0006772279739379883, -0.0006481558084487915, -0.0006190836429595947, -0.000590011477470398, -0.0005609393119812012, -0.0005318671464920044, -0.0005027949810028076, -0.00047372281551361084, -0.00044465065002441406, -0.0004155784845352173, -0.0003865063190460205, -0.00035743415355682373, -0.00032836198806762695, -0.0002992898225784302, -0.0002702176570892334, -0.00024114549160003662, -0.00021207332611083984, -0.00018300116062164307, -0.0001539289951324463, -0.0001248568296432495, -9.578466415405273e-05, -6.671249866485596e-05, -3.764033317565918e-05, -8.568167686462402e-06, 2.0503997802734375e-05, 4.957616329193115e-05, 7.864832878112793e-05, 0.00010772049427032471, 0.00013679265975952148, 0.00016586482524871826, 0.00019493699073791504, 0.00022400915622711182, 0.0002530813217163086, 0.00028215348720550537, 0.00031122565269470215, 0.0003402978181838989, 0.0003693699836730957, 0.0003984421491622925, 0.00042751431465148926, 0.00045658648014068604, 0.0004856586456298828, 0.0005147308111190796, 0.0005438029766082764, 0.0005728751420974731, 0.0006019473075866699, 0.0006310194730758667, 0.0006600916385650635, 0.0006891638040542603, 0.000718235969543457, 0.0007473081350326538, 0.0007763803005218506, 0.0008054524660110474, 0.0008345246315002441, 0.0008635967969894409, 0.0008926689624786377, 0.0009217411279678345, 0.0009508132934570312]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 14.0, 14.0, 26.0, 53.0, 88.0, 173.0, 361.0, 704.0, 1642.0, 4646.0, 14760.0, 57730.0, 285811.0, 566907.0, 85566.0, 20195.0, 6002.0, 2136.0, 885.0, 432.0, 193.0, 87.0, 62.0, 28.0, 17.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.5595703125, -2.474609375, -2.3896484375, -2.3046875, -2.2197265625, -2.134765625, -2.0498046875, -1.96484375, -1.8798828125, -1.794921875, -1.7099609375, -1.625, -1.5400390625, -1.455078125, -1.3701171875, -1.28515625, -1.2001953125, -1.115234375, -1.0302734375, -0.9453125, -0.8603515625, -0.775390625, -0.6904296875, -0.60546875, -0.5205078125, -0.435546875, -0.3505859375, -0.265625, -0.1806640625, -0.095703125, -0.0107421875, 0.07421875, 0.1591796875, 0.244140625, 0.3291015625, 0.4140625, 0.4990234375, 0.583984375, 0.6689453125, 0.75390625, 0.8388671875, 0.923828125, 1.0087890625, 1.09375, 1.1787109375, 1.263671875, 1.3486328125, 1.43359375, 1.5185546875, 1.603515625, 1.6884765625, 1.7734375, 1.8583984375, 1.943359375, 2.0283203125, 2.11328125, 2.1982421875, 2.283203125, 2.3681640625, 2.453125, 2.5380859375, 2.623046875, 2.7080078125, 2.79296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 16.0, 13.0, 22.0, 16.0, 27.0, 31.0, 39.0, 55.0, 54.0, 84.0, 79.0, 72.0, 86.0, 74.0, 72.0, 59.0, 32.0, 28.0, 26.0, 18.0, 15.0, 17.0, 10.0, 8.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.078094482421875, -2.00775146484375, -1.937408447265625, -1.8670654296875, -1.796722412109375, -1.72637939453125, -1.656036376953125, -1.585693359375, -1.515350341796875, -1.44500732421875, -1.374664306640625, -1.3043212890625, -1.233978271484375, -1.16363525390625, -1.093292236328125, -1.02294921875, -0.952606201171875, -0.88226318359375, -0.811920166015625, -0.7415771484375, -0.671234130859375, -0.60089111328125, -0.530548095703125, -0.460205078125, -0.389862060546875, -0.31951904296875, -0.249176025390625, -0.1788330078125, -0.108489990234375, -0.03814697265625, 0.032196044921875, 0.1025390625, 0.172882080078125, 0.24322509765625, 0.313568115234375, 0.3839111328125, 0.454254150390625, 0.52459716796875, 0.594940185546875, 0.665283203125, 0.735626220703125, 0.80596923828125, 0.876312255859375, 0.9466552734375, 1.016998291015625, 1.08734130859375, 1.157684326171875, 1.22802734375, 1.298370361328125, 1.36871337890625, 1.439056396484375, 1.5093994140625, 1.579742431640625, 1.65008544921875, 1.720428466796875, 1.790771484375, 1.861114501953125, 1.93145751953125, 2.001800537109375, 2.0721435546875, 2.142486572265625, 2.21282958984375, 2.283172607421875, 2.353515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 20.0, 32.0, 82.0, 126.0, 257.0, 263.0, 107.0, 48.0, 18.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.70498657226562, -81.24508666992188, -78.7851791381836, -76.32527923583984, -73.86537170410156, -71.40547180175781, -68.94557189941406, -66.48567199707031, -64.02576446533203, -61.565860748291016, -59.10595703125, -56.64605712890625, -54.186153411865234, -51.72624969482422, -49.26634979248047, -46.80644607543945, -44.34654235839844, -41.88663864135742, -39.426734924316406, -36.966835021972656, -34.50693130493164, -32.047027587890625, -29.587125778198242, -27.12722396850586, -24.667320251464844, -22.207416534423828, -19.747514724731445, -17.287612915039062, -14.827709197998047, -12.367806434631348, -9.907903671264648, -7.448001861572266, -4.98809814453125, -2.528195381164551, -0.06829261779785156, 2.3916101455688477, 4.851512908935547, 7.311415672302246, 9.771318435668945, 12.231220245361328, 14.691123962402344, 17.15102767944336, 19.610929489135742, 22.070831298828125, 24.53073501586914, 26.990638732910156, 29.45054054260254, 31.910442352294922, 34.37034606933594, 36.83024978637695, 39.29015350341797, 41.75005340576172, 44.209957122802734, 46.66986083984375, 49.1297607421875, 51.589664459228516, 54.04956817626953, 56.50947189331055, 58.96937561035156, 61.42927551269531, 63.88917922973633, 66.34908294677734, 68.8089828491211, 71.26889038085938, 73.72879028320312]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 14.0, 5.0, 14.0, 12.0, 15.0, 15.0, 25.0, 20.0, 20.0, 32.0, 28.0, 30.0, 28.0, 38.0, 45.0, 57.0, 61.0, 60.0, 74.0, 43.0, 33.0, 40.0, 27.0, 28.0, 22.0, 14.0, 15.0, 18.0, 18.0, 19.0, 9.0, 18.0, 9.0, 10.0, 10.0, 9.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.554216384887695, -30.53770637512207, -29.521196365356445, -28.50468635559082, -27.488174438476562, -26.471664428710938, -25.455154418945312, -24.438644409179688, -23.422134399414062, -22.405624389648438, -21.389114379882812, -20.372604370117188, -19.356094360351562, -18.339584350585938, -17.32307243347168, -16.306562423706055, -15.29005241394043, -14.273542404174805, -13.25703239440918, -12.240521430969238, -11.224011421203613, -10.207501411437988, -9.190990447998047, -8.174480438232422, -7.157970428466797, -6.141460418701172, -5.124949932098389, -4.1084394454956055, -3.0919294357299805, -2.0754194259643555, -1.0589089393615723, -0.04239845275878906, 0.9741096496582031, 1.9906198978424072, 3.0071301460266113, 4.0236406326293945, 5.0401506423950195, 6.0566606521606445, 7.073171138763428, 8.089681625366211, 9.106191635131836, 10.122701644897461, 11.139211654663086, 12.155722618103027, 13.172232627868652, 14.188742637634277, 15.205253601074219, 16.221763610839844, 17.23827362060547, 18.254783630371094, 19.27129364013672, 20.287803649902344, 21.30431365966797, 22.320823669433594, 23.33733558654785, 24.353845596313477, 25.3703556060791, 26.386865615844727, 27.40337562561035, 28.419885635375977, 29.436397552490234, 30.45290756225586, 31.469417572021484, 32.48592758178711, 33.502437591552734]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 8.0, 8.0, 11.0, 15.0, 24.0, 43.0, 80.0, 172.0, 495.0, 1246.0, 4243.0, 18424.0, 206570.0, 3630039.0, 302969.0, 22544.0, 4852.0, 1489.0, 529.0, 241.0, 119.0, 54.0, 38.0, 17.0, 12.0, 16.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.171875, -8.91387939453125, -8.6558837890625, -8.39788818359375, -8.139892578125, -7.88189697265625, -7.6239013671875, -7.36590576171875, -7.10791015625, -6.84991455078125, -6.5919189453125, -6.33392333984375, -6.075927734375, -5.81793212890625, -5.5599365234375, -5.30194091796875, -5.0439453125, -4.78594970703125, -4.5279541015625, -4.26995849609375, -4.011962890625, -3.75396728515625, -3.4959716796875, -3.23797607421875, -2.97998046875, -2.72198486328125, -2.4639892578125, -2.20599365234375, -1.947998046875, -1.69000244140625, -1.4320068359375, -1.17401123046875, -0.916015625, -0.65802001953125, -0.4000244140625, -0.14202880859375, 0.115966796875, 0.37396240234375, 0.6319580078125, 0.88995361328125, 1.14794921875, 1.40594482421875, 1.6639404296875, 1.92193603515625, 2.179931640625, 2.43792724609375, 2.6959228515625, 2.95391845703125, 3.2119140625, 3.46990966796875, 3.7279052734375, 3.98590087890625, 4.243896484375, 4.50189208984375, 4.7598876953125, 5.01788330078125, 5.27587890625, 5.53387451171875, 5.7918701171875, 6.04986572265625, 6.307861328125, 6.56585693359375, 6.8238525390625, 7.08184814453125, 7.33984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 7.0, 9.0, 15.0, 6.0, 17.0, 16.0, 17.0, 27.0, 28.0, 29.0, 34.0, 38.0, 49.0, 44.0, 45.0, 57.0, 51.0, 50.0, 48.0, 45.0, 46.0, 47.0, 35.0, 35.0, 35.0, 27.0, 27.0, 20.0, 15.0, 15.0, 13.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.015625, -2.927154541015625, -2.83868408203125, -2.750213623046875, -2.6617431640625, -2.573272705078125, -2.48480224609375, -2.396331787109375, -2.307861328125, -2.219390869140625, -2.13092041015625, -2.042449951171875, -1.9539794921875, -1.865509033203125, -1.77703857421875, -1.688568115234375, -1.60009765625, -1.511627197265625, -1.42315673828125, -1.334686279296875, -1.2462158203125, -1.157745361328125, -1.06927490234375, -0.980804443359375, -0.892333984375, -0.803863525390625, -0.71539306640625, -0.626922607421875, -0.5384521484375, -0.449981689453125, -0.36151123046875, -0.273040771484375, -0.1845703125, -0.096099853515625, -0.00762939453125, 0.080841064453125, 0.1693115234375, 0.257781982421875, 0.34625244140625, 0.434722900390625, 0.523193359375, 0.611663818359375, 0.70013427734375, 0.788604736328125, 0.8770751953125, 0.965545654296875, 1.05401611328125, 1.142486572265625, 1.23095703125, 1.319427490234375, 1.40789794921875, 1.496368408203125, 1.5848388671875, 1.673309326171875, 1.76177978515625, 1.850250244140625, 1.938720703125, 2.027191162109375, 2.11566162109375, 2.204132080078125, 2.2926025390625, 2.381072998046875, 2.46954345703125, 2.558013916015625, 2.646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 26.0, 36.0, 82.0, 182.0, 360.0, 1084.0, 9929.0, 2751260.0, 1421442.0, 8182.0, 980.0, 349.0, 155.0, 97.0, 48.0, 25.0, 18.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.913818359375, -17.24951171875, -16.585205078125, -15.9208984375, -15.256591796875, -14.59228515625, -13.927978515625, -13.263671875, -12.599365234375, -11.93505859375, -11.270751953125, -10.6064453125, -9.942138671875, -9.27783203125, -8.613525390625, -7.94921875, -7.284912109375, -6.62060546875, -5.956298828125, -5.2919921875, -4.627685546875, -3.96337890625, -3.299072265625, -2.634765625, -1.970458984375, -1.30615234375, -0.641845703125, 0.0224609375, 0.686767578125, 1.35107421875, 2.015380859375, 2.6796875, 3.343994140625, 4.00830078125, 4.672607421875, 5.3369140625, 6.001220703125, 6.66552734375, 7.329833984375, 7.994140625, 8.658447265625, 9.32275390625, 9.987060546875, 10.6513671875, 11.315673828125, 11.97998046875, 12.644287109375, 13.30859375, 13.972900390625, 14.63720703125, 15.301513671875, 15.9658203125, 16.630126953125, 17.29443359375, 17.958740234375, 18.623046875, 19.287353515625, 19.95166015625, 20.615966796875, 21.2802734375, 21.944580078125, 22.60888671875, 23.273193359375, 23.9375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 8.0, 13.0, 21.0, 32.0, 37.0, 79.0, 149.0, 318.0, 744.0, 1184.0, 752.0, 350.0, 167.0, 77.0, 47.0, 24.0, 18.0, 12.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -6.96490478515625, -6.6680908203125, -6.37127685546875, -6.074462890625, -5.77764892578125, -5.4808349609375, -5.18402099609375, -4.88720703125, -4.59039306640625, -4.2935791015625, -3.99676513671875, -3.699951171875, -3.40313720703125, -3.1063232421875, -2.80950927734375, -2.5126953125, -2.21588134765625, -1.9190673828125, -1.62225341796875, -1.325439453125, -1.02862548828125, -0.7318115234375, -0.43499755859375, -0.13818359375, 0.15863037109375, 0.4554443359375, 0.75225830078125, 1.049072265625, 1.34588623046875, 1.6427001953125, 1.93951416015625, 2.236328125, 2.53314208984375, 2.8299560546875, 3.12677001953125, 3.423583984375, 3.72039794921875, 4.0172119140625, 4.31402587890625, 4.61083984375, 4.90765380859375, 5.2044677734375, 5.50128173828125, 5.798095703125, 6.09490966796875, 6.3917236328125, 6.68853759765625, 6.9853515625, 7.28216552734375, 7.5789794921875, 7.87579345703125, 8.172607421875, 8.46942138671875, 8.7662353515625, 9.06304931640625, 9.35986328125, 9.65667724609375, 9.9534912109375, 10.25030517578125, 10.547119140625, 10.84393310546875, 11.1407470703125, 11.43756103515625, 11.734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 10.0, 18.0, 54.0, 73.0, 105.0, 145.0, 189.0, 141.0, 114.0, 62.0, 31.0, 23.0, 9.0, 8.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.0606689453125, -90.87197875976562, -88.68328857421875, -86.4946060180664, -84.30591583251953, -82.11722564697266, -79.92854309082031, -77.73985290527344, -75.55116271972656, -73.36247253417969, -71.17378234863281, -68.98509979248047, -66.7964096069336, -64.60771942138672, -62.41903305053711, -60.2303466796875, -58.041656494140625, -55.85296630859375, -53.66427993774414, -51.47559356689453, -49.286903381347656, -47.09821319580078, -44.90952682495117, -42.72084045410156, -40.53215026855469, -38.34346008300781, -36.1547737121582, -33.966087341308594, -31.77739715576172, -29.588708877563477, -27.400020599365234, -25.211332321166992, -23.02264404296875, -20.833955764770508, -18.645267486572266, -16.456579208374023, -14.267890930175781, -12.079202651977539, -9.890514373779297, -7.701826095581055, -5.5131378173828125, -3.3244495391845703, -1.1357612609863281, 1.052927017211914, 3.2416152954101562, 5.430303573608398, 7.618991851806641, 9.807680130004883, 11.996368408203125, 14.185056686401367, 16.37374496459961, 18.56243324279785, 20.751121520996094, 22.939809799194336, 25.128498077392578, 27.31718635559082, 29.505874633789062, 31.694562911987305, 33.88325119018555, 36.071937561035156, 38.26062774658203, 40.449317932128906, 42.638004302978516, 44.826690673828125, 47.015380859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 2.0, 8.0, 6.0, 10.0, 14.0, 13.0, 25.0, 26.0, 34.0, 33.0, 53.0, 59.0, 56.0, 47.0, 55.0, 46.0, 50.0, 56.0, 46.0, 39.0, 40.0, 49.0, 30.0, 35.0, 33.0, 22.0, 26.0, 16.0, 16.0, 10.0, 8.0, 10.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.73828887939453, -34.621551513671875, -33.504817962646484, -32.388084411621094, -31.271347045898438, -30.154611587524414, -29.03787612915039, -27.921140670776367, -26.804405212402344, -25.68766975402832, -24.570934295654297, -23.454198837280273, -22.33746337890625, -21.220727920532227, -20.103992462158203, -18.98725700378418, -17.870521545410156, -16.753786087036133, -15.63705062866211, -14.520315170288086, -13.403579711914062, -12.286844253540039, -11.170108795166016, -10.053373336791992, -8.936637878417969, -7.819902420043945, -6.703166961669922, -5.586431503295898, -4.469696044921875, -3.3529605865478516, -2.236225128173828, -1.1194896697998047, -0.002750396728515625, 1.1139850616455078, 2.2307205200195312, 3.3474559783935547, 4.464191436767578, 5.580926895141602, 6.697662353515625, 7.814397811889648, 8.931133270263672, 10.047868728637695, 11.164604187011719, 12.281339645385742, 13.398075103759766, 14.514810562133789, 15.631546020507812, 16.748281478881836, 17.86501693725586, 18.981752395629883, 20.098487854003906, 21.21522331237793, 22.331958770751953, 23.448694229125977, 24.5654296875, 25.682165145874023, 26.798900604248047, 27.91563606262207, 29.032371520996094, 30.149106979370117, 31.26584243774414, 32.38257598876953, 33.49931335449219, 34.616050720214844, 35.732784271240234]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 14.0, 10.0, 14.0, 56.0, 90.0, 165.0, 392.0, 1051.0, 3017.0, 10336.0, 49125.0, 328098.0, 544558.0, 88188.0, 16695.0, 4326.0, 1369.0, 591.0, 234.0, 104.0, 50.0, 30.0, 15.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.0067138671875, -7.732177734375, -7.4576416015625, -7.18310546875, -6.9085693359375, -6.634033203125, -6.3594970703125, -6.0849609375, -5.8104248046875, -5.535888671875, -5.2613525390625, -4.98681640625, -4.7122802734375, -4.437744140625, -4.1632080078125, -3.888671875, -3.6141357421875, -3.339599609375, -3.0650634765625, -2.79052734375, -2.5159912109375, -2.241455078125, -1.9669189453125, -1.6923828125, -1.4178466796875, -1.143310546875, -0.8687744140625, -0.59423828125, -0.3197021484375, -0.045166015625, 0.2293701171875, 0.50390625, 0.7784423828125, 1.052978515625, 1.3275146484375, 1.60205078125, 1.8765869140625, 2.151123046875, 2.4256591796875, 2.7001953125, 2.9747314453125, 3.249267578125, 3.5238037109375, 3.79833984375, 4.0728759765625, 4.347412109375, 4.6219482421875, 4.896484375, 5.1710205078125, 5.445556640625, 5.7200927734375, 5.99462890625, 6.2691650390625, 6.543701171875, 6.8182373046875, 7.0927734375, 7.3673095703125, 7.641845703125, 7.9163818359375, 8.19091796875, 8.4654541015625, 8.739990234375, 9.0145263671875, 9.2890625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 11.0, 9.0, 7.0, 18.0, 25.0, 16.0, 25.0, 29.0, 37.0, 38.0, 39.0, 42.0, 31.0, 48.0, 41.0, 45.0, 44.0, 47.0, 53.0, 47.0, 47.0, 40.0, 31.0, 32.0, 29.0, 25.0, 24.0, 22.0, 15.0, 15.0, 11.0, 7.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.94915771484375, -2.8572998046875, -2.76544189453125, -2.673583984375, -2.58172607421875, -2.4898681640625, -2.39801025390625, -2.30615234375, -2.21429443359375, -2.1224365234375, -2.03057861328125, -1.938720703125, -1.84686279296875, -1.7550048828125, -1.66314697265625, -1.5712890625, -1.47943115234375, -1.3875732421875, -1.29571533203125, -1.203857421875, -1.11199951171875, -1.0201416015625, -0.92828369140625, -0.83642578125, -0.74456787109375, -0.6527099609375, -0.56085205078125, -0.468994140625, -0.37713623046875, -0.2852783203125, -0.19342041015625, -0.1015625, -0.00970458984375, 0.0821533203125, 0.17401123046875, 0.265869140625, 0.35772705078125, 0.4495849609375, 0.54144287109375, 0.63330078125, 0.72515869140625, 0.8170166015625, 0.90887451171875, 1.000732421875, 1.09259033203125, 1.1844482421875, 1.27630615234375, 1.3681640625, 1.46002197265625, 1.5518798828125, 1.64373779296875, 1.735595703125, 1.82745361328125, 1.9193115234375, 2.01116943359375, 2.10302734375, 2.19488525390625, 2.2867431640625, 2.37860107421875, 2.470458984375, 2.56231689453125, 2.6541748046875, 2.74603271484375, 2.837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 5.0, 19.0, 25.0, 27.0, 32.0, 59.0, 89.0, 143.0, 201.0, 363.0, 667.0, 1414.0, 4193.0, 18018.0, 140661.0, 778332.0, 85434.0, 12858.0, 3364.0, 1184.0, 584.0, 310.0, 194.0, 113.0, 96.0, 51.0, 34.0, 21.0, 14.0, 17.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8671875, -8.53125, -8.1953125, -7.859375, -7.5234375, -7.1875, -6.8515625, -6.515625, -6.1796875, -5.84375, -5.5078125, -5.171875, -4.8359375, -4.5, -4.1640625, -3.828125, -3.4921875, -3.15625, -2.8203125, -2.484375, -2.1484375, -1.8125, -1.4765625, -1.140625, -0.8046875, -0.46875, -0.1328125, 0.203125, 0.5390625, 0.875, 1.2109375, 1.546875, 1.8828125, 2.21875, 2.5546875, 2.890625, 3.2265625, 3.5625, 3.8984375, 4.234375, 4.5703125, 4.90625, 5.2421875, 5.578125, 5.9140625, 6.25, 6.5859375, 6.921875, 7.2578125, 7.59375, 7.9296875, 8.265625, 8.6015625, 8.9375, 9.2734375, 9.609375, 9.9453125, 10.28125, 10.6171875, 10.953125, 11.2890625, 11.625, 11.9609375, 12.296875, 12.6328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 7.0, 7.0, 7.0, 8.0, 12.0, 11.0, 18.0, 21.0, 15.0, 22.0, 21.0, 28.0, 39.0, 41.0, 46.0, 47.0, 58.0, 56.0, 49.0, 51.0, 57.0, 44.0, 64.0, 42.0, 37.0, 31.0, 35.0, 23.0, 18.0, 14.0, 16.0, 13.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.859375, -10.48583984375, -10.1123046875, -9.73876953125, -9.365234375, -8.99169921875, -8.6181640625, -8.24462890625, -7.87109375, -7.49755859375, -7.1240234375, -6.75048828125, -6.376953125, -6.00341796875, -5.6298828125, -5.25634765625, -4.8828125, -4.50927734375, -4.1357421875, -3.76220703125, -3.388671875, -3.01513671875, -2.6416015625, -2.26806640625, -1.89453125, -1.52099609375, -1.1474609375, -0.77392578125, -0.400390625, -0.02685546875, 0.3466796875, 0.72021484375, 1.09375, 1.46728515625, 1.8408203125, 2.21435546875, 2.587890625, 2.96142578125, 3.3349609375, 3.70849609375, 4.08203125, 4.45556640625, 4.8291015625, 5.20263671875, 5.576171875, 5.94970703125, 6.3232421875, 6.69677734375, 7.0703125, 7.44384765625, 7.8173828125, 8.19091796875, 8.564453125, 8.93798828125, 9.3115234375, 9.68505859375, 10.05859375, 10.43212890625, 10.8056640625, 11.17919921875, 11.552734375, 11.92626953125, 12.2998046875, 12.67333984375, 13.046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 15.0, 16.0, 17.0, 18.0, 44.0, 48.0, 90.0, 156.0, 204.0, 405.0, 722.0, 1345.0, 2907.0, 6967.0, 19566.0, 66449.0, 604786.0, 266721.0, 51024.0, 15863.0, 5925.0, 2598.0, 1165.0, 595.0, 343.0, 218.0, 114.0, 70.0, 60.0, 37.0, 17.0, 19.0, 8.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.044921875, -2.960113525390625, -2.87530517578125, -2.790496826171875, -2.7056884765625, -2.620880126953125, -2.53607177734375, -2.451263427734375, -2.366455078125, -2.281646728515625, -2.19683837890625, -2.112030029296875, -2.0272216796875, -1.942413330078125, -1.85760498046875, -1.772796630859375, -1.68798828125, -1.603179931640625, -1.51837158203125, -1.433563232421875, -1.3487548828125, -1.263946533203125, -1.17913818359375, -1.094329833984375, -1.009521484375, -0.924713134765625, -0.83990478515625, -0.755096435546875, -0.6702880859375, -0.585479736328125, -0.50067138671875, -0.415863037109375, -0.3310546875, -0.246246337890625, -0.16143798828125, -0.076629638671875, 0.0081787109375, 0.092987060546875, 0.17779541015625, 0.262603759765625, 0.347412109375, 0.432220458984375, 0.51702880859375, 0.601837158203125, 0.6866455078125, 0.771453857421875, 0.85626220703125, 0.941070556640625, 1.02587890625, 1.110687255859375, 1.19549560546875, 1.280303955078125, 1.3651123046875, 1.449920654296875, 1.53472900390625, 1.619537353515625, 1.704345703125, 1.789154052734375, 1.87396240234375, 1.958770751953125, 2.0435791015625, 2.128387451171875, 2.21319580078125, 2.298004150390625, 2.3828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 9.0, 6.0, 15.0, 29.0, 39.0, 62.0, 126.0, 252.0, 203.0, 93.0, 54.0, 30.0, 24.0, 12.0, 7.0, 7.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013713836669921875, -0.0013296008110046387, -0.0012878179550170898, -0.001246035099029541, -0.0012042522430419922, -0.0011624693870544434, -0.0011206865310668945, -0.0010789036750793457, -0.0010371208190917969, -0.000995337963104248, -0.0009535551071166992, -0.0009117722511291504, -0.0008699893951416016, -0.0008282065391540527, -0.0007864236831665039, -0.0007446408271789551, -0.0007028579711914062, -0.0006610751152038574, -0.0006192922592163086, -0.0005775094032287598, -0.0005357265472412109, -0.0004939436912536621, -0.0004521608352661133, -0.00041037797927856445, -0.0003685951232910156, -0.0003268122673034668, -0.00028502941131591797, -0.00024324655532836914, -0.0002014636993408203, -0.00015968084335327148, -0.00011789798736572266, -7.611513137817383e-05, -3.4332275390625e-05, 7.450580596923828e-06, 4.9233436584472656e-05, 9.101629257202148e-05, 0.0001327991485595703, 0.00017458200454711914, 0.00021636486053466797, 0.0002581477165222168, 0.0002999305725097656, 0.00034171342849731445, 0.0003834962844848633, 0.0004252791404724121, 0.00046706199645996094, 0.0005088448524475098, 0.0005506277084350586, 0.0005924105644226074, 0.0006341934204101562, 0.0006759762763977051, 0.0007177591323852539, 0.0007595419883728027, 0.0008013248443603516, 0.0008431077003479004, 0.0008848905563354492, 0.000926673412322998, 0.0009684562683105469, 0.0010102391242980957, 0.0010520219802856445, 0.0010938048362731934, 0.0011355876922607422, 0.001177370548248291, 0.0012191534042358398, 0.0012609362602233887, 0.0013027191162109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 27.0, 26.0, 46.0, 37.0, 69.0, 130.0, 200.0, 296.0, 542.0, 998.0, 1861.0, 4145.0, 10466.0, 33125.0, 144833.0, 706200.0, 103557.0, 25972.0, 8715.0, 3622.0, 1675.0, 788.0, 443.0, 273.0, 165.0, 112.0, 76.0, 41.0, 35.0, 25.0, 18.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.998046875, -2.905517578125, -2.81298828125, -2.720458984375, -2.6279296875, -2.535400390625, -2.44287109375, -2.350341796875, -2.2578125, -2.165283203125, -2.07275390625, -1.980224609375, -1.8876953125, -1.795166015625, -1.70263671875, -1.610107421875, -1.517578125, -1.425048828125, -1.33251953125, -1.239990234375, -1.1474609375, -1.054931640625, -0.96240234375, -0.869873046875, -0.77734375, -0.684814453125, -0.59228515625, -0.499755859375, -0.4072265625, -0.314697265625, -0.22216796875, -0.129638671875, -0.037109375, 0.055419921875, 0.14794921875, 0.240478515625, 0.3330078125, 0.425537109375, 0.51806640625, 0.610595703125, 0.703125, 0.795654296875, 0.88818359375, 0.980712890625, 1.0732421875, 1.165771484375, 1.25830078125, 1.350830078125, 1.443359375, 1.535888671875, 1.62841796875, 1.720947265625, 1.8134765625, 1.906005859375, 1.99853515625, 2.091064453125, 2.18359375, 2.276123046875, 2.36865234375, 2.461181640625, 2.5537109375, 2.646240234375, 2.73876953125, 2.831298828125, 2.923828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 9.0, 11.0, 17.0, 25.0, 31.0, 31.0, 45.0, 76.0, 116.0, 165.0, 137.0, 92.0, 63.0, 42.0, 34.0, 21.0, 11.0, 12.0, 16.0, 8.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.2740478515625, -2.169189453125, -2.0643310546875, -1.95947265625, -1.8546142578125, -1.749755859375, -1.6448974609375, -1.5400390625, -1.4351806640625, -1.330322265625, -1.2254638671875, -1.12060546875, -1.0157470703125, -0.910888671875, -0.8060302734375, -0.701171875, -0.5963134765625, -0.491455078125, -0.3865966796875, -0.28173828125, -0.1768798828125, -0.072021484375, 0.0328369140625, 0.1376953125, 0.2425537109375, 0.347412109375, 0.4522705078125, 0.55712890625, 0.6619873046875, 0.766845703125, 0.8717041015625, 0.9765625, 1.0814208984375, 1.186279296875, 1.2911376953125, 1.39599609375, 1.5008544921875, 1.605712890625, 1.7105712890625, 1.8154296875, 1.9202880859375, 2.025146484375, 2.1300048828125, 2.23486328125, 2.3397216796875, 2.444580078125, 2.5494384765625, 2.654296875, 2.7591552734375, 2.864013671875, 2.9688720703125, 3.07373046875, 3.1785888671875, 3.283447265625, 3.3883056640625, 3.4931640625, 3.5980224609375, 3.702880859375, 3.8077392578125, 3.91259765625, 4.0174560546875, 4.122314453125, 4.2271728515625, 4.33203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 19.0, 19.0, 48.0, 71.0, 125.0, 283.0, 220.0, 101.0, 52.0, 25.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.37322998046875, -61.88349914550781, -59.393768310546875, -56.90403747558594, -54.414306640625, -51.92457580566406, -49.43484115600586, -46.94511032104492, -44.455379486083984, -41.96564865112305, -39.47591781616211, -36.98618698120117, -34.49645233154297, -32.00672149658203, -29.516990661621094, -27.027259826660156, -24.53752899169922, -22.04779815673828, -19.558067321777344, -17.068334579467773, -14.578603744506836, -12.088872909545898, -9.599141120910645, -7.109409332275391, -4.619678497314453, -2.1299471855163574, 0.3597841262817383, 2.849515438079834, 5.33924674987793, 7.828977584838867, 10.318709373474121, 12.808441162109375, 15.298171997070312, 17.78790283203125, 20.277633666992188, 22.767366409301758, 25.257097244262695, 27.746828079223633, 30.236560821533203, 32.72629165649414, 35.21602249145508, 37.705753326416016, 40.19548416137695, 42.68521499633789, 45.174949645996094, 47.66468048095703, 50.15441131591797, 52.644142150878906, 55.133872985839844, 57.62360382080078, 60.11333465576172, 62.603065490722656, 65.0927963256836, 67.58252716064453, 70.07225799560547, 72.56199645996094, 75.05172729492188, 77.54145812988281, 80.03118896484375, 82.52091979980469, 85.01065063476562, 87.50038146972656, 89.9901123046875, 92.47984313964844, 94.96957397460938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 6.0, 6.0, 13.0, 9.0, 8.0, 8.0, 15.0, 14.0, 18.0, 13.0, 18.0, 25.0, 18.0, 24.0, 21.0, 32.0, 30.0, 44.0, 56.0, 77.0, 98.0, 80.0, 58.0, 42.0, 27.0, 31.0, 16.0, 27.0, 23.0, 25.0, 14.0, 10.0, 13.0, 14.0, 9.0, 10.0, 8.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.349151611328125, -38.01227569580078, -36.6754035949707, -35.33852767944336, -34.001651763916016, -32.66477966308594, -31.327903747558594, -29.991029739379883, -28.654155731201172, -27.31728172302246, -25.980405807495117, -24.643531799316406, -23.306657791137695, -21.969783782958984, -20.63290786743164, -19.29603385925293, -17.959157943725586, -16.622283935546875, -15.285408973693848, -13.94853401184082, -12.61166000366211, -11.274785041809082, -9.937910079956055, -8.601036071777344, -7.264161109924316, -5.927286624908447, -4.590412139892578, -3.253537178039551, -1.9166626930236816, -0.5797882080078125, 0.7570867538452148, 2.093960762023926, 3.430835723876953, 4.767710208892822, 6.104584693908691, 7.441459655761719, 8.77833366394043, 10.115208625793457, 11.452083587646484, 12.788957595825195, 14.125832557678223, 15.46270751953125, 16.79958152770996, 18.136455535888672, 19.473331451416016, 20.810205459594727, 22.147079467773438, 23.48395538330078, 24.820829391479492, 26.157703399658203, 27.494579315185547, 28.831453323364258, 30.16832733154297, 31.505203247070312, 32.842079162597656, 34.178951263427734, 35.51582717895508, 36.85270309448242, 38.1895751953125, 39.526451110839844, 40.86332702636719, 42.200199127197266, 43.53707504272461, 44.87394714355469, 46.21082305908203]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 6.0, 9.0, 18.0, 22.0, 34.0, 39.0, 78.0, 134.0, 347.0, 845.0, 2740.0, 13030.0, 164695.0, 3698256.0, 291817.0, 17061.0, 3424.0, 984.0, 395.0, 145.0, 62.0, 42.0, 37.0, 15.0, 8.0, 10.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -11.2374267578125, -10.912353515625, -10.5872802734375, -10.26220703125, -9.9371337890625, -9.612060546875, -9.2869873046875, -8.9619140625, -8.6368408203125, -8.311767578125, -7.9866943359375, -7.66162109375, -7.3365478515625, -7.011474609375, -6.6864013671875, -6.361328125, -6.0362548828125, -5.711181640625, -5.3861083984375, -5.06103515625, -4.7359619140625, -4.410888671875, -4.0858154296875, -3.7607421875, -3.4356689453125, -3.110595703125, -2.7855224609375, -2.46044921875, -2.1353759765625, -1.810302734375, -1.4852294921875, -1.16015625, -0.8350830078125, -0.510009765625, -0.1849365234375, 0.14013671875, 0.4652099609375, 0.790283203125, 1.1153564453125, 1.4404296875, 1.7655029296875, 2.090576171875, 2.4156494140625, 2.74072265625, 3.0657958984375, 3.390869140625, 3.7159423828125, 4.041015625, 4.3660888671875, 4.691162109375, 5.0162353515625, 5.34130859375, 5.6663818359375, 5.991455078125, 6.3165283203125, 6.6416015625, 6.9666748046875, 7.291748046875, 7.6168212890625, 7.94189453125, 8.2669677734375, 8.592041015625, 8.9171142578125, 9.2421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 10.0, 14.0, 9.0, 12.0, 23.0, 20.0, 25.0, 31.0, 36.0, 36.0, 40.0, 45.0, 38.0, 55.0, 54.0, 45.0, 55.0, 53.0, 51.0, 44.0, 41.0, 37.0, 36.0, 33.0, 31.0, 18.0, 13.0, 23.0, 12.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.994140625, -2.8956298828125, -2.797119140625, -2.6986083984375, -2.60009765625, -2.5015869140625, -2.403076171875, -2.3045654296875, -2.2060546875, -2.1075439453125, -2.009033203125, -1.9105224609375, -1.81201171875, -1.7135009765625, -1.614990234375, -1.5164794921875, -1.41796875, -1.3194580078125, -1.220947265625, -1.1224365234375, -1.02392578125, -0.9254150390625, -0.826904296875, -0.7283935546875, -0.6298828125, -0.5313720703125, -0.432861328125, -0.3343505859375, -0.23583984375, -0.1373291015625, -0.038818359375, 0.0596923828125, 0.158203125, 0.2567138671875, 0.355224609375, 0.4537353515625, 0.55224609375, 0.6507568359375, 0.749267578125, 0.8477783203125, 0.9462890625, 1.0447998046875, 1.143310546875, 1.2418212890625, 1.34033203125, 1.4388427734375, 1.537353515625, 1.6358642578125, 1.734375, 1.8328857421875, 1.931396484375, 2.0299072265625, 2.12841796875, 2.2269287109375, 2.325439453125, 2.4239501953125, 2.5224609375, 2.6209716796875, 2.719482421875, 2.8179931640625, 2.91650390625, 3.0150146484375, 3.113525390625, 3.2120361328125, 3.310546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 7.0, 9.0, 16.0, 13.0, 17.0, 23.0, 27.0, 53.0, 69.0, 108.0, 211.0, 335.0, 746.0, 1940.0, 10261.0, 189519.0, 3907852.0, 73696.0, 6446.0, 1479.0, 620.0, 304.0, 185.0, 103.0, 57.0, 42.0, 42.0, 26.0, 12.0, 13.0, 10.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-16.546875, -16.0655517578125, -15.584228515625, -15.1029052734375, -14.62158203125, -14.1402587890625, -13.658935546875, -13.1776123046875, -12.6962890625, -12.2149658203125, -11.733642578125, -11.2523193359375, -10.77099609375, -10.2896728515625, -9.808349609375, -9.3270263671875, -8.845703125, -8.3643798828125, -7.883056640625, -7.4017333984375, -6.92041015625, -6.4390869140625, -5.957763671875, -5.4764404296875, -4.9951171875, -4.5137939453125, -4.032470703125, -3.5511474609375, -3.06982421875, -2.5885009765625, -2.107177734375, -1.6258544921875, -1.14453125, -0.6632080078125, -0.181884765625, 0.2994384765625, 0.78076171875, 1.2620849609375, 1.743408203125, 2.2247314453125, 2.7060546875, 3.1873779296875, 3.668701171875, 4.1500244140625, 4.63134765625, 5.1126708984375, 5.593994140625, 6.0753173828125, 6.556640625, 7.0379638671875, 7.519287109375, 8.0006103515625, 8.48193359375, 8.9632568359375, 9.444580078125, 9.9259033203125, 10.4072265625, 10.8885498046875, 11.369873046875, 11.8511962890625, 12.33251953125, 12.8138427734375, 13.295166015625, 13.7764892578125, 14.2578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 12.0, 10.0, 16.0, 29.0, 32.0, 42.0, 71.0, 101.0, 191.0, 391.0, 627.0, 914.0, 685.0, 426.0, 207.0, 96.0, 72.0, 46.0, 27.0, 22.0, 13.0, 9.0, 6.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.055419921875, -6.76708984375, -6.478759765625, -6.1904296875, -5.902099609375, -5.61376953125, -5.325439453125, -5.037109375, -4.748779296875, -4.46044921875, -4.172119140625, -3.8837890625, -3.595458984375, -3.30712890625, -3.018798828125, -2.73046875, -2.442138671875, -2.15380859375, -1.865478515625, -1.5771484375, -1.288818359375, -1.00048828125, -0.712158203125, -0.423828125, -0.135498046875, 0.15283203125, 0.441162109375, 0.7294921875, 1.017822265625, 1.30615234375, 1.594482421875, 1.8828125, 2.171142578125, 2.45947265625, 2.747802734375, 3.0361328125, 3.324462890625, 3.61279296875, 3.901123046875, 4.189453125, 4.477783203125, 4.76611328125, 5.054443359375, 5.3427734375, 5.631103515625, 5.91943359375, 6.207763671875, 6.49609375, 6.784423828125, 7.07275390625, 7.361083984375, 7.6494140625, 7.937744140625, 8.22607421875, 8.514404296875, 8.802734375, 9.091064453125, 9.37939453125, 9.667724609375, 9.9560546875, 10.244384765625, 10.53271484375, 10.821044921875, 11.109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 12.0, 4.0, 10.0, 18.0, 21.0, 48.0, 61.0, 85.0, 102.0, 98.0, 111.0, 89.0, 88.0, 56.0, 41.0, 35.0, 24.0, 24.0, 14.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.08250045776367, -56.4747314453125, -54.86695861816406, -53.25918960571289, -51.65142059326172, -50.04365158081055, -48.435882568359375, -46.82810974121094, -45.220340728759766, -43.612571716308594, -42.004798889160156, -40.397029876708984, -38.78926086425781, -37.18149185180664, -35.57372283935547, -33.96595001220703, -32.35818099975586, -30.750411987304688, -29.142641067504883, -27.534870147705078, -25.927101135253906, -24.319332122802734, -22.71156120300293, -21.103790283203125, -19.496021270751953, -17.88825225830078, -16.280481338500977, -14.672711372375488, -13.06494140625, -11.457171440124512, -9.849401473999023, -8.241631507873535, -6.633857727050781, -5.026087760925293, -3.4183177947998047, -1.8105478286743164, -0.20277786254882812, 1.4049921035766602, 3.0127620697021484, 4.620532035827637, 6.228302001953125, 7.836071968078613, 9.443841934204102, 11.05161190032959, 12.659381866455078, 14.267151832580566, 15.874921798706055, 17.48269271850586, 19.09046173095703, 20.698230743408203, 22.306001663208008, 23.913772583007812, 25.521541595458984, 27.129310607910156, 28.73708152770996, 30.344852447509766, 31.952621459960938, 33.56039047241211, 35.16815948486328, 36.77593231201172, 38.38370132446289, 39.99147033691406, 41.5992431640625, 43.20701217651367, 44.814781188964844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 14.0, 9.0, 13.0, 15.0, 15.0, 26.0, 22.0, 18.0, 37.0, 36.0, 38.0, 56.0, 39.0, 39.0, 43.0, 42.0, 33.0, 41.0, 45.0, 33.0, 33.0, 47.0, 27.0, 43.0, 27.0, 21.0, 23.0, 28.0, 27.0, 19.0, 13.0, 9.0, 11.0, 2.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.074668884277344, -31.95806884765625, -30.841468811035156, -29.724868774414062, -28.60826873779297, -27.491668701171875, -26.37506866455078, -25.258468627929688, -24.141868591308594, -23.0252685546875, -21.908668518066406, -20.792068481445312, -19.67546844482422, -18.558868408203125, -17.44226837158203, -16.325668334960938, -15.209066390991211, -14.092466354370117, -12.975866317749023, -11.85926628112793, -10.742666244506836, -9.626066207885742, -8.509465217590332, -7.392865180969238, -6.2762651443481445, -5.159665107727051, -4.043065071105957, -2.926464557647705, -1.8098645210266113, -0.6932644844055176, 0.4233360290527344, 1.5399360656738281, 2.656536102294922, 3.7731361389160156, 4.889736175537109, 6.006336688995361, 7.122936725616455, 8.23953628540039, 9.3561372756958, 10.472737312316895, 11.589337348937988, 12.705937385559082, 13.822537422180176, 14.939138412475586, 16.05573844909668, 17.172338485717773, 18.288938522338867, 19.40553855895996, 20.522138595581055, 21.63873863220215, 22.755338668823242, 23.871938705444336, 24.98853874206543, 26.105138778686523, 27.22174072265625, 28.338340759277344, 29.454940795898438, 30.57154083251953, 31.688140869140625, 32.80474090576172, 33.92134094238281, 35.037940979003906, 36.154541015625, 37.271141052246094, 38.38774108886719]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 4.0, 7.0, 15.0, 17.0, 24.0, 32.0, 55.0, 79.0, 86.0, 151.0, 169.0, 307.0, 500.0, 751.0, 1130.0, 1953.0, 3205.0, 5724.0, 10185.0, 19624.0, 39682.0, 88460.0, 219362.0, 345381.0, 171160.0, 70640.0, 32688.0, 16151.0, 8826.0, 4861.0, 2667.0, 1633.0, 1049.0, 662.0, 452.0, 285.0, 168.0, 136.0, 78.0, 59.0, 35.0, 28.0, 19.0, 18.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.01470947265625, -3.8731689453125, -3.73162841796875, -3.590087890625, -3.44854736328125, -3.3070068359375, -3.16546630859375, -3.02392578125, -2.88238525390625, -2.7408447265625, -2.59930419921875, -2.457763671875, -2.31622314453125, -2.1746826171875, -2.03314208984375, -1.8916015625, -1.75006103515625, -1.6085205078125, -1.46697998046875, -1.325439453125, -1.18389892578125, -1.0423583984375, -0.90081787109375, -0.75927734375, -0.61773681640625, -0.4761962890625, -0.33465576171875, -0.193115234375, -0.05157470703125, 0.0899658203125, 0.23150634765625, 0.373046875, 0.51458740234375, 0.6561279296875, 0.79766845703125, 0.939208984375, 1.08074951171875, 1.2222900390625, 1.36383056640625, 1.50537109375, 1.64691162109375, 1.7884521484375, 1.92999267578125, 2.071533203125, 2.21307373046875, 2.3546142578125, 2.49615478515625, 2.6376953125, 2.77923583984375, 2.9207763671875, 3.06231689453125, 3.203857421875, 3.34539794921875, 3.4869384765625, 3.62847900390625, 3.77001953125, 3.91156005859375, 4.0531005859375, 4.19464111328125, 4.336181640625, 4.47772216796875, 4.6192626953125, 4.76080322265625, 4.90234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 1.0, 9.0, 6.0, 14.0, 15.0, 9.0, 10.0, 19.0, 14.0, 21.0, 24.0, 31.0, 30.0, 35.0, 42.0, 43.0, 45.0, 62.0, 44.0, 58.0, 44.0, 34.0, 50.0, 37.0, 29.0, 36.0, 35.0, 23.0, 36.0, 27.0, 15.0, 15.0, 16.0, 18.0, 12.0, 14.0, 8.0, 8.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.01470947265625, -2.9161376953125, -2.81756591796875, -2.718994140625, -2.62042236328125, -2.5218505859375, -2.42327880859375, -2.32470703125, -2.22613525390625, -2.1275634765625, -2.02899169921875, -1.930419921875, -1.83184814453125, -1.7332763671875, -1.63470458984375, -1.5361328125, -1.43756103515625, -1.3389892578125, -1.24041748046875, -1.141845703125, -1.04327392578125, -0.9447021484375, -0.84613037109375, -0.74755859375, -0.64898681640625, -0.5504150390625, -0.45184326171875, -0.353271484375, -0.25469970703125, -0.1561279296875, -0.05755615234375, 0.041015625, 0.13958740234375, 0.2381591796875, 0.33673095703125, 0.435302734375, 0.53387451171875, 0.6324462890625, 0.73101806640625, 0.82958984375, 0.92816162109375, 1.0267333984375, 1.12530517578125, 1.223876953125, 1.32244873046875, 1.4210205078125, 1.51959228515625, 1.6181640625, 1.71673583984375, 1.8153076171875, 1.91387939453125, 2.012451171875, 2.11102294921875, 2.2095947265625, 2.30816650390625, 2.40673828125, 2.50531005859375, 2.6038818359375, 2.70245361328125, 2.801025390625, 2.89959716796875, 2.9981689453125, 3.09674072265625, 3.1953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 6.0, 10.0, 10.0, 15.0, 23.0, 21.0, 47.0, 61.0, 81.0, 105.0, 224.0, 278.0, 451.0, 795.0, 1582.0, 3674.0, 12752.0, 90053.0, 823811.0, 94419.0, 12913.0, 3736.0, 1469.0, 737.0, 444.0, 273.0, 166.0, 127.0, 77.0, 60.0, 41.0, 19.0, 19.0, 15.0, 10.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.671875, -12.293701171875, -11.91552734375, -11.537353515625, -11.1591796875, -10.781005859375, -10.40283203125, -10.024658203125, -9.646484375, -9.268310546875, -8.89013671875, -8.511962890625, -8.1337890625, -7.755615234375, -7.37744140625, -6.999267578125, -6.62109375, -6.242919921875, -5.86474609375, -5.486572265625, -5.1083984375, -4.730224609375, -4.35205078125, -3.973876953125, -3.595703125, -3.217529296875, -2.83935546875, -2.461181640625, -2.0830078125, -1.704833984375, -1.32666015625, -0.948486328125, -0.5703125, -0.192138671875, 0.18603515625, 0.564208984375, 0.9423828125, 1.320556640625, 1.69873046875, 2.076904296875, 2.455078125, 2.833251953125, 3.21142578125, 3.589599609375, 3.9677734375, 4.345947265625, 4.72412109375, 5.102294921875, 5.48046875, 5.858642578125, 6.23681640625, 6.614990234375, 6.9931640625, 7.371337890625, 7.74951171875, 8.127685546875, 8.505859375, 8.884033203125, 9.26220703125, 9.640380859375, 10.0185546875, 10.396728515625, 10.77490234375, 11.153076171875, 11.53125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 9.0, 4.0, 8.0, 6.0, 10.0, 10.0, 19.0, 33.0, 16.0, 30.0, 39.0, 40.0, 50.0, 42.0, 58.0, 44.0, 59.0, 50.0, 67.0, 52.0, 50.0, 45.0, 42.0, 45.0, 30.0, 22.0, 16.0, 18.0, 14.0, 12.0, 14.0, 12.0, 7.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.7021484375, -12.302734375, -11.9033203125, -11.50390625, -11.1044921875, -10.705078125, -10.3056640625, -9.90625, -9.5068359375, -9.107421875, -8.7080078125, -8.30859375, -7.9091796875, -7.509765625, -7.1103515625, -6.7109375, -6.3115234375, -5.912109375, -5.5126953125, -5.11328125, -4.7138671875, -4.314453125, -3.9150390625, -3.515625, -3.1162109375, -2.716796875, -2.3173828125, -1.91796875, -1.5185546875, -1.119140625, -0.7197265625, -0.3203125, 0.0791015625, 0.478515625, 0.8779296875, 1.27734375, 1.6767578125, 2.076171875, 2.4755859375, 2.875, 3.2744140625, 3.673828125, 4.0732421875, 4.47265625, 4.8720703125, 5.271484375, 5.6708984375, 6.0703125, 6.4697265625, 6.869140625, 7.2685546875, 7.66796875, 8.0673828125, 8.466796875, 8.8662109375, 9.265625, 9.6650390625, 10.064453125, 10.4638671875, 10.86328125, 11.2626953125, 11.662109375, 12.0615234375, 12.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 8.0, 12.0, 23.0, 24.0, 46.0, 59.0, 90.0, 138.0, 213.0, 388.0, 728.0, 1391.0, 3352.0, 10549.0, 52125.0, 829399.0, 123537.0, 17513.0, 4868.0, 1942.0, 970.0, 479.0, 235.0, 141.0, 101.0, 55.0, 49.0, 38.0, 26.0, 19.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.134521484375, -5.94091796875, -5.747314453125, -5.5537109375, -5.360107421875, -5.16650390625, -4.972900390625, -4.779296875, -4.585693359375, -4.39208984375, -4.198486328125, -4.0048828125, -3.811279296875, -3.61767578125, -3.424072265625, -3.23046875, -3.036865234375, -2.84326171875, -2.649658203125, -2.4560546875, -2.262451171875, -2.06884765625, -1.875244140625, -1.681640625, -1.488037109375, -1.29443359375, -1.100830078125, -0.9072265625, -0.713623046875, -0.52001953125, -0.326416015625, -0.1328125, 0.060791015625, 0.25439453125, 0.447998046875, 0.6416015625, 0.835205078125, 1.02880859375, 1.222412109375, 1.416015625, 1.609619140625, 1.80322265625, 1.996826171875, 2.1904296875, 2.384033203125, 2.57763671875, 2.771240234375, 2.96484375, 3.158447265625, 3.35205078125, 3.545654296875, 3.7392578125, 3.932861328125, 4.12646484375, 4.320068359375, 4.513671875, 4.707275390625, 4.90087890625, 5.094482421875, 5.2880859375, 5.481689453125, 5.67529296875, 5.868896484375, 6.0625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 31.0, 36.0, 43.0, 81.0, 148.0, 228.0, 136.0, 74.0, 51.0, 24.0, 20.0, 17.0, 10.0, 10.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0], "bins": [-0.0018157958984375, -0.0017684698104858398, -0.0017211437225341797, -0.0016738176345825195, -0.0016264915466308594, -0.0015791654586791992, -0.001531839370727539, -0.001484513282775879, -0.0014371871948242188, -0.0013898611068725586, -0.0013425350189208984, -0.0012952089309692383, -0.0012478828430175781, -0.001200556755065918, -0.0011532306671142578, -0.0011059045791625977, -0.0010585784912109375, -0.0010112524032592773, -0.0009639263153076172, -0.000916600227355957, -0.0008692741394042969, -0.0008219480514526367, -0.0007746219635009766, -0.0007272958755493164, -0.0006799697875976562, -0.0006326436996459961, -0.0005853176116943359, -0.0005379915237426758, -0.0004906654357910156, -0.00044333934783935547, -0.0003960132598876953, -0.00034868717193603516, -0.000301361083984375, -0.00025403499603271484, -0.0002067089080810547, -0.00015938282012939453, -0.00011205673217773438, -6.473064422607422e-05, -1.7404556274414062e-05, 2.9921531677246094e-05, 7.724761962890625e-05, 0.0001245737075805664, 0.00017189979553222656, 0.00021922588348388672, 0.0002665519714355469, 0.00031387805938720703, 0.0003612041473388672, 0.00040853023529052734, 0.0004558563232421875, 0.0005031824111938477, 0.0005505084991455078, 0.000597834587097168, 0.0006451606750488281, 0.0006924867630004883, 0.0007398128509521484, 0.0007871389389038086, 0.0008344650268554688, 0.0008817911148071289, 0.0009291172027587891, 0.0009764432907104492, 0.0010237693786621094, 0.0010710954666137695, 0.0011184215545654297, 0.0011657476425170898, 0.00121307373046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 13.0, 11.0, 18.0, 21.0, 33.0, 57.0, 62.0, 119.0, 233.0, 449.0, 895.0, 2245.0, 6949.0, 31940.0, 354561.0, 605819.0, 33678.0, 7241.0, 2277.0, 916.0, 446.0, 214.0, 119.0, 69.0, 49.0, 41.0, 28.0, 17.0, 6.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.52734375, -5.34912109375, -5.1708984375, -4.99267578125, -4.814453125, -4.63623046875, -4.4580078125, -4.27978515625, -4.1015625, -3.92333984375, -3.7451171875, -3.56689453125, -3.388671875, -3.21044921875, -3.0322265625, -2.85400390625, -2.67578125, -2.49755859375, -2.3193359375, -2.14111328125, -1.962890625, -1.78466796875, -1.6064453125, -1.42822265625, -1.25, -1.07177734375, -0.8935546875, -0.71533203125, -0.537109375, -0.35888671875, -0.1806640625, -0.00244140625, 0.17578125, 0.35400390625, 0.5322265625, 0.71044921875, 0.888671875, 1.06689453125, 1.2451171875, 1.42333984375, 1.6015625, 1.77978515625, 1.9580078125, 2.13623046875, 2.314453125, 2.49267578125, 2.6708984375, 2.84912109375, 3.02734375, 3.20556640625, 3.3837890625, 3.56201171875, 3.740234375, 3.91845703125, 4.0966796875, 4.27490234375, 4.453125, 4.63134765625, 4.8095703125, 4.98779296875, 5.166015625, 5.34423828125, 5.5224609375, 5.70068359375, 5.87890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 5.0, 11.0, 7.0, 14.0, 26.0, 40.0, 45.0, 54.0, 83.0, 88.0, 137.0, 121.0, 90.0, 63.0, 49.0, 40.0, 31.0, 33.0, 22.0, 9.0, 11.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.520599365234375, -3.36737060546875, -3.214141845703125, -3.0609130859375, -2.907684326171875, -2.75445556640625, -2.601226806640625, -2.447998046875, -2.294769287109375, -2.14154052734375, -1.988311767578125, -1.8350830078125, -1.681854248046875, -1.52862548828125, -1.375396728515625, -1.22216796875, -1.068939208984375, -0.91571044921875, -0.762481689453125, -0.6092529296875, -0.456024169921875, -0.30279541015625, -0.149566650390625, 0.003662109375, 0.156890869140625, 0.31011962890625, 0.463348388671875, 0.6165771484375, 0.769805908203125, 0.92303466796875, 1.076263427734375, 1.2294921875, 1.382720947265625, 1.53594970703125, 1.689178466796875, 1.8424072265625, 1.995635986328125, 2.14886474609375, 2.302093505859375, 2.455322265625, 2.608551025390625, 2.76177978515625, 2.915008544921875, 3.0682373046875, 3.221466064453125, 3.37469482421875, 3.527923583984375, 3.68115234375, 3.834381103515625, 3.98760986328125, 4.140838623046875, 4.2940673828125, 4.447296142578125, 4.60052490234375, 4.753753662109375, 4.906982421875, 5.060211181640625, 5.21343994140625, 5.366668701171875, 5.5198974609375, 5.673126220703125, 5.82635498046875, 5.979583740234375, 6.1328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 10.0, 6.0, 20.0, 30.0, 77.0, 227.0, 541.0, 80.0, 13.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.19970703125, -410.7074890136719, -402.2152404785156, -393.7230224609375, -385.23077392578125, -376.7385559082031, -368.2463073730469, -359.75408935546875, -351.2618408203125, -342.7696228027344, -334.2773742675781, -325.78515625, -317.29290771484375, -308.8006896972656, -300.3084411621094, -291.81622314453125, -283.3240051269531, -274.831787109375, -266.33953857421875, -257.8473205566406, -249.35507202148438, -240.86285400390625, -232.37062072753906, -223.87838745117188, -215.3861541748047, -206.8939208984375, -198.4016876220703, -189.90945434570312, -181.417236328125, -172.92498779296875, -164.43276977539062, -155.94053649902344, -147.4483184814453, -138.95608520507812, -130.46385192871094, -121.97162628173828, -113.4793930053711, -104.9871597290039, -96.49493408203125, -88.00270080566406, -79.51046752929688, -71.01823425292969, -62.526004791259766, -54.033775329589844, -45.541542053222656, -37.04930877685547, -28.557079315185547, -20.064849853515625, -11.572616577148438, -3.080385208129883, 5.411846160888672, 13.904077529907227, 22.39630889892578, 30.88854217529297, 39.38077163696289, 47.87300109863281, 56.365234375, 64.85746765136719, 73.34970092773438, 81.84192657470703, 90.33415985107422, 98.8263931274414, 107.31861877441406, 115.81085205078125, 124.30308532714844]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 4.0, 11.0, 7.0, 10.0, 3.0, 13.0, 21.0, 15.0, 16.0, 30.0, 29.0, 31.0, 36.0, 34.0, 48.0, 62.0, 113.0, 138.0, 58.0, 54.0, 38.0, 26.0, 36.0, 34.0, 14.0, 20.0, 8.0, 13.0, 16.0, 10.0, 10.0, 5.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.19107437133789, -53.47248077392578, -51.753883361816406, -50.0352897644043, -48.31669616699219, -46.59809875488281, -44.8795051574707, -43.160911560058594, -41.44231414794922, -39.72372055053711, -38.005123138427734, -36.286529541015625, -34.56793212890625, -32.84933853149414, -31.13074493408203, -29.41214942932129, -27.693553924560547, -25.974958419799805, -24.256362915039062, -22.537769317626953, -20.81917381286621, -19.10057830810547, -17.38198471069336, -15.663389205932617, -13.944793701171875, -12.226198196411133, -10.507603645324707, -8.789009094238281, -7.070413589477539, -5.351818084716797, -3.633223533630371, -1.9146289825439453, -0.19603729248046875, 1.5225577354431152, 3.241152763366699, 4.959747791290283, 6.678342819213867, 8.39693832397461, 10.115532875061035, 11.834127426147461, 13.552722930908203, 15.271318435668945, 16.989913940429688, 18.708507537841797, 20.42710304260254, 22.14569854736328, 23.86429214477539, 25.582887649536133, 27.301483154296875, 29.020078659057617, 30.73867416381836, 32.45726776123047, 34.175865173339844, 35.89445877075195, 37.61305236816406, 39.33164978027344, 41.05024337768555, 42.768836975097656, 44.48743438720703, 46.20602798461914, 47.92462158203125, 49.643218994140625, 51.361812591552734, 53.080406188964844, 54.79900360107422]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 8.0, 14.0, 29.0, 46.0, 48.0, 83.0, 141.0, 207.0, 356.0, 645.0, 1334.0, 2976.0, 7153.0, 21991.0, 96140.0, 874706.0, 2653218.0, 451566.0, 57788.0, 15593.0, 5461.0, 2362.0, 1102.0, 526.0, 310.0, 173.0, 122.0, 45.0, 41.0, 35.0, 23.0, 8.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.063232421875, -8.81396484375, -8.564697265625, -8.3154296875, -8.066162109375, -7.81689453125, -7.567626953125, -7.318359375, -7.069091796875, -6.81982421875, -6.570556640625, -6.3212890625, -6.072021484375, -5.82275390625, -5.573486328125, -5.32421875, -5.074951171875, -4.82568359375, -4.576416015625, -4.3271484375, -4.077880859375, -3.82861328125, -3.579345703125, -3.330078125, -3.080810546875, -2.83154296875, -2.582275390625, -2.3330078125, -2.083740234375, -1.83447265625, -1.585205078125, -1.3359375, -1.086669921875, -0.83740234375, -0.588134765625, -0.3388671875, -0.089599609375, 0.15966796875, 0.408935546875, 0.658203125, 0.907470703125, 1.15673828125, 1.406005859375, 1.6552734375, 1.904541015625, 2.15380859375, 2.403076171875, 2.65234375, 2.901611328125, 3.15087890625, 3.400146484375, 3.6494140625, 3.898681640625, 4.14794921875, 4.397216796875, 4.646484375, 4.895751953125, 5.14501953125, 5.394287109375, 5.6435546875, 5.892822265625, 6.14208984375, 6.391357421875, 6.640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 8.0, 14.0, 15.0, 18.0, 18.0, 18.0, 28.0, 36.0, 42.0, 41.0, 44.0, 44.0, 64.0, 46.0, 54.0, 54.0, 53.0, 54.0, 37.0, 48.0, 32.0, 39.0, 31.0, 24.0, 27.0, 28.0, 21.0, 9.0, 14.0, 12.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65234375, -2.54205322265625, -2.4317626953125, -2.32147216796875, -2.211181640625, -2.10089111328125, -1.9906005859375, -1.88031005859375, -1.77001953125, -1.65972900390625, -1.5494384765625, -1.43914794921875, -1.328857421875, -1.21856689453125, -1.1082763671875, -0.99798583984375, -0.8876953125, -0.77740478515625, -0.6671142578125, -0.55682373046875, -0.446533203125, -0.33624267578125, -0.2259521484375, -0.11566162109375, -0.00537109375, 0.10491943359375, 0.2152099609375, 0.32550048828125, 0.435791015625, 0.54608154296875, 0.6563720703125, 0.76666259765625, 0.876953125, 0.98724365234375, 1.0975341796875, 1.20782470703125, 1.318115234375, 1.42840576171875, 1.5386962890625, 1.64898681640625, 1.75927734375, 1.86956787109375, 1.9798583984375, 2.09014892578125, 2.200439453125, 2.31072998046875, 2.4210205078125, 2.53131103515625, 2.6416015625, 2.75189208984375, 2.8621826171875, 2.97247314453125, 3.082763671875, 3.19305419921875, 3.3033447265625, 3.41363525390625, 3.52392578125, 3.63421630859375, 3.7445068359375, 3.85479736328125, 3.965087890625, 4.07537841796875, 4.1856689453125, 4.29595947265625, 4.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 4.0, 22.0, 66.0, 168.0, 517.0, 5571.0, 4183484.0, 3815.0, 429.0, 127.0, 54.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.046875, -84.71875, -81.390625, -78.0625, -74.734375, -71.40625, -68.078125, -64.75, -61.421875, -58.09375, -54.765625, -51.4375, -48.109375, -44.78125, -41.453125, -38.125, -34.796875, -31.46875, -28.140625, -24.8125, -21.484375, -18.15625, -14.828125, -11.5, -8.171875, -4.84375, -1.515625, 1.8125, 5.140625, 8.46875, 11.796875, 15.125, 18.453125, 21.78125, 25.109375, 28.4375, 31.765625, 35.09375, 38.421875, 41.75, 45.078125, 48.40625, 51.734375, 55.0625, 58.390625, 61.71875, 65.046875, 68.375, 71.703125, 75.03125, 78.359375, 81.6875, 85.015625, 88.34375, 91.671875, 95.0, 98.328125, 101.65625, 104.984375, 108.3125, 111.640625, 114.96875, 118.296875, 121.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 23.0, 70.0, 222.0, 788.0, 2010.0, 677.0, 200.0, 59.0, 18.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.0625, -65.67578125, -64.2890625, -62.90234375, -61.515625, -60.12890625, -58.7421875, -57.35546875, -55.96875, -54.58203125, -53.1953125, -51.80859375, -50.421875, -49.03515625, -47.6484375, -46.26171875, -44.875, -43.48828125, -42.1015625, -40.71484375, -39.328125, -37.94140625, -36.5546875, -35.16796875, -33.78125, -32.39453125, -31.0078125, -29.62109375, -28.234375, -26.84765625, -25.4609375, -24.07421875, -22.6875, -21.30078125, -19.9140625, -18.52734375, -17.140625, -15.75390625, -14.3671875, -12.98046875, -11.59375, -10.20703125, -8.8203125, -7.43359375, -6.046875, -4.66015625, -3.2734375, -1.88671875, -0.5, 0.88671875, 2.2734375, 3.66015625, 5.046875, 6.43359375, 7.8203125, 9.20703125, 10.59375, 11.98046875, 13.3671875, 14.75390625, 16.140625, 17.52734375, 18.9140625, 20.30078125, 21.6875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 17.0, 44.0, 69.0, 171.0, 287.0, 180.0, 95.0, 41.0, 22.0, 16.0, 4.0, 7.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-351.4676818847656, -344.0564880371094, -336.64532470703125, -329.234130859375, -321.8229675292969, -314.4117736816406, -307.0005798339844, -299.58941650390625, -292.17822265625, -284.76702880859375, -277.3558654785156, -269.9446716308594, -262.53350830078125, -255.122314453125, -247.7111358642578, -240.29995727539062, -232.88876342773438, -225.4775848388672, -218.06640625, -210.65521240234375, -203.24403381347656, -195.83285522460938, -188.4216766357422, -181.010498046875, -173.5993194580078, -166.18814086914062, -158.77696228027344, -151.3657684326172, -143.95458984375, -136.5434112548828, -129.13223266601562, -121.7210464477539, -114.30986022949219, -106.898681640625, -99.48749542236328, -92.0763168334961, -84.66513061523438, -77.25395202636719, -69.8427734375, -62.43158721923828, -55.02040481567383, -47.609222412109375, -40.19804000854492, -32.78685760498047, -25.37567710876465, -17.964496612548828, -10.553314208984375, -3.142131805419922, 4.269050598144531, 11.680233001708984, 19.091415405273438, 26.502595901489258, 33.913780212402344, 41.32495880126953, 48.736141204833984, 56.14732360839844, 63.55850601196289, 70.96968841552734, 78.38086700439453, 85.79205322265625, 93.20323181152344, 100.61441040039062, 108.02559661865234, 115.43678283691406, 122.84796142578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 6.0, 7.0, 12.0, 21.0, 28.0, 43.0, 62.0, 87.0, 93.0, 107.0, 126.0, 124.0, 82.0, 62.0, 45.0, 31.0, 17.0, 11.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.00119018554688, -150.85809326171875, -144.71499633789062, -138.5718994140625, -132.42880249023438, -126.28569793701172, -120.14259338378906, -113.99949645996094, -107.85639953613281, -101.71330261230469, -95.57020568847656, -89.4271011352539, -83.28400421142578, -77.14090728759766, -70.997802734375, -64.85470581054688, -58.71160888671875, -52.568511962890625, -46.425411224365234, -40.282310485839844, -34.13921356201172, -27.99611473083496, -21.853015899658203, -15.709915161132812, -9.566818237304688, -3.4237194061279297, 2.719379425048828, 8.862478256225586, 15.005577087402344, 21.1486759185791, 27.29177474975586, 33.43487548828125, 39.577972412109375, 45.7210693359375, 51.86417007446289, 58.00727081298828, 64.1503677368164, 70.29346466064453, 76.43656921386719, 82.57966613769531, 88.72276306152344, 94.86585998535156, 101.00895690917969, 107.15206146240234, 113.29515838623047, 119.4382553100586, 125.58135986328125, 131.72445678710938, 137.8675537109375, 144.01065063476562, 150.15374755859375, 156.29684448242188, 162.43994140625, 168.5830535888672, 174.7261505126953, 180.86924743652344, 187.01234436035156, 193.1554412841797, 199.2985382080078, 205.44163513183594, 211.58474731445312, 217.72784423828125, 223.87094116210938, 230.0140380859375, 236.15713500976562]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 16.0, 20.0, 20.0, 22.0, 35.0, 44.0, 65.0, 73.0, 83.0, 142.0, 221.0, 341.0, 554.0, 895.0, 1516.0, 2814.0, 5628.0, 12904.0, 35996.0, 144215.0, 628438.0, 150916.0, 37654.0, 13228.0, 5774.0, 2819.0, 1559.0, 851.0, 531.0, 345.0, 223.0, 146.0, 112.0, 81.0, 62.0, 51.0, 42.0, 25.0, 16.0, 16.0, 14.0, 10.0, 9.0, 9.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.37890625, -6.16986083984375, -5.9608154296875, -5.75177001953125, -5.542724609375, -5.33367919921875, -5.1246337890625, -4.91558837890625, -4.70654296875, -4.49749755859375, -4.2884521484375, -4.07940673828125, -3.870361328125, -3.66131591796875, -3.4522705078125, -3.24322509765625, -3.0341796875, -2.82513427734375, -2.6160888671875, -2.40704345703125, -2.197998046875, -1.98895263671875, -1.7799072265625, -1.57086181640625, -1.36181640625, -1.15277099609375, -0.9437255859375, -0.73468017578125, -0.525634765625, -0.31658935546875, -0.1075439453125, 0.10150146484375, 0.310546875, 0.51959228515625, 0.7286376953125, 0.93768310546875, 1.146728515625, 1.35577392578125, 1.5648193359375, 1.77386474609375, 1.98291015625, 2.19195556640625, 2.4010009765625, 2.61004638671875, 2.819091796875, 3.02813720703125, 3.2371826171875, 3.44622802734375, 3.6552734375, 3.86431884765625, 4.0733642578125, 4.28240966796875, 4.491455078125, 4.70050048828125, 4.9095458984375, 5.11859130859375, 5.32763671875, 5.53668212890625, 5.7457275390625, 5.95477294921875, 6.163818359375, 6.37286376953125, 6.5819091796875, 6.79095458984375, 7.0]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 7.0, 12.0, 8.0, 13.0, 23.0, 35.0, 43.0, 57.0, 65.0, 74.0, 75.0, 74.0, 77.0, 73.0, 80.0, 63.0, 45.0, 45.0, 36.0, 29.0, 10.0, 18.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80078125, -6.575439453125, -6.35009765625, -6.124755859375, -5.8994140625, -5.674072265625, -5.44873046875, -5.223388671875, -4.998046875, -4.772705078125, -4.54736328125, -4.322021484375, -4.0966796875, -3.871337890625, -3.64599609375, -3.420654296875, -3.1953125, -2.969970703125, -2.74462890625, -2.519287109375, -2.2939453125, -2.068603515625, -1.84326171875, -1.617919921875, -1.392578125, -1.167236328125, -0.94189453125, -0.716552734375, -0.4912109375, -0.265869140625, -0.04052734375, 0.184814453125, 0.41015625, 0.635498046875, 0.86083984375, 1.086181640625, 1.3115234375, 1.536865234375, 1.76220703125, 1.987548828125, 2.212890625, 2.438232421875, 2.66357421875, 2.888916015625, 3.1142578125, 3.339599609375, 3.56494140625, 3.790283203125, 4.015625, 4.240966796875, 4.46630859375, 4.691650390625, 4.9169921875, 5.142333984375, 5.36767578125, 5.593017578125, 5.818359375, 6.043701171875, 6.26904296875, 6.494384765625, 6.7197265625, 6.945068359375, 7.17041015625, 7.395751953125, 7.62109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 11.0, 18.0, 21.0, 28.0, 43.0, 71.0, 94.0, 202.0, 306.0, 713.0, 2207.0, 13914.0, 860812.0, 159126.0, 8000.0, 1579.0, 578.0, 315.0, 170.0, 97.0, 69.0, 55.0, 27.0, 23.0, 17.0, 9.0, 3.0, 10.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.81591796875, -15.3037109375, -14.79150390625, -14.279296875, -13.76708984375, -13.2548828125, -12.74267578125, -12.23046875, -11.71826171875, -11.2060546875, -10.69384765625, -10.181640625, -9.66943359375, -9.1572265625, -8.64501953125, -8.1328125, -7.62060546875, -7.1083984375, -6.59619140625, -6.083984375, -5.57177734375, -5.0595703125, -4.54736328125, -4.03515625, -3.52294921875, -3.0107421875, -2.49853515625, -1.986328125, -1.47412109375, -0.9619140625, -0.44970703125, 0.0625, 0.57470703125, 1.0869140625, 1.59912109375, 2.111328125, 2.62353515625, 3.1357421875, 3.64794921875, 4.16015625, 4.67236328125, 5.1845703125, 5.69677734375, 6.208984375, 6.72119140625, 7.2333984375, 7.74560546875, 8.2578125, 8.77001953125, 9.2822265625, 9.79443359375, 10.306640625, 10.81884765625, 11.3310546875, 11.84326171875, 12.35546875, 12.86767578125, 13.3798828125, 13.89208984375, 14.404296875, 14.91650390625, 15.4287109375, 15.94091796875, 16.453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 8.0, 10.0, 9.0, 6.0, 7.0, 15.0, 18.0, 12.0, 12.0, 29.0, 28.0, 22.0, 44.0, 52.0, 58.0, 63.0, 76.0, 73.0, 87.0, 63.0, 52.0, 41.0, 35.0, 26.0, 21.0, 28.0, 18.0, 16.0, 15.0, 9.0, 9.0, 7.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.718017578125, -17.01416015625, -16.310302734375, -15.6064453125, -14.902587890625, -14.19873046875, -13.494873046875, -12.791015625, -12.087158203125, -11.38330078125, -10.679443359375, -9.9755859375, -9.271728515625, -8.56787109375, -7.864013671875, -7.16015625, -6.456298828125, -5.75244140625, -5.048583984375, -4.3447265625, -3.640869140625, -2.93701171875, -2.233154296875, -1.529296875, -0.825439453125, -0.12158203125, 0.582275390625, 1.2861328125, 1.989990234375, 2.69384765625, 3.397705078125, 4.1015625, 4.805419921875, 5.50927734375, 6.213134765625, 6.9169921875, 7.620849609375, 8.32470703125, 9.028564453125, 9.732421875, 10.436279296875, 11.14013671875, 11.843994140625, 12.5478515625, 13.251708984375, 13.95556640625, 14.659423828125, 15.36328125, 16.067138671875, 16.77099609375, 17.474853515625, 18.1787109375, 18.882568359375, 19.58642578125, 20.290283203125, 20.994140625, 21.697998046875, 22.40185546875, 23.105712890625, 23.8095703125, 24.513427734375, 25.21728515625, 25.921142578125, 26.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 12.0, 9.0, 15.0, 28.0, 21.0, 27.0, 55.0, 70.0, 94.0, 151.0, 246.0, 494.0, 1047.0, 3062.0, 13205.0, 200382.0, 807031.0, 16353.0, 3552.0, 1297.0, 591.0, 297.0, 159.0, 96.0, 71.0, 49.0, 27.0, 33.0, 18.0, 12.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.677734375, -2.588653564453125, -2.49957275390625, -2.410491943359375, -2.3214111328125, -2.232330322265625, -2.14324951171875, -2.054168701171875, -1.965087890625, -1.876007080078125, -1.78692626953125, -1.697845458984375, -1.6087646484375, -1.519683837890625, -1.43060302734375, -1.341522216796875, -1.25244140625, -1.163360595703125, -1.07427978515625, -0.985198974609375, -0.8961181640625, -0.807037353515625, -0.71795654296875, -0.628875732421875, -0.539794921875, -0.450714111328125, -0.36163330078125, -0.272552490234375, -0.1834716796875, -0.094390869140625, -0.00531005859375, 0.083770751953125, 0.1728515625, 0.261932373046875, 0.35101318359375, 0.440093994140625, 0.5291748046875, 0.618255615234375, 0.70733642578125, 0.796417236328125, 0.885498046875, 0.974578857421875, 1.06365966796875, 1.152740478515625, 1.2418212890625, 1.330902099609375, 1.41998291015625, 1.509063720703125, 1.59814453125, 1.687225341796875, 1.77630615234375, 1.865386962890625, 1.9544677734375, 2.043548583984375, 2.13262939453125, 2.221710205078125, 2.310791015625, 2.399871826171875, 2.48895263671875, 2.578033447265625, 2.6671142578125, 2.756195068359375, 2.84527587890625, 2.934356689453125, 3.0234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 12.0, 9.0, 16.0, 15.0, 26.0, 35.0, 46.0, 67.0, 140.0, 201.0, 153.0, 94.0, 55.0, 40.0, 28.0, 21.0, 6.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005412101745605469, -0.0005235373973846436, -0.0005058646202087402, -0.0004881918430328369, -0.0004705190658569336, -0.0004528462886810303, -0.00043517351150512695, -0.00041750073432922363, -0.0003998279571533203, -0.000382155179977417, -0.00036448240280151367, -0.00034680962562561035, -0.00032913684844970703, -0.0003114640712738037, -0.0002937912940979004, -0.00027611851692199707, -0.00025844573974609375, -0.00024077296257019043, -0.0002231001853942871, -0.0002054274082183838, -0.00018775463104248047, -0.00017008185386657715, -0.00015240907669067383, -0.0001347362995147705, -0.00011706352233886719, -9.939074516296387e-05, -8.171796798706055e-05, -6.404519081115723e-05, -4.6372413635253906e-05, -2.8699636459350586e-05, -1.1026859283447266e-05, 6.645917892456055e-06, 2.4318695068359375e-05, 4.1991472244262695e-05, 5.9664249420166016e-05, 7.733702659606934e-05, 9.500980377197266e-05, 0.00011268258094787598, 0.0001303553581237793, 0.00014802813529968262, 0.00016570091247558594, 0.00018337368965148926, 0.00020104646682739258, 0.0002187192440032959, 0.00023639202117919922, 0.00025406479835510254, 0.00027173757553100586, 0.0002894103527069092, 0.0003070831298828125, 0.0003247559070587158, 0.00034242868423461914, 0.00036010146141052246, 0.0003777742385864258, 0.0003954470157623291, 0.0004131197929382324, 0.00043079257011413574, 0.00044846534729003906, 0.0004661381244659424, 0.0004838109016418457, 0.000501483678817749, 0.0005191564559936523, 0.0005368292331695557, 0.000554502010345459, 0.0005721747875213623, 0.0005898475646972656]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 14.0, 8.0, 15.0, 20.0, 32.0, 48.0, 88.0, 191.0, 376.0, 824.0, 2223.0, 6924.0, 26448.0, 246707.0, 722413.0, 30098.0, 7733.0, 2445.0, 966.0, 410.0, 215.0, 97.0, 75.0, 49.0, 26.0, 23.0, 15.0, 13.0, 8.0, 5.0, 5.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5927734375, -1.537933349609375, -1.48309326171875, -1.428253173828125, -1.3734130859375, -1.318572998046875, -1.26373291015625, -1.208892822265625, -1.154052734375, -1.099212646484375, -1.04437255859375, -0.989532470703125, -0.9346923828125, -0.879852294921875, -0.82501220703125, -0.770172119140625, -0.71533203125, -0.660491943359375, -0.60565185546875, -0.550811767578125, -0.4959716796875, -0.441131591796875, -0.38629150390625, -0.331451416015625, -0.276611328125, -0.221771240234375, -0.16693115234375, -0.112091064453125, -0.0572509765625, -0.002410888671875, 0.05242919921875, 0.107269287109375, 0.162109375, 0.216949462890625, 0.27178955078125, 0.326629638671875, 0.3814697265625, 0.436309814453125, 0.49114990234375, 0.545989990234375, 0.600830078125, 0.655670166015625, 0.71051025390625, 0.765350341796875, 0.8201904296875, 0.875030517578125, 0.92987060546875, 0.984710693359375, 1.03955078125, 1.094390869140625, 1.14923095703125, 1.204071044921875, 1.2589111328125, 1.313751220703125, 1.36859130859375, 1.423431396484375, 1.478271484375, 1.533111572265625, 1.58795166015625, 1.642791748046875, 1.6976318359375, 1.752471923828125, 1.80731201171875, 1.862152099609375, 1.9169921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 15.0, 10.0, 16.0, 26.0, 21.0, 38.0, 62.0, 110.0, 159.0, 179.0, 114.0, 62.0, 48.0, 25.0, 12.0, 11.0, 18.0, 6.0, 6.0, 6.0, 7.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.130859375, -2.05194091796875, -1.9730224609375, -1.89410400390625, -1.815185546875, -1.73626708984375, -1.6573486328125, -1.57843017578125, -1.49951171875, -1.42059326171875, -1.3416748046875, -1.26275634765625, -1.183837890625, -1.10491943359375, -1.0260009765625, -0.94708251953125, -0.8681640625, -0.78924560546875, -0.7103271484375, -0.63140869140625, -0.552490234375, -0.47357177734375, -0.3946533203125, -0.31573486328125, -0.23681640625, -0.15789794921875, -0.0789794921875, -6.103515625e-05, 0.078857421875, 0.15777587890625, 0.2366943359375, 0.31561279296875, 0.39453125, 0.47344970703125, 0.5523681640625, 0.63128662109375, 0.710205078125, 0.78912353515625, 0.8680419921875, 0.94696044921875, 1.02587890625, 1.10479736328125, 1.1837158203125, 1.26263427734375, 1.341552734375, 1.42047119140625, 1.4993896484375, 1.57830810546875, 1.6572265625, 1.73614501953125, 1.8150634765625, 1.89398193359375, 1.972900390625, 2.05181884765625, 2.1307373046875, 2.20965576171875, 2.28857421875, 2.36749267578125, 2.4464111328125, 2.52532958984375, 2.604248046875, 2.68316650390625, 2.7620849609375, 2.84100341796875, 2.919921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 18.0, 70.0, 564.0, 241.0, 57.0, 22.0, 13.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.38475036621094, -92.17329406738281, -85.96183776855469, -79.75038146972656, -73.53892517089844, -67.32746887207031, -61.11601257324219, -54.90455627441406, -48.69309997558594, -42.48164367675781, -36.27018737792969, -30.058731079101562, -23.847274780273438, -17.635818481445312, -11.424362182617188, -5.2129058837890625, 0.9985504150390625, 7.2100067138671875, 13.421463012695312, 19.632919311523438, 25.844375610351562, 32.05583190917969, 38.26728820800781, 44.47874450683594, 50.69020080566406, 56.90165710449219, 63.11311340332031, 69.32456970214844, 75.53602600097656, 81.74748229980469, 87.95893859863281, 94.17039489746094, 100.3818359375, 106.59329223632812, 112.80474853515625, 119.01620483398438, 125.2276611328125, 131.43911743164062, 137.65057373046875, 143.86203002929688, 150.073486328125, 156.28494262695312, 162.49639892578125, 168.70785522460938, 174.9193115234375, 181.13076782226562, 187.34222412109375, 193.55368041992188, 199.76513671875, 205.97659301757812, 212.18804931640625, 218.39950561523438, 224.6109619140625, 230.82241821289062, 237.03387451171875, 243.24533081054688, 249.456787109375, 255.66824340820312, 261.87969970703125, 268.0911560058594, 274.3026123046875, 280.5140686035156, 286.72552490234375, 292.9369812011719, 299.1484375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 11.0, 11.0, 12.0, 16.0, 14.0, 27.0, 32.0, 33.0, 26.0, 132.0, 228.0, 178.0, 61.0, 26.0, 29.0, 20.0, 23.0, 23.0, 18.0, 20.0, 10.0, 8.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-103.32322692871094, -100.2532730102539, -97.1833267211914, -94.11337280273438, -91.04342651367188, -87.97347259521484, -84.90351867675781, -81.83357238769531, -78.76362609863281, -75.69367218017578, -72.62372589111328, -69.55377197265625, -66.48382568359375, -63.41387176513672, -60.34392166137695, -57.27397155761719, -54.204017639160156, -51.13406753540039, -48.064117431640625, -44.994163513183594, -41.924217224121094, -38.85426330566406, -35.7843132019043, -32.71436309814453, -29.644412994384766, -26.574462890625, -23.504512786865234, -20.434560775756836, -17.36461067199707, -14.294660568237305, -11.224708557128906, -8.15475845336914, -5.084800720214844, -2.01485013961792, 1.055100440979004, 4.125051498413086, 7.195001602172852, 10.264951705932617, 13.334903717041016, 16.40485382080078, 19.474803924560547, 22.544754028320312, 25.614704132080078, 28.684656143188477, 31.754606246948242, 34.824554443359375, 37.894508361816406, 40.96445846557617, 44.03440856933594, 47.1043586730957, 50.17430877685547, 53.2442626953125, 56.314208984375, 59.38416290283203, 62.4541130065918, 65.52406311035156, 68.59400939941406, 71.6639633178711, 74.7339096069336, 77.80386352539062, 80.87380981445312, 83.94376373291016, 87.01371765136719, 90.08366394042969, 93.15361785888672]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 12.0, 18.0, 29.0, 36.0, 43.0, 52.0, 68.0, 364.0, 91.0, 60.0, 53.0, 43.0, 45.0, 20.0, 17.0, 12.0, 7.0, 10.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.670654296875, -5.41943359375, -5.168212890625, -4.9169921875, -4.665771484375, -4.41455078125, -4.163330078125, -3.912109375, -3.660888671875, -3.40966796875, -3.158447265625, -2.9072265625, -2.656005859375, -2.40478515625, -2.153564453125, -1.90234375, -1.651123046875, -1.39990234375, -1.148681640625, -0.8974609375, -0.646240234375, -0.39501953125, -0.143798828125, 0.107421875, 0.358642578125, 0.60986328125, 0.861083984375, 1.1123046875, 1.363525390625, 1.61474609375, 1.865966796875, 2.1171875, 2.368408203125, 2.61962890625, 2.870849609375, 3.1220703125, 3.373291015625, 3.62451171875, 3.875732421875, 4.126953125, 4.378173828125, 4.62939453125, 4.880615234375, 5.1318359375, 5.383056640625, 5.63427734375, 5.885498046875, 6.13671875, 6.387939453125, 6.63916015625, 6.890380859375, 7.1416015625, 7.392822265625, 7.64404296875, 7.895263671875, 8.146484375, 8.397705078125, 8.64892578125, 8.900146484375, 9.1513671875, 9.402587890625, 9.65380859375, 9.905029296875, 10.15625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 8.0, 19.0, 14.0, 19.0, 30.0, 45.0, 83.0, 171.0, 507.0, 1522.0, 8938.0, 8353223.0, 20485.0, 2333.0, 653.0, 239.0, 111.0, 49.0, 35.0, 24.0, 23.0, 12.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-69.6004409790039, -67.46888732910156, -65.33732604980469, -63.205772399902344, -61.074214935302734, -58.942657470703125, -56.81110382080078, -54.67954635620117, -52.54798889160156, -50.41643142700195, -48.284873962402344, -46.1533203125, -44.02176284790039, -41.89020538330078, -39.75865173339844, -37.62709426879883, -35.49553680419922, -33.36397933959961, -31.232423782348633, -29.100868225097656, -26.969310760498047, -24.837753295898438, -22.70619773864746, -20.574642181396484, -18.443084716796875, -16.311527252197266, -14.179971694946289, -12.048415184020996, -9.916858673095703, -7.78530216217041, -5.653745651245117, -3.522189140319824, -1.3906326293945312, 0.7409238815307617, 2.8724803924560547, 5.004036903381348, 7.135593414306641, 9.267149925231934, 11.398706436157227, 13.53026294708252, 15.661819458007812, 17.793376922607422, 19.9249324798584, 22.056488037109375, 24.188045501708984, 26.319602966308594, 28.45115852355957, 30.582714080810547, 32.714271545410156, 34.845829010009766, 36.977386474609375, 39.10894012451172, 41.24049758911133, 43.37205505371094, 45.50360870361328, 47.63516616821289, 49.7667236328125, 51.89828109741211, 54.02983856201172, 56.16139221191406, 58.29294967651367, 60.42450714111328, 62.556060791015625, 64.6876220703125, 66.81917572021484]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 7.0, 2.0, 3.0, 9.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.514328002929688, -26.93609619140625, -25.35786247253418, -23.77962875366211, -22.201396942138672, -20.623165130615234, -19.044931411743164, -17.466697692871094, -15.888465881347656, -14.310233116149902, -12.732000350952148, -11.153767585754395, -9.57553482055664, -7.997302055358887, -6.419069290161133, -4.840836524963379, -3.262603759765625, -1.684370994567871, -0.10613822937011719, 1.4720945358276367, 3.0503273010253906, 4.6285600662231445, 6.206792831420898, 7.785025596618652, 9.363258361816406, 10.94149112701416, 12.519723892211914, 14.097956657409668, 15.676189422607422, 17.25442123413086, 18.83265495300293, 20.410888671875, 21.989120483398438, 23.567352294921875, 25.145586013793945, 26.723819732666016, 28.302051544189453, 29.88028335571289, 31.45851707458496, 33.03675079345703, 34.61498260498047, 36.193214416503906, 37.771446228027344, 39.34968185424805, 40.927913665771484, 42.50614547729492, 44.084381103515625, 45.66261291503906, 47.2408447265625, 48.81907653808594, 50.397308349609375, 51.97554397583008, 53.553775787353516, 55.13200759887695, 56.710243225097656, 58.288475036621094, 59.86670684814453, 61.44493865966797, 63.023170471191406, 64.60140228271484, 66.17964172363281, 67.75787353515625, 69.33610534667969, 70.91433715820312, 72.49256896972656]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 14.0, 23.0, 38.0, 51.0, 80.0, 161.0, 294.0, 660.0, 1571.0, 4504.0, 15379.0, 68568.0, 259713.0, 133941.0, 27641.0, 7184.0, 2402.0, 1008.0, 460.0, 245.0, 125.0, 80.0, 42.0, 21.0, 13.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.1875, -47.5859375, -45.984375, -44.3828125, -42.78125, -41.1796875, -39.578125, -37.9765625, -36.375, -34.7734375, -33.171875, -31.5703125, -29.96875, -28.3671875, -26.765625, -25.1640625, -23.5625, -21.9609375, -20.359375, -18.7578125, -17.15625, -15.5546875, -13.953125, -12.3515625, -10.75, -9.1484375, -7.546875, -5.9453125, -4.34375, -2.7421875, -1.140625, 0.4609375, 2.0625, 3.6640625, 5.265625, 6.8671875, 8.46875, 10.0703125, 11.671875, 13.2734375, 14.875, 16.4765625, 18.078125, 19.6796875, 21.28125, 22.8828125, 24.484375, 26.0859375, 27.6875, 29.2890625, 30.890625, 32.4921875, 34.09375, 35.6953125, 37.296875, 38.8984375, 40.5, 42.1015625, 43.703125, 45.3046875, 46.90625, 48.5078125, 50.109375, 51.7109375, 53.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 8.0, 18.0, 25.0, 27.0, 30.0, 33.0, 44.0, 52.0, 72.0, 75.0, 73.0, 80.0, 74.0, 65.0, 55.0, 55.0, 40.0, 33.0, 26.0, 15.0, 10.0, 12.0, 7.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.15234375, -5.96868896484375, -5.7850341796875, -5.60137939453125, -5.417724609375, -5.23406982421875, -5.0504150390625, -4.86676025390625, -4.68310546875, -4.49945068359375, -4.3157958984375, -4.13214111328125, -3.948486328125, -3.76483154296875, -3.5811767578125, -3.39752197265625, -3.2138671875, -3.03021240234375, -2.8465576171875, -2.66290283203125, -2.479248046875, -2.29559326171875, -2.1119384765625, -1.92828369140625, -1.74462890625, -1.56097412109375, -1.3773193359375, -1.19366455078125, -1.010009765625, -0.82635498046875, -0.6427001953125, -0.45904541015625, -0.275390625, -0.09173583984375, 0.0919189453125, 0.27557373046875, 0.459228515625, 0.64288330078125, 0.8265380859375, 1.01019287109375, 1.19384765625, 1.37750244140625, 1.5611572265625, 1.74481201171875, 1.928466796875, 2.11212158203125, 2.2957763671875, 2.47943115234375, 2.6630859375, 2.84674072265625, 3.0303955078125, 3.21405029296875, 3.397705078125, 3.58135986328125, 3.7650146484375, 3.94866943359375, 4.13232421875, 4.31597900390625, 4.4996337890625, 4.68328857421875, 4.866943359375, 5.05059814453125, 5.2342529296875, 5.41790771484375, 5.6015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 15.0, 14.0, 32.0, 58.0, 82.0, 71.0, 63.0, 39.0, 18.0, 19.0, 12.0, 7.0, 4.0, 6.0, 8.0, 3.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.826414108276367, -24.456937789916992, -23.087461471557617, -21.71798324584961, -20.348506927490234, -18.97903060913086, -17.609554290771484, -16.24007797241211, -14.870601654052734, -13.50112533569336, -12.131649017333984, -10.762171745300293, -9.392695426940918, -8.023219108581543, -6.653741836547852, -5.284265518188477, -3.9147891998291016, -2.5453126430511475, -1.1758360862731934, 0.19364070892333984, 1.5631170272827148, 2.93259334564209, 4.302070617675781, 5.671546936035156, 7.041023254394531, 8.410499572753906, 9.779975891113281, 11.149453163146973, 12.518929481506348, 13.888405799865723, 15.257883071899414, 16.62735939025879, 17.99683380126953, 19.366310119628906, 20.73578643798828, 22.105262756347656, 23.47473907470703, 24.844215393066406, 26.213693618774414, 27.58316993713379, 28.952646255493164, 30.32212257385254, 31.691598892211914, 33.06107711791992, 34.4305534362793, 35.80002975463867, 37.16950607299805, 38.53898239135742, 39.9084587097168, 41.27793502807617, 42.64741134643555, 44.01688766479492, 45.3863639831543, 46.75584030151367, 48.12532043457031, 49.49479675292969, 50.86427307128906, 52.23374938964844, 53.60322570800781, 54.97270202636719, 56.34217834472656, 57.71165466308594, 59.08113098144531, 60.45060729980469, 61.82008361816406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 0.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 10.0, 14.0, 29.0, 42.0, 59.0, 84.0, 63.0, 56.0, 39.0, 19.0, 17.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.326555252075195, -26.490676879882812, -25.65479850769043, -24.818920135498047, -23.983043670654297, -23.14716339111328, -22.31128692626953, -21.47540855407715, -20.639530181884766, -19.803651809692383, -18.9677734375, -18.131895065307617, -17.296016693115234, -16.460140228271484, -15.624261856079102, -14.788383483886719, -13.952505111694336, -13.116626739501953, -12.28074836730957, -11.444870948791504, -10.608992576599121, -9.773114204406738, -8.937236785888672, -8.101358413696289, -7.265480041503906, -6.429601669311523, -5.593723773956299, -4.757845878601074, -3.9219675064086914, -3.0860891342163086, -2.250211238861084, -1.4143333435058594, -0.5784568786621094, 0.25742125511169434, 1.093299388885498, 1.9291775226593018, 2.7650556564331055, 3.6009340286254883, 4.436811923980713, 5.2726898193359375, 6.10856819152832, 6.944446563720703, 7.780324459075928, 8.616202354431152, 9.452080726623535, 10.287959098815918, 11.123836517333984, 11.959714889526367, 12.79559326171875, 13.631471633911133, 14.467350006103516, 15.303227424621582, 16.13910675048828, 16.97498321533203, 17.810861587524414, 18.646739959716797, 19.48261833190918, 20.318496704101562, 21.154375076293945, 21.990253448486328, 22.826129913330078, 23.662010192871094, 24.497886657714844, 25.333765029907227, 26.16964340209961]}, "eval/loss": 5.3852667808532715, "eval/wer": 1.35650535501785, "eval/runtime": 686.8292, "eval/samples_per_second": 3.847, "eval/steps_per_second": 0.482} \ No newline at end of file